James McCool
committed on
Commit
·
55a782f
1
Parent(s):
c2b7029
Add unique and under-5 duplicate counts to working_df in app.py
Browse files
- Implemented calculations for unique lineups and lineups with 5 or fewer duplicates for each BaseName, enhancing data analysis capabilities within the application.
app.py
CHANGED
|
@@ -221,6 +221,15 @@ with tab2:
|
|
| 221 |
axis=1
|
| 222 |
)
|
| 223 |
working_df['dupes'] = working_df.groupby('sorted').transform('size')
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 224 |
working_df = working_df.reset_index()
|
| 225 |
working_df['percentile_finish'] = working_df['index'].rank(pct=True)
|
| 226 |
working_df['finish'] = working_df['index']
|
|
|
|
| 221 |
axis=1
|
| 222 |
)
|
| 223 |
working_df['dupes'] = working_df.groupby('sorted').transform('size')
|
| 224 |
+
# For uniques - count how many unique lineups (dupes == 1) each BaseName has
|
| 225 |
+
working_df['uniques'] = working_df.groupby('BaseName').apply(
|
| 226 |
+
lambda x: (x['dupes'] == 1).sum()
|
| 227 |
+
).reindex(working_df['BaseName']).values
|
| 228 |
+
|
| 229 |
+
# For under_5 - count how many lineups with 5 or fewer duplicates each BaseName has
|
| 230 |
+
working_df['under_5'] = working_df.groupby('BaseName').apply(
|
| 231 |
+
lambda x: (x['dupes'] <= 5).sum()
|
| 232 |
+
).reindex(working_df['BaseName']).values
|
| 233 |
working_df = working_df.reset_index()
|
| 234 |
working_df['percentile_finish'] = working_df['index'].rank(pct=True)
|
| 235 |
working_df['finish'] = working_df['index']
|