Spaces:

Multichem-PD
/

DFS_Portfolio_Manager

Running

App Files Files Community

James McCool committed on Dec 1, 2025

Commit

4c05307

1 Parent(s): e31f557

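Enhance the regular-slate salary retrieval functions (NFL, NBA, MLB, NHL) to accept a slate type parameter for improved data handling. Implement logic for 'Main', 'Secondary', and 'Auxiliary' slates to manage duplicate player records: records are sorted by ID and then deduplicated by name, keeping the first record for 'Main', the middle record for 'Secondary', and the last record for 'Auxiliary'.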

Browse files

Files changed (1) hide show

app.py +109 -9

app.py CHANGED Viewed

@@ -128,12 +128,37 @@ st.markdown("""
 </style>""", unsafe_allow_html=True)
-def grab_nfl_reg_salaries():
     collection = salaries_db["NFL_reg_player_info"]
     today_str = datetime.now().strftime("%Y%m%d")
     records = pd.DataFrame(list(collection.find({'Contest Date': {'$gte': today_str}})))
     records = records[['Display Name', 'draftableId', 'Position', 'Salary']]
     records = records.rename(columns={'Display Name': 'Name', 'draftableId': 'ID', 'Position': 'Roster Position'})
     return records
 def grab_nfl_showdown_salaries():
@@ -144,12 +169,37 @@ def grab_nfl_showdown_salaries():
     records = records.rename(columns={'Display Name': 'Name', 'draftableId': 'ID', 'Position': 'Roster Position'})
     return records
-def grab_nba_reg_salaries():
     collection = salaries_db["NBA_reg_player_info"]
     today_str = datetime.now().strftime("%Y%m%d")
     records = pd.DataFrame(list(collection.find({'Contest Date': {'$gte': today_str}})))
     records = records[['Display Name', 'draftableId', 'Position', 'Salary']]
     records = records.rename(columns={'Display Name': 'Name', 'draftableId': 'ID', 'Position': 'Roster Position'})
     return records
 def grab_nba_showdown_salaries():
@@ -160,12 +210,37 @@ def grab_nba_showdown_salaries():
     records = records.rename(columns={'Display Name': 'Name', 'draftableId': 'ID', 'Position': 'Roster Position'})
     return records
-def grab_mlb_reg_salaries():
     collection = salaries_db["MLB_reg_player_info"]
     today_str = datetime.now().strftime("%Y%m%d")
     records = pd.DataFrame(list(collection.find({'Contest Date': {'$gte': today_str}})))
     records = records[['Display Name', 'draftableId', 'Position', 'Salary']]
     records = records.rename(columns={'Display Name': 'Name', 'draftableId': 'ID', 'Position': 'Roster Position'})
     return records
 def grab_mlb_showdown_salaries():
@@ -176,12 +251,37 @@ def grab_mlb_showdown_salaries():
     records = records.rename(columns={'Display Name': 'Name', 'draftableId': 'ID', 'Position': 'Roster Position'})
     return records
-def grab_nhl_reg_salaries():
     collection = salaries_db["NHL_reg_player_info"]
     today_str = datetime.now().strftime("%Y%m%d")
     records = pd.DataFrame(list(collection.find({'Contest Date': {'$gte': today_str}})))
     records = records[['Display Name', 'draftableId', 'Position', 'Salary']]
     records = records.rename(columns={'Display Name': 'Name', 'draftableId': 'ID', 'Position': 'Roster Position'})
     return records
 def grab_nhl_showdown_salaries():
@@ -282,11 +382,6 @@ except:
     nba_slate_names_fd = []
     nba_slate_name_lookup_fd = {}
-nfl_reg_salaries = grab_nfl_reg_salaries()
-nfl_showdown_salaries = grab_nfl_showdown_salaries()
-nba_reg_salaries = grab_nba_reg_salaries()
-nba_showdown_salaries = grab_nba_showdown_salaries()
 # Memory optimization helper functions
 def chunk_name_matching(portfolio_names, csv_names, chunk_size=1000):
     """Process name matching in chunks to reduce memory usage"""
@@ -649,6 +744,11 @@ with st.container():
                 salary_max = 60000
         elif type_var == 'Showdown':
             salary_max = 60000
     with st.expander("Info and Filters"):
         prio_col, optimals_site_col, optimals_salary_col, optimals_stacks_col = st.columns(4)

 </style>""", unsafe_allow_html=True)
def grab_nfl_reg_salaries(slate_var: str) -> pd.DataFrame:
    """Load upcoming NFL regular-slate salaries, keeping one row per player.

    Queries ``salaries_db["NFL_reg_player_info"]`` for documents whose
    ``'Contest Date'`` is greater than or equal to today's date formatted as
    ``YYYYMMDD``, keeps the name / ID / position / salary fields and renames
    them to ``Name``, ``ID``, ``Roster Position`` and ``Salary``.

    A name may occur more than once in the query result (presumably once per
    slate the player is on -- confirm against the collection). ``slate_var``
    decides which occurrence survives after ordering the rows by ascending
    ``ID``:

    * ``'Main'``      -- the first (lowest ``ID``) row of each name.
    * ``'Secondary'`` -- the row at position ``count // 2`` of each name: the
      only row of one, the second of two, the middle of three, and so on.
      The result is ordered by ``Name`` and gets a fresh 0..n-1 index.
    * ``'Auxiliary'`` -- the last (highest ``ID``) row of each name.

    Any other value returns the renamed rows as queried: unsorted and with
    duplicates kept.

    Args:
        slate_var: Slate selector, normally ``'Main'``, ``'Secondary'`` or
            ``'Auxiliary'``.

    Returns:
        DataFrame with columns ``Name``, ``ID``, ``Roster Position`` and
        ``Salary``. It is empty (but still has these columns) when the query
        matches no documents.
    """
    collection = salaries_db["NFL_reg_player_info"]
    today_str = datetime.now().strftime("%Y%m%d")
    documents = list(collection.find({'Contest Date': {'$gte': today_str}}))
    if not documents:
        # An empty result would build a column-less frame and the column
        # selection below would raise KeyError; return a well-formed empty table.
        return pd.DataFrame(columns=['Name', 'ID', 'Roster Position', 'Salary'])

    records = pd.DataFrame(documents)[['Display Name', 'draftableId', 'Position', 'Salary']]
    records = records.rename(columns={'Display Name': 'Name', 'draftableId': 'ID', 'Position': 'Roster Position'})

    if slate_var not in ('Main', 'Secondary', 'Auxiliary'):
        return records

    records = records.sort_values(by='ID', ascending=True)
    if slate_var == 'Main':
        return records.drop_duplicates(subset=['Name'], keep='first')
    if slate_var == 'Auxiliary':
        return records.drop_duplicates(subset=['Name'], keep='last')

    # 'Secondary': pick the middle occurrence of every name without a Python loop.
    # groupby leaves out rows whose key is missing, so drop them explicitly to
    # keep the position and size series aligned with the frame.
    records = records.dropna(subset=['Name'])
    per_name = records.groupby('Name')
    occurrence = per_name.cumcount()                      # 0-based position within the name
    middle = per_name['ID'].transform('size') // 2        # 1 row -> 0, 2 rows -> 1, 3 rows -> 1, ...
    records = records[occurrence == middle]
    return records.sort_values(by='Name').reset_index(drop=True)
 def grab_nfl_showdown_salaries():
     records = records.rename(columns={'Display Name': 'Name', 'draftableId': 'ID', 'Position': 'Roster Position'})
     return records
def grab_nba_reg_salaries(slate_var: str) -> pd.DataFrame:
    """Load upcoming NBA regular-slate salaries, keeping one row per player.

    Queries ``salaries_db["NBA_reg_player_info"]`` for documents whose
    ``'Contest Date'`` is greater than or equal to today's date formatted as
    ``YYYYMMDD``, keeps the name / ID / position / salary fields and renames
    them to ``Name``, ``ID``, ``Roster Position`` and ``Salary``.

    A name may occur more than once in the query result (presumably once per
    slate the player is on -- confirm against the collection). ``slate_var``
    decides which occurrence survives after ordering the rows by ascending
    ``ID``:

    * ``'Main'``      -- the first (lowest ``ID``) row of each name.
    * ``'Secondary'`` -- the row at position ``count // 2`` of each name: the
      only row of one, the second of two, the middle of three, and so on.
      The result is ordered by ``Name`` and gets a fresh 0..n-1 index.
    * ``'Auxiliary'`` -- the last (highest ``ID``) row of each name.

    Any other value returns the renamed rows as queried: unsorted and with
    duplicates kept.

    Args:
        slate_var: Slate selector, normally ``'Main'``, ``'Secondary'`` or
            ``'Auxiliary'``.

    Returns:
        DataFrame with columns ``Name``, ``ID``, ``Roster Position`` and
        ``Salary``. It is empty (but still has these columns) when the query
        matches no documents.
    """
    collection = salaries_db["NBA_reg_player_info"]
    today_str = datetime.now().strftime("%Y%m%d")
    documents = list(collection.find({'Contest Date': {'$gte': today_str}}))
    if not documents:
        # An empty result would build a column-less frame and the column
        # selection below would raise KeyError; return a well-formed empty table.
        return pd.DataFrame(columns=['Name', 'ID', 'Roster Position', 'Salary'])

    records = pd.DataFrame(documents)[['Display Name', 'draftableId', 'Position', 'Salary']]
    records = records.rename(columns={'Display Name': 'Name', 'draftableId': 'ID', 'Position': 'Roster Position'})

    if slate_var not in ('Main', 'Secondary', 'Auxiliary'):
        return records

    records = records.sort_values(by='ID', ascending=True)
    if slate_var == 'Main':
        return records.drop_duplicates(subset=['Name'], keep='first')
    if slate_var == 'Auxiliary':
        return records.drop_duplicates(subset=['Name'], keep='last')

    # 'Secondary': pick the middle occurrence of every name without a Python loop.
    # groupby leaves out rows whose key is missing, so drop them explicitly to
    # keep the position and size series aligned with the frame.
    records = records.dropna(subset=['Name'])
    per_name = records.groupby('Name')
    occurrence = per_name.cumcount()                      # 0-based position within the name
    middle = per_name['ID'].transform('size') // 2        # 1 row -> 0, 2 rows -> 1, 3 rows -> 1, ...
    records = records[occurrence == middle]
    return records.sort_values(by='Name').reset_index(drop=True)
 def grab_nba_showdown_salaries():
     records = records.rename(columns={'Display Name': 'Name', 'draftableId': 'ID', 'Position': 'Roster Position'})
     return records
def grab_mlb_reg_salaries(slate_var: str) -> pd.DataFrame:
    """Load upcoming MLB regular-slate salaries, keeping one row per player.

    Queries ``salaries_db["MLB_reg_player_info"]`` for documents whose
    ``'Contest Date'`` is greater than or equal to today's date formatted as
    ``YYYYMMDD``, keeps the name / ID / position / salary fields and renames
    them to ``Name``, ``ID``, ``Roster Position`` and ``Salary``.

    A name may occur more than once in the query result (presumably once per
    slate the player is on -- confirm against the collection). ``slate_var``
    decides which occurrence survives after ordering the rows by ascending
    ``ID``:

    * ``'Main'``      -- the first (lowest ``ID``) row of each name.
    * ``'Secondary'`` -- the row at position ``count // 2`` of each name: the
      only row of one, the second of two, the middle of three, and so on.
      The result is ordered by ``Name`` and gets a fresh 0..n-1 index.
    * ``'Auxiliary'`` -- the last (highest ``ID``) row of each name.

    Any other value returns the renamed rows as queried: unsorted and with
    duplicates kept.

    Args:
        slate_var: Slate selector, normally ``'Main'``, ``'Secondary'`` or
            ``'Auxiliary'``.

    Returns:
        DataFrame with columns ``Name``, ``ID``, ``Roster Position`` and
        ``Salary``. It is empty (but still has these columns) when the query
        matches no documents.
    """
    collection = salaries_db["MLB_reg_player_info"]
    today_str = datetime.now().strftime("%Y%m%d")
    documents = list(collection.find({'Contest Date': {'$gte': today_str}}))
    if not documents:
        # An empty result would build a column-less frame and the column
        # selection below would raise KeyError; return a well-formed empty table.
        return pd.DataFrame(columns=['Name', 'ID', 'Roster Position', 'Salary'])

    records = pd.DataFrame(documents)[['Display Name', 'draftableId', 'Position', 'Salary']]
    records = records.rename(columns={'Display Name': 'Name', 'draftableId': 'ID', 'Position': 'Roster Position'})

    if slate_var not in ('Main', 'Secondary', 'Auxiliary'):
        return records

    records = records.sort_values(by='ID', ascending=True)
    if slate_var == 'Main':
        return records.drop_duplicates(subset=['Name'], keep='first')
    if slate_var == 'Auxiliary':
        return records.drop_duplicates(subset=['Name'], keep='last')

    # 'Secondary': pick the middle occurrence of every name without a Python loop.
    # groupby leaves out rows whose key is missing, so drop them explicitly to
    # keep the position and size series aligned with the frame.
    records = records.dropna(subset=['Name'])
    per_name = records.groupby('Name')
    occurrence = per_name.cumcount()                      # 0-based position within the name
    middle = per_name['ID'].transform('size') // 2        # 1 row -> 0, 2 rows -> 1, 3 rows -> 1, ...
    records = records[occurrence == middle]
    return records.sort_values(by='Name').reset_index(drop=True)
 def grab_mlb_showdown_salaries():
     records = records.rename(columns={'Display Name': 'Name', 'draftableId': 'ID', 'Position': 'Roster Position'})
     return records
def grab_nhl_reg_salaries(slate_var: str) -> pd.DataFrame:
    """Load upcoming NHL regular-slate salaries, keeping one row per player.

    Queries ``salaries_db["NHL_reg_player_info"]`` for documents whose
    ``'Contest Date'`` is greater than or equal to today's date formatted as
    ``YYYYMMDD``, keeps the name / ID / position / salary fields and renames
    them to ``Name``, ``ID``, ``Roster Position`` and ``Salary``.

    A name may occur more than once in the query result (presumably once per
    slate the player is on -- confirm against the collection). ``slate_var``
    decides which occurrence survives after ordering the rows by ascending
    ``ID``:

    * ``'Main'``      -- the first (lowest ``ID``) row of each name.
    * ``'Secondary'`` -- the row at position ``count // 2`` of each name: the
      only row of one, the second of two, the middle of three, and so on.
      The result is ordered by ``Name`` and gets a fresh 0..n-1 index.
    * ``'Auxiliary'`` -- the last (highest ``ID``) row of each name.

    Any other value returns the renamed rows as queried: unsorted and with
    duplicates kept.

    Args:
        slate_var: Slate selector, normally ``'Main'``, ``'Secondary'`` or
            ``'Auxiliary'``.

    Returns:
        DataFrame with columns ``Name``, ``ID``, ``Roster Position`` and
        ``Salary``. It is empty (but still has these columns) when the query
        matches no documents.
    """
    collection = salaries_db["NHL_reg_player_info"]
    today_str = datetime.now().strftime("%Y%m%d")
    documents = list(collection.find({'Contest Date': {'$gte': today_str}}))
    if not documents:
        # An empty result would build a column-less frame and the column
        # selection below would raise KeyError; return a well-formed empty table.
        return pd.DataFrame(columns=['Name', 'ID', 'Roster Position', 'Salary'])

    records = pd.DataFrame(documents)[['Display Name', 'draftableId', 'Position', 'Salary']]
    records = records.rename(columns={'Display Name': 'Name', 'draftableId': 'ID', 'Position': 'Roster Position'})

    if slate_var not in ('Main', 'Secondary', 'Auxiliary'):
        return records

    records = records.sort_values(by='ID', ascending=True)
    if slate_var == 'Main':
        return records.drop_duplicates(subset=['Name'], keep='first')
    if slate_var == 'Auxiliary':
        return records.drop_duplicates(subset=['Name'], keep='last')

    # 'Secondary': pick the middle occurrence of every name without a Python loop.
    # groupby leaves out rows whose key is missing, so drop them explicitly to
    # keep the position and size series aligned with the frame.
    records = records.dropna(subset=['Name'])
    per_name = records.groupby('Name')
    occurrence = per_name.cumcount()                      # 0-based position within the name
    middle = per_name['ID'].transform('size') // 2        # 1 row -> 0, 2 rows -> 1, 3 rows -> 1, ...
    records = records[occurrence == middle]
    return records.sort_values(by='Name').reset_index(drop=True)
 def grab_nhl_showdown_salaries():
     nba_slate_names_fd = []
     nba_slate_name_lookup_fd = {}
 # Memory optimization helper functions
 def chunk_name_matching(portfolio_names, csv_names, chunk_size=1000):
     """Process name matching in chunks to reduce memory usage"""
                 salary_max = 60000
         elif type_var == 'Showdown':
             salary_max = 60000
+    nfl_reg_salaries = grab_nfl_reg_salaries(slate_var3)
+    nfl_showdown_salaries = grab_nfl_showdown_salaries(slate_var3)
+    nba_reg_salaries = grab_nba_reg_salaries(slate_var3)
+    nba_showdown_salaries = grab_nba_showdown_salaries(slate_var3)
     with st.expander("Info and Filters"):
         prio_col, optimals_site_col, optimals_salary_col, optimals_stacks_col = st.columns(4)