ai-deadlines

Sleeping

App Files Community

nielsr HF Staff committed on Dec 26, 2025

Commit

004e138

1 Parent(s): 283c3bd

Ruff

Browse files

Files changed (6) hide show

.github/scripts/update_conferences.py +135 -117
.github/scripts/update_conferences_new.py +148 -130
agents/agent.py +37 -22
agents/modal_agent.py +27 -26
pyproject.toml +1 -0
uv.lock +28 -0

.github/scripts/update_conferences.py CHANGED Viewed

@@ -6,21 +6,21 @@ from typing import Dict, List, Any
 def fetch_conference_files() -> List[Dict[str, Any]]:
     """Fetch all conference YAML files from ccfddl repository."""
     # First get the directory listing from GitHub API
     api_url = "https://api.github.com/repos/ccfddl/ccf-deadlines/contents/conference/AI"
     response = requests.get(api_url)
     files = response.json()
     conferences = []
     for file in files:
-        if file['name'].endswith('.yml'):
-            yaml_content = requests.get(file['download_url']).text
             conf_data = yaml.safe_load(yaml_content)
             # The data is a list with a single item
             if isinstance(conf_data, list) and len(conf_data) > 0:
                 conferences.append(conf_data[0])
     return conferences
@@ -28,37 +28,37 @@ def parse_date_range(date_str: str, year: str) -> tuple[str, str]:
     """Parse various date formats and return start and end dates."""
     # Remove the year if it appears at the end of the string
     date_str = date_str.replace(f", {year}", "")
     # Handle various date formats
     try:
         # Split into start and end dates
-        if ' - ' in date_str:
-            start, end = date_str.split(' - ')
-        elif '-' in date_str:
-            start, end = date_str.split('-')
         else:
             # For single date format like "May 19, 2025"
             start = end = date_str
         # Clean up month abbreviations
         month_map = {
-            'Sept': 'September',  # Handle Sept before Sep
-            'Jan': 'January',
-            'Feb': 'February',
-            'Mar': 'March',
-            'Apr': 'April',
-            'Jun': 'June',
-            'Jul': 'July',
-            'Aug': 'August',
-            'Sep': 'September',
-            'Oct': 'October',
-            'Nov': 'November',
-            'Dec': 'December'
         }
         # Create a set of all month names (full and abbreviated)
         all_months = set(month_map.keys()) | set(month_map.values())
         # Handle cases like "April 29-May 4"
         has_month = any(month in end for month in all_months)
         if not has_month:
@@ -66,178 +66,196 @@ def parse_date_range(date_str: str, year: str) -> tuple[str, str]:
             start_parts = start.split()
             if len(start_parts) >= 1:
                 end = f"{start_parts[0]} {end.strip()}"
         # Replace month abbreviations
         for abbr, full in month_map.items():
             start = start.replace(abbr, full)
             end = end.replace(abbr, full)
         # Clean up any extra spaces
-        start = ' '.join(start.split())
-        end = ' '.join(end.split())
         # Parse start date
         start_date = datetime.strptime(f"{start}, {year}", "%B %d, %Y")
         # Parse end date
         end_date = datetime.strptime(f"{end}, {year}", "%B %d, %Y")
-        return start_date.strftime('%Y-%m-%d'), end_date.strftime('%Y-%m-%d')
     except Exception as e:
         raise ValueError(f"Could not parse date: {date_str} ({e})")
-def transform_conference_data(conferences: List[Dict[str, Any]]) -> List[Dict[str, Any]]:
     """Transform ccfddl format to our format."""
     transformed = []
     current_year = datetime.now().year
     for conf in conferences:
         # Get the most recent or upcoming conference instance
         recent_conf = None
-        if 'confs' in conf:
-            for instance in conf['confs']:
-                if instance['year'] >= current_year:
                     recent_conf = instance
                     break
         if not recent_conf:
             continue
         # Transform to our format
         transformed_conf = {
-            'title': conf.get('title', ''),
-            'year': recent_conf['year'],
-            'id': recent_conf['id'],
-            'full_name': conf.get('description', ''),
-            'link': recent_conf.get('link', ''),
-            'deadline': recent_conf.get('timeline', [{}])[0].get('deadline', ''),
-            'timezone': recent_conf.get('timezone', ''),
-            'date': recent_conf.get('date', ''),
-            'tags': [],  # We'll need to maintain a mapping for tags
         }
         # Handle city and country fields instead of place
-        place = recent_conf.get('place', '')
         if place:
             # Try to parse the place into city and country if it contains a comma
-            if ',' in place:
-                city, country = place.split(',', 1)
-                transformed_conf['city'] = city.strip()
-                transformed_conf['country'] = country.strip()
             else:
                 # If we can't parse, just set the country
-                transformed_conf['country'] = place.strip()
         # Add optional fields
-        timeline = recent_conf.get('timeline', [{}])[0]
-        if 'abstract_deadline' in timeline:
-            transformed_conf['abstract_deadline'] = timeline['abstract_deadline']
         # Parse date range for start/end
         try:
-            if transformed_conf['date']:
                 start_date, end_date = parse_date_range(
-                    transformed_conf['date'],
-                    str(transformed_conf['year'])
                 )
-                transformed_conf['start'] = start_date
-                transformed_conf['end'] = end_date
         except Exception as e:
             print(f"Warning: Could not parse date for {transformed_conf['title']}: {e}")
         # Add rankings as separate field
-        if 'rank' in conf:
             rankings = []
-            for rank_type, rank_value in conf['rank'].items():
                 rankings.append(f"{rank_type.upper()}: {rank_value}")
             if rankings:
-                transformed_conf['rankings'] = ', '.join(rankings)
         transformed.append(transformed_conf)
     return transformed
 def main():
     try:
         # Fetch current conferences.yml
-        current_file = 'src/data/conferences.yml'
-        with open(current_file, 'r') as f:
             current_conferences = yaml.safe_load(f)
         # Fetch and transform new data
         new_conferences = fetch_conference_files()
         if not new_conferences:
             print("Warning: No conferences fetched from ccfddl")
             return
         transformed_conferences = transform_conference_data(new_conferences)
         if not transformed_conferences:
             print("Warning: No conferences transformed")
             return
         # Create a dictionary of current conferences by ID
-        current_conf_dict = {conf['id']: conf for conf in current_conferences}
         # Create a set of existing conference title+year combinations to check for duplicates
-        existing_conf_keys = {(conf['title'], conf['year']) for conf in current_conferences}
         # Update or add new conferences while preserving existing ones
         for new_conf in transformed_conferences:
             # Check if this is a duplicate based on title and year
-            conf_key = (new_conf['title'], new_conf['year'])
             # Skip if we already have a conference with this title and year but different ID
-            if conf_key in existing_conf_keys and new_conf['id'] not in current_conf_dict:
-                print(f"Skipping duplicate conference: {new_conf['title']} {new_conf['year']} (ID: {new_conf['id']})")
                 continue
-            if new_conf['id'] in current_conf_dict:
                 # Update existing conference while preserving fields
-                curr_conf = current_conf_dict[new_conf['id']]
                 # Preserve existing fields
                 preserved_fields = [
-                    'tags', 'venue', 'hindex', 'submission_deadline',
-                    'timezone_submission', 'rebuttal_period_start',
-                    'rebuttal_period_end', 'final_decision_date',
-                    'review_release_date', 'commitment_deadline',
-                    'start', 'end', 'note', 'city', 'country'  # Added city and country to preserved fields
                 ]
                 for field in preserved_fields:
                     if field in curr_conf:
                         new_conf[field] = curr_conf[field]
                 # If start/end not in current conference but we parsed them, keep the parsed ones
-                if 'start' not in curr_conf and 'start' in new_conf:
-                    new_conf['start'] = new_conf['start']
-                if 'end' not in curr_conf and 'end' in new_conf:
-                    new_conf['end'] = new_conf['end']
                 # Preserve existing rankings if available
-                if 'rankings' in curr_conf:
-                    new_conf['rankings'] = curr_conf['rankings']
                 # Update the conference in the dictionary
-                current_conf_dict[new_conf['id']] = new_conf
             else:
                 # Add new conference to the dictionary
-                current_conf_dict[new_conf['id']] = new_conf
                 # Add to our set of existing conference keys
                 existing_conf_keys.add(conf_key)
         # Convert back to list and sort by deadline
         all_conferences = list(current_conf_dict.values())
-        all_conferences.sort(key=lambda x: x.get('deadline', '9999'))
         # Write back to file with newlines between conferences
-        with open(current_file, 'w') as f:
             for i, conf in enumerate(all_conferences):
                 if i > 0:
-                    f.write('\n\n')  # Add two newlines between conferences
                 yaml_str = yaml.dump(
                     [conf],
                     allow_unicode=True,
@@ -250,16 +268,16 @@ def main():
                     default_style=None,
                 )
                 f.write(yaml_str.rstrip())  # Remove trailing whitespace
             # Add final newline
-            f.write('\n')
         print(f"Successfully updated {len(all_conferences)} conferences")
     except Exception as e:
         print(f"Error: {e}")
         raise
 if __name__ == "__main__":
-    main()

 def fetch_conference_files() -> List[Dict[str, Any]]:
     """Fetch all conference YAML files from ccfddl repository."""
     # First get the directory listing from GitHub API
     api_url = "https://api.github.com/repos/ccfddl/ccf-deadlines/contents/conference/AI"
     response = requests.get(api_url)
     files = response.json()
     conferences = []
     for file in files:
+        if file["name"].endswith(".yml"):
+            yaml_content = requests.get(file["download_url"]).text
             conf_data = yaml.safe_load(yaml_content)
             # The data is a list with a single item
             if isinstance(conf_data, list) and len(conf_data) > 0:
                 conferences.append(conf_data[0])
     return conferences
     """Parse various date formats and return start and end dates."""
     # Remove the year if it appears at the end of the string
     date_str = date_str.replace(f", {year}", "")
     # Handle various date formats
     try:
         # Split into start and end dates
+        if " - " in date_str:
+            start, end = date_str.split(" - ")
+        elif "-" in date_str:
+            start, end = date_str.split("-")
         else:
             # For single date format like "May 19, 2025"
             start = end = date_str
         # Clean up month abbreviations
         month_map = {
+            "Sept": "September",  # Handle Sept before Sep
+            "Jan": "January",
+            "Feb": "February",
+            "Mar": "March",
+            "Apr": "April",
+            "Jun": "June",
+            "Jul": "July",
+            "Aug": "August",
+            "Sep": "September",
+            "Oct": "October",
+            "Nov": "November",
+            "Dec": "December",
         }
         # Create a set of all month names (full and abbreviated)
         all_months = set(month_map.keys()) | set(month_map.values())
         # Handle cases like "April 29-May 4"
         has_month = any(month in end for month in all_months)
         if not has_month:
             start_parts = start.split()
             if len(start_parts) >= 1:
                 end = f"{start_parts[0]} {end.strip()}"
         # Replace month abbreviations
         for abbr, full in month_map.items():
             start = start.replace(abbr, full)
             end = end.replace(abbr, full)
         # Clean up any extra spaces
+        start = " ".join(start.split())
+        end = " ".join(end.split())
         # Parse start date
         start_date = datetime.strptime(f"{start}, {year}", "%B %d, %Y")
         # Parse end date
         end_date = datetime.strptime(f"{end}, {year}", "%B %d, %Y")
+        return start_date.strftime("%Y-%m-%d"), end_date.strftime("%Y-%m-%d")
     except Exception as e:
         raise ValueError(f"Could not parse date: {date_str} ({e})")
+def transform_conference_data(
+    conferences: List[Dict[str, Any]],
+) -> List[Dict[str, Any]]:
     """Transform ccfddl format to our format."""
     transformed = []
     current_year = datetime.now().year
     for conf in conferences:
         # Get the most recent or upcoming conference instance
         recent_conf = None
+        if "confs" in conf:
+            for instance in conf["confs"]:
+                if instance["year"] >= current_year:
                     recent_conf = instance
                     break
         if not recent_conf:
             continue
         # Transform to our format
         transformed_conf = {
+            "title": conf.get("title", ""),
+            "year": recent_conf["year"],
+            "id": recent_conf["id"],
+            "full_name": conf.get("description", ""),
+            "link": recent_conf.get("link", ""),
+            "deadline": recent_conf.get("timeline", [{}])[0].get("deadline", ""),
+            "timezone": recent_conf.get("timezone", ""),
+            "date": recent_conf.get("date", ""),
+            "tags": [],  # We'll need to maintain a mapping for tags
         }
         # Handle city and country fields instead of place
+        place = recent_conf.get("place", "")
         if place:
             # Try to parse the place into city and country if it contains a comma
+            if "," in place:
+                city, country = place.split(",", 1)
+                transformed_conf["city"] = city.strip()
+                transformed_conf["country"] = country.strip()
             else:
                 # If we can't parse, just set the country
+                transformed_conf["country"] = place.strip()
         # Add optional fields
+        timeline = recent_conf.get("timeline", [{}])[0]
+        if "abstract_deadline" in timeline:
+            transformed_conf["abstract_deadline"] = timeline["abstract_deadline"]
         # Parse date range for start/end
         try:
+            if transformed_conf["date"]:
                 start_date, end_date = parse_date_range(
+                    transformed_conf["date"], str(transformed_conf["year"])
                 )
+                transformed_conf["start"] = start_date
+                transformed_conf["end"] = end_date
         except Exception as e:
             print(f"Warning: Could not parse date for {transformed_conf['title']}: {e}")
         # Add rankings as separate field
+        if "rank" in conf:
             rankings = []
+            for rank_type, rank_value in conf["rank"].items():
                 rankings.append(f"{rank_type.upper()}: {rank_value}")
             if rankings:
+                transformed_conf["rankings"] = ", ".join(rankings)
         transformed.append(transformed_conf)
     return transformed
 def main():
     try:
         # Fetch current conferences.yml
+        current_file = "src/data/conferences.yml"
+        with open(current_file, "r") as f:
             current_conferences = yaml.safe_load(f)
         # Fetch and transform new data
         new_conferences = fetch_conference_files()
         if not new_conferences:
             print("Warning: No conferences fetched from ccfddl")
             return
         transformed_conferences = transform_conference_data(new_conferences)
         if not transformed_conferences:
             print("Warning: No conferences transformed")
             return
         # Create a dictionary of current conferences by ID
+        current_conf_dict = {conf["id"]: conf for conf in current_conferences}
         # Create a set of existing conference title+year combinations to check for duplicates
+        existing_conf_keys = {
+            (conf["title"], conf["year"]) for conf in current_conferences
+        }
         # Update or add new conferences while preserving existing ones
         for new_conf in transformed_conferences:
             # Check if this is a duplicate based on title and year
+            conf_key = (new_conf["title"], new_conf["year"])
             # Skip if we already have a conference with this title and year but different ID
+            if (
+                conf_key in existing_conf_keys
+                and new_conf["id"] not in current_conf_dict
+            ):
+                print(
+                    f"Skipping duplicate conference: {new_conf['title']} {new_conf['year']} (ID: {new_conf['id']})"
+                )
                 continue
+            if new_conf["id"] in current_conf_dict:
                 # Update existing conference while preserving fields
+                curr_conf = current_conf_dict[new_conf["id"]]
                 # Preserve existing fields
                 preserved_fields = [
+                    "tags",
+                    "venue",
+                    "hindex",
+                    "submission_deadline",
+                    "timezone_submission",
+                    "rebuttal_period_start",
+                    "rebuttal_period_end",
+                    "final_decision_date",
+                    "review_release_date",
+                    "commitment_deadline",
+                    "start",
+                    "end",
+                    "note",
+                    "city",
+                    "country",  # Added city and country to preserved fields
                 ]
                 for field in preserved_fields:
                     if field in curr_conf:
                         new_conf[field] = curr_conf[field]
                 # If start/end not in current conference but we parsed them, keep the parsed ones
+                if "start" not in curr_conf and "start" in new_conf:
+                    new_conf["start"] = new_conf["start"]
+                if "end" not in curr_conf and "end" in new_conf:
+                    new_conf["end"] = new_conf["end"]
                 # Preserve existing rankings if available
+                if "rankings" in curr_conf:
+                    new_conf["rankings"] = curr_conf["rankings"]
                 # Update the conference in the dictionary
+                current_conf_dict[new_conf["id"]] = new_conf
             else:
                 # Add new conference to the dictionary
+                current_conf_dict[new_conf["id"]] = new_conf
                 # Add to our set of existing conference keys
                 existing_conf_keys.add(conf_key)
         # Convert back to list and sort by deadline
         all_conferences = list(current_conf_dict.values())
+        all_conferences.sort(key=lambda x: x.get("deadline", "9999"))
         # Write back to file with newlines between conferences
+        with open(current_file, "w") as f:
             for i, conf in enumerate(all_conferences):
                 if i > 0:
+                    f.write("\n\n")  # Add two newlines between conferences
                 yaml_str = yaml.dump(
                     [conf],
                     allow_unicode=True,
                     default_style=None,
                 )
                 f.write(yaml_str.rstrip())  # Remove trailing whitespace
             # Add final newline
+            f.write("\n")
         print(f"Successfully updated {len(all_conferences)} conferences")
     except Exception as e:
         print(f"Error: {e}")
         raise
 if __name__ == "__main__":
+    main()

.github/scripts/update_conferences_new.py CHANGED Viewed

@@ -8,21 +8,21 @@ from typing import Dict, List, Any
 def fetch_conference_files() -> List[Dict[str, Any]]:
     """Fetch all conference YAML files from ccfddl repository."""
     # First get the directory listing from GitHub API
     api_url = "https://api.github.com/repos/ccfddl/ccf-deadlines/contents/conference/AI"
     response = requests.get(api_url)
     files = response.json()
     conferences = []
     for file in files:
-        if file['name'].endswith('.yml'):
-            yaml_content = requests.get(file['download_url']).text
             conf_data = yaml.safe_load(yaml_content)
             # The data is a list with a single item
             if isinstance(conf_data, list) and len(conf_data) > 0:
                 conferences.append(conf_data[0])
     return conferences
@@ -30,37 +30,37 @@ def parse_date_range(date_str: str, year: str) -> tuple[str, str]:
     """Parse various date formats and return start and end dates."""
     # Remove the year if it appears at the end of the string
     date_str = date_str.replace(f", {year}", "")
     # Handle various date formats
     try:
         # Split into start and end dates
-        if ' - ' in date_str:
-            start, end = date_str.split(' - ')
-        elif '-' in date_str:
-            start, end = date_str.split('-')
         else:
             # For single date format like "May 19, 2025"
             start = end = date_str
         # Clean up month abbreviations
         month_map = {
-            'Sept': 'September',  # Handle Sept before Sep
-            'Jan': 'January',
-            'Feb': 'February',
-            'Mar': 'March',
-            'Apr': 'April',
-            'Jun': 'June',
-            'Jul': 'July',
-            'Aug': 'August',
-            'Sep': 'September',
-            'Oct': 'October',
-            'Nov': 'November',
-            'Dec': 'December'
         }
         # Create a set of all month names (full and abbreviated)
         all_months = set(month_map.keys()) | set(month_map.values())
         # Handle cases like "April 29-May 4"
         has_month = any(month in end for month in all_months)
         if not has_month:
@@ -68,152 +68,153 @@ def parse_date_range(date_str: str, year: str) -> tuple[str, str]:
             start_parts = start.split()
             if len(start_parts) >= 1:
                 end = f"{start_parts[0]} {end.strip()}"
         # Replace month abbreviations
         for abbr, full in month_map.items():
             start = start.replace(abbr, full)
             end = end.replace(abbr, full)
         # Clean up any extra spaces
-        start = ' '.join(start.split())
-        end = ' '.join(end.split())
         # Parse start date
         start_date = datetime.strptime(f"{start}, {year}", "%B %d, %Y")
         # Parse end date
         end_date = datetime.strptime(f"{end}, {year}", "%B %d, %Y")
-        return start_date.strftime('%Y-%m-%d'), end_date.strftime('%Y-%m-%d')
     except Exception as e:
         raise ValueError(f"Could not parse date: {date_str} ({e})")
-def transform_conference_data(conferences: List[Dict[str, Any]]) -> List[Dict[str, Any]]:
     """Transform ccfddl format to our format."""
     transformed = []
     current_year = datetime.now().year
     for conf in conferences:
         # Get the most recent or upcoming conference instance
         recent_conf = None
-        if 'confs' in conf:
-            for instance in conf['confs']:
-                if instance['year'] >= current_year:
                     recent_conf = instance
                     break
         if not recent_conf:
             continue
         # Transform to our format
         transformed_conf = {
-            'title': conf.get('title', ''),
-            'year': recent_conf['year'],
-            'id': recent_conf['id'],
-            'full_name': conf.get('description', ''),
-            'link': recent_conf.get('link', ''),
-            'deadline': recent_conf.get('timeline', [{}])[0].get('deadline', ''),
-            'timezone': recent_conf.get('timezone', ''),
-            'date': recent_conf.get('date', ''),
-            'tags': [],  # We'll need to maintain a mapping for tags
         }
         # Handle city and country fields instead of place
-        place = recent_conf.get('place', '')
         if place:
             # Try to parse the place into city and country if it contains a comma
-            if ',' in place:
-                city, country = place.split(',', 1)
-                transformed_conf['city'] = city.strip()
-                transformed_conf['country'] = country.strip()
             else:
                 # If we can't parse, just set the country
-                transformed_conf['country'] = place.strip()
         # Add optional fields
-        timeline = recent_conf.get('timeline', [{}])[0]
-        if 'abstract_deadline' in timeline:
-            transformed_conf['abstract_deadline'] = timeline['abstract_deadline']
         # Parse date range for start/end
         try:
-            if transformed_conf['date']:
                 start_date, end_date = parse_date_range(
-                    transformed_conf['date'],
-                    str(transformed_conf['year'])
                 )
-                transformed_conf['start'] = start_date
-                transformed_conf['end'] = end_date
         except Exception as e:
             print(f"Warning: Could not parse date for {transformed_conf['title']}: {e}")
         # Add rankings as separate field
-        if 'rank' in conf:
             rankings = []
-            for rank_type, rank_value in conf['rank'].items():
                 rankings.append(f"{rank_type.upper()}: {rank_value}")
             if rankings:
-                transformed_conf['rankings'] = ', '.join(rankings)
         transformed.append(transformed_conf)
     return transformed
 def load_all_current_conferences() -> Dict[str, List[Dict[str, Any]]]:
     """Load all current conferences from individual files."""
-    conferences_dir = 'src/data/conferences'
     conference_groups = {}
     if not os.path.exists(conferences_dir):
         return {}
     for filename in os.listdir(conferences_dir):
-        if filename.endswith('.yml'):
             filepath = os.path.join(conferences_dir, filename)
-            with open(filepath, 'r') as f:
                 conferences = yaml.safe_load(f)
                 if conferences:
                     # Extract conference title from the first entry
-                    title = conferences[0]['title']
                     conference_groups[title] = conferences
     return conference_groups
 def create_filename_from_title(title: str) -> str:
     """Create a filename-safe version of the conference title."""
-    filename = re.sub(r'[^a-zA-Z0-9\s&()-]', '', title.lower())
-    filename = re.sub(r'\s+', '_', filename)
-    filename = filename.replace('&', 'and')
-    filename = filename.strip('_')
     return filename
 def update_conference_loader():
     """Update the conference loader file with all current conferences."""
-    conferences_dir = 'src/data/conferences'
-    loader_path = 'src/utils/conferenceLoader.ts'
     # Get all conference files
     conference_files = []
     if os.path.exists(conferences_dir):
         for filename in sorted(os.listdir(conferences_dir)):
-            if filename.endswith('.yml'):
                 conference_files.append(filename)
     # Generate import statements
     imports = []
     variable_names = []
     for filename in conference_files:
         # Create variable name from filename
-        var_name = filename.replace('.yml', '').replace('-', '_') + 'Data'
         variable_names.append(var_name)
         imports.append(f"import {var_name} from '@/data/conferences/{filename}';")
     # Generate the loader file content
     loader_content = f"""import {{ Conference }} from '@/types/conference';
@@ -222,15 +223,15 @@ def update_conference_loader():
 // Combine all conference data into a single array
 const allConferencesData: Conference[] = [
-{chr(10).join(f'  ...{var_name},' for var_name in variable_names)}
 ];
 export default allConferencesData;"""
     # Write the loader file
-    with open(loader_path, 'w') as f:
         f.write(loader_content)
     print(f"Updated conference loader with {len(conference_files)} conference files")
@@ -238,83 +239,100 @@ def main():
     try:
         # Load current conferences from individual files
         current_conference_groups = load_all_current_conferences()
         # Fetch and transform new data
         new_conferences = fetch_conference_files()
         if not new_conferences:
             print("Warning: No conferences fetched from ccfddl")
             return
         transformed_conferences = transform_conference_data(new_conferences)
         if not transformed_conferences:
             print("Warning: No conferences transformed")
             return
         # Create conferences directory if it doesn't exist
-        conferences_dir = 'src/data/conferences'
         os.makedirs(conferences_dir, exist_ok=True)
         # Group new conferences by title
         new_conference_groups = {}
         for conf in transformed_conferences:
-            title = conf['title']
             if title not in new_conference_groups:
                 new_conference_groups[title] = []
             new_conference_groups[title].append(conf)
         # Update each conference group
         updated_count = 0
         for title, new_confs in new_conference_groups.items():
-            filename = create_filename_from_title(title) + '.yml'
             filepath = os.path.join(conferences_dir, filename)
             # Get current conferences for this title
             current_confs = current_conference_groups.get(title, [])
-            current_conf_dict = {conf['id']: conf for conf in current_confs}
             # Update or add new conferences
             for new_conf in new_confs:
-                if new_conf['id'] in current_conf_dict:
                     # Update existing conference while preserving fields
-                    curr_conf = current_conf_dict[new_conf['id']]
                     # Preserve existing fields
                     preserved_fields = [
-                        'tags', 'venue', 'hindex', 'submission_deadline',
-                        'timezone_submission', 'rebuttal_period_start',
-                        'rebuttal_period_end', 'final_decision_date',
-                        'review_release_date', 'commitment_deadline',
-                        'start', 'end', 'note', 'city', 'country', 'deadlines'
                     ]
                     for field in preserved_fields:
                         if field in curr_conf:
                             new_conf[field] = curr_conf[field]
                     # Preserve existing rankings if available
-                    if 'rankings' in curr_conf:
-                        new_conf['rankings'] = curr_conf['rankings']
-                    current_conf_dict[new_conf['id']] = new_conf
                 else:
                     # Add new conference
-                    current_conf_dict[new_conf['id']] = new_conf
             # Convert back to list and sort by year
             all_confs = list(current_conf_dict.values())
-            all_confs.sort(key=lambda x: x.get('year', 9999))
             # Write to individual file
-            with open(filepath, 'w') as f:
-                yaml.dump(all_confs, f, default_flow_style=False, sort_keys=False, allow_unicode=True)
             updated_count += 1
             print(f"Updated {filename} with {len(all_confs)} entries")
         # Update the conference loader
         update_conference_loader()
         print(f"Successfully updated {updated_count} conference files")
     except Exception as e:
         print(f"Error: {e}")
         raise

 def fetch_conference_files() -> List[Dict[str, Any]]:
     """Fetch all conference YAML files from the ccfddl repository.

     Lists the ``conference/AI`` directory through the GitHub contents API,
     downloads every entry whose name ends in ``.yml`` and parses it with
     ``yaml.safe_load``.

     Returns:
         The first item of every downloaded file whose top-level YAML value
         is a non-empty list.

     Raises:
         requests.HTTPError: If the directory listing or a file download
             answers with an HTTP error status.
         ValueError: If the directory listing is not a JSON array.
     """
     api_url = "https://api.github.com/repos/ccfddl/ccf-deadlines/contents/conference/AI"
     # Without a timeout a stalled connection would block the job indefinitely.
     response = requests.get(api_url, timeout=30)
     response.raise_for_status()
     files = response.json()
     if not isinstance(files, list):
         # Iterating a JSON object would yield its keys (plain strings) and
         # fail later with an unhelpful TypeError, so reject it up front.
         raise ValueError(
             f"Unexpected directory listing from {api_url}: {type(files).__name__}"
         )

     conferences = []
     for entry in files:
         if not entry["name"].endswith(".yml"):
             continue
         download = requests.get(entry["download_url"], timeout=30)
         # Do not try to parse an error page as conference YAML.
         download.raise_for_status()
         conf_data = yaml.safe_load(download.text)
         # The data is a list with a single item
         if isinstance(conf_data, list) and len(conf_data) > 0:
             conferences.append(conf_data[0])
     return conferences
     """Parse various date formats and return start and end dates."""
     # Remove the year if it appears at the end of the string
     date_str = date_str.replace(f", {year}", "")
     # Handle various date formats
     try:
         # Split into start and end dates
+        if " - " in date_str:
+            start, end = date_str.split(" - ")
+        elif "-" in date_str:
+            start, end = date_str.split("-")
         else:
             # For single date format like "May 19, 2025"
             start = end = date_str
         # Clean up month abbreviations
         month_map = {
+            "Sept": "September",  # Handle Sept before Sep
+            "Jan": "January",
+            "Feb": "February",
+            "Mar": "March",
+            "Apr": "April",
+            "Jun": "June",
+            "Jul": "July",
+            "Aug": "August",
+            "Sep": "September",
+            "Oct": "October",
+            "Nov": "November",
+            "Dec": "December",
         }
         # Create a set of all month names (full and abbreviated)
         all_months = set(month_map.keys()) | set(month_map.values())
         # Handle cases like "April 29-May 4"
         has_month = any(month in end for month in all_months)
         if not has_month:
             start_parts = start.split()
             if len(start_parts) >= 1:
                 end = f"{start_parts[0]} {end.strip()}"
         # Replace month abbreviations
         for abbr, full in month_map.items():
             start = start.replace(abbr, full)
             end = end.replace(abbr, full)
         # Clean up any extra spaces
+        start = " ".join(start.split())
+        end = " ".join(end.split())
         # Parse start date
         start_date = datetime.strptime(f"{start}, {year}", "%B %d, %Y")
         # Parse end date
         end_date = datetime.strptime(f"{end}, {year}", "%B %d, %Y")
+        return start_date.strftime("%Y-%m-%d"), end_date.strftime("%Y-%m-%d")
     except Exception as e:
         raise ValueError(f"Could not parse date: {date_str} ({e})")
+def transform_conference_data(
+    conferences: List[Dict[str, Any]],
+) -> List[Dict[str, Any]]:
     """Transform ccfddl format to our format."""
     transformed = []
     current_year = datetime.now().year
     for conf in conferences:
         # Get the most recent or upcoming conference instance
         recent_conf = None
+        if "confs" in conf:
+            for instance in conf["confs"]:
+                if instance["year"] >= current_year:
                     recent_conf = instance
                     break
         if not recent_conf:
             continue
         # Transform to our format
         transformed_conf = {
+            "title": conf.get("title", ""),
+            "year": recent_conf["year"],
+            "id": recent_conf["id"],
+            "full_name": conf.get("description", ""),
+            "link": recent_conf.get("link", ""),
+            "deadline": recent_conf.get("timeline", [{}])[0].get("deadline", ""),
+            "timezone": recent_conf.get("timezone", ""),
+            "date": recent_conf.get("date", ""),
+            "tags": [],  # We'll need to maintain a mapping for tags
         }
         # Handle city and country fields instead of place
+        place = recent_conf.get("place", "")
         if place:
             # Try to parse the place into city and country if it contains a comma
+            if "," in place:
+                city, country = place.split(",", 1)
+                transformed_conf["city"] = city.strip()
+                transformed_conf["country"] = country.strip()
             else:
                 # If we can't parse, just set the country
+                transformed_conf["country"] = place.strip()
         # Add optional fields
+        timeline = recent_conf.get("timeline", [{}])[0]
+        if "abstract_deadline" in timeline:
+            transformed_conf["abstract_deadline"] = timeline["abstract_deadline"]
         # Parse date range for start/end
         try:
+            if transformed_conf["date"]:
                 start_date, end_date = parse_date_range(
+                    transformed_conf["date"], str(transformed_conf["year"])
                 )
+                transformed_conf["start"] = start_date
+                transformed_conf["end"] = end_date
         except Exception as e:
             print(f"Warning: Could not parse date for {transformed_conf['title']}: {e}")
         # Add rankings as separate field
+        if "rank" in conf:
             rankings = []
+            for rank_type, rank_value in conf["rank"].items():
                 rankings.append(f"{rank_type.upper()}: {rank_value}")
             if rankings:
+                transformed_conf["rankings"] = ", ".join(rankings)
         transformed.append(transformed_conf)
     return transformed
 def load_all_current_conferences() -> Dict[str, List[Dict[str, Any]]]:
     """Load all current conferences from individual files.

     Reads every ``.yml`` file in ``src/data/conferences`` (relative to the
     current working directory).

     Returns:
         A mapping from conference title, taken from the first entry of each
         file, to the full list of entries in that file. Empty files are
         skipped. Returns an empty dict when the directory does not exist.
     """
     conferences_dir = "src/data/conferences"
     conference_groups = {}
     if not os.path.exists(conferences_dir):
         return {}
     for filename in os.listdir(conferences_dir):
         if not filename.endswith(".yml"):
             continue
         filepath = os.path.join(conferences_dir, filename)
         # Read as UTF-8 explicitly so non-ASCII names decode the same way
         # regardless of the platform's default encoding.
         with open(filepath, "r", encoding="utf-8") as f:
             conferences = yaml.safe_load(f)
         if conferences:
             # Extract conference title from the first entry
             title = conferences[0]["title"]
             conference_groups[title] = conferences
     return conference_groups
 def create_filename_from_title(title: str) -> str:
     """Create a filename-safe version of the conference title.

     The title is lower-cased, characters other than ASCII letters, digits,
     whitespace, ``&``, ``(``, ``)`` and ``-`` are dropped, whitespace runs
     become a single underscore, ``&`` becomes ``and`` and leading/trailing
     underscores are stripped.

     Args:
         title: Conference title, e.g. ``"AI & Stats"``.

     Returns:
         The derived name without extension, e.g. ``"ai_and_stats"``.
     """
     cleaned = re.sub(r"[^a-zA-Z0-9\s&()-]", "", title.lower())
     underscored = re.sub(r"\s+", "_", cleaned)
     return underscored.replace("&", "and").strip("_")
 def update_conference_loader():
     """Update the conference loader file with all current conferences."""
+    conferences_dir = "src/data/conferences"
+    loader_path = "src/utils/conferenceLoader.ts"
     # Get all conference files
     conference_files = []
     if os.path.exists(conferences_dir):
         for filename in sorted(os.listdir(conferences_dir)):
+            if filename.endswith(".yml"):
                 conference_files.append(filename)
     # Generate import statements
     imports = []
     variable_names = []
     for filename in conference_files:
         # Create variable name from filename
+        var_name = filename.replace(".yml", "").replace("-", "_") + "Data"
         variable_names.append(var_name)
         imports.append(f"import {var_name} from '@/data/conferences/{filename}';")
     # Generate the loader file content
     loader_content = f"""import {{ Conference }} from '@/types/conference';
 // Combine all conference data into a single array
 const allConferencesData: Conference[] = [
+{chr(10).join(f"  ...{var_name}," for var_name in variable_names)}
 ];
 export default allConferencesData;"""
     # Write the loader file
+    with open(loader_path, "w") as f:
         f.write(loader_content)
     print(f"Updated conference loader with {len(conference_files)} conference files")
     try:
         # Load current conferences from individual files
         current_conference_groups = load_all_current_conferences()
         # Fetch and transform new data
         new_conferences = fetch_conference_files()
         if not new_conferences:
             print("Warning: No conferences fetched from ccfddl")
             return
         transformed_conferences = transform_conference_data(new_conferences)
         if not transformed_conferences:
             print("Warning: No conferences transformed")
             return
         # Create conferences directory if it doesn't exist
+        conferences_dir = "src/data/conferences"
         os.makedirs(conferences_dir, exist_ok=True)
         # Group new conferences by title
         new_conference_groups = {}
         for conf in transformed_conferences:
+            title = conf["title"]
             if title not in new_conference_groups:
                 new_conference_groups[title] = []
             new_conference_groups[title].append(conf)
         # Update each conference group
         updated_count = 0
         for title, new_confs in new_conference_groups.items():
+            filename = create_filename_from_title(title) + ".yml"
             filepath = os.path.join(conferences_dir, filename)
             # Get current conferences for this title
             current_confs = current_conference_groups.get(title, [])
+            current_conf_dict = {conf["id"]: conf for conf in current_confs}
             # Update or add new conferences
             for new_conf in new_confs:
+                if new_conf["id"] in current_conf_dict:
                     # Update existing conference while preserving fields
+                    curr_conf = current_conf_dict[new_conf["id"]]
                     # Preserve existing fields
                     preserved_fields = [
+                        "tags",
+                        "venue",
+                        "hindex",
+                        "submission_deadline",
+                        "timezone_submission",
+                        "rebuttal_period_start",
+                        "rebuttal_period_end",
+                        "final_decision_date",
+                        "review_release_date",
+                        "commitment_deadline",
+                        "start",
+                        "end",
+                        "note",
+                        "city",
+                        "country",
+                        "deadlines",
                     ]
                     for field in preserved_fields:
                         if field in curr_conf:
                             new_conf[field] = curr_conf[field]
                     # Preserve existing rankings if available
+                    if "rankings" in curr_conf:
+                        new_conf["rankings"] = curr_conf["rankings"]
+                    current_conf_dict[new_conf["id"]] = new_conf
                 else:
                     # Add new conference
+                    current_conf_dict[new_conf["id"]] = new_conf
             # Convert back to list and sort by year
             all_confs = list(current_conf_dict.values())
+            all_confs.sort(key=lambda x: x.get("year", 9999))
             # Write to individual file
+            with open(filepath, "w") as f:
+                yaml.dump(
+                    all_confs,
+                    f,
+                    default_flow_style=False,
+                    sort_keys=False,
+                    allow_unicode=True,
+                )
             updated_count += 1
             print(f"Updated {filename} with {len(all_confs)} entries")
         # Update the conference loader
         update_conference_loader()
         print(f"Successfully updated {updated_count} conference files")
     except Exception as e:
         print(f"Error: {e}")
         raise

agents/agent.py CHANGED Viewed

@@ -33,7 +33,11 @@ SCRIPT_DIR = Path(__file__).parent
 # Project root directory - use current working directory if set (for Modal),
 # otherwise use parent of agents/ directory (for local development)
 # This allows Modal to clone the repo and chdir to it before importing this module
-PROJECT_ROOT = Path(os.getcwd()) if os.environ.get("USE_CWD_AS_PROJECT_ROOT") else SCRIPT_DIR.parent
 async def read_prompt(filename: str) -> str:
@@ -52,37 +56,41 @@ async def read_app_readme() -> str:
 async def load_conference_data(conference_name: str) -> str:
     """Load conference data from YAML file.
     Args:
         conference_name: The name of the conference (e.g., 'neurips', 'aaai')
     Returns:
         The YAML content as a string, or an empty string if file not found.
     """
     yaml_path = PROJECT_ROOT / "src" / "data" / "conferences" / f"{conference_name}.yml"
     if not yaml_path.exists():
         print(f"Warning: Conference file not found at {yaml_path}")
         return ""
     async with aiofiles.open(yaml_path, "r", encoding="utf-8") as f:
         return await f.read()
-def format_user_prompt(template: str, conference_name: str, conference_data: str) -> str:
     """Format the user prompt template with conference name and data.
     Args:
         template: The user prompt template with placeholders.
         conference_name: The name of the conference.
         conference_data: The YAML content of the conference data.
     Returns:
         The formatted user prompt.
     """
     return template.format(
         conference_name=conference_name,
-        conference_data=conference_data if conference_data else "No existing data found.",
     )
@@ -96,19 +104,22 @@ async def find_conference_deadlines(conference_name: str) -> None:
     # Load conference data from YAML file
     conference_data = await load_conference_data(conference_name)
     # Read app README for system prompt
     app_readme = await read_app_readme()
     # Read and format system prompt
     system_prompt_template = await read_prompt("prompts/system_prompt.md")
-    from datetime import datetime
     def format_date_verbose(dt: datetime) -> str:
         # e.g. "Monday, the 1st of April, 2025"
         day = dt.day
-        suffix = "th" if 11 <= day <= 13 else {1: "st", 2: "nd", 3: "rd"}.get(day % 10, "th")
-        return f"{dt.strftime('%A')}, the {day}{suffix} of {dt.strftime('%B')}, {dt.year}"
     system_prompt = system_prompt_template.format(
         conference_name=conference_name,
@@ -130,14 +141,14 @@ async def find_conference_deadlines(conference_name: str) -> None:
         # Fallback to home directory (for Modal non-root user)
         settings_path = Path.home() / ".claude" / "settings.local.json"
     settings_path = str(settings_path)
     # Configure Exa MCP server for web search capabilities (only if API key is available)
     # See: https://docs.exa.ai/reference/exa-mcp
     # Note: On Modal, MCP causes claude-agent-sdk to exit early, so we disable it there
     exa_api_key = os.environ.get("EXA_API_KEY", "")
     disable_mcp = os.environ.get("DISABLE_EXA_MCP", "").lower() in ("1", "true", "yes")
     mcp_servers: dict[str, McpHttpServerConfig] = {}
     if disable_mcp:
         print("Exa MCP disabled via DISABLE_EXA_MCP environment variable")
         print("Using built-in WebSearch tool instead")
@@ -150,7 +161,7 @@ async def find_conference_deadlines(conference_name: str) -> None:
         )
     else:
         print("EXA_API_KEY not found, Exa MCP will not be available")
     # Only pass mcp_servers if we have any configured
     # Passing empty dict or MCP servers can cause issues in some environments
     options_kwargs = {
@@ -163,7 +174,7 @@ async def find_conference_deadlines(conference_name: str) -> None:
         print(f"Configuring with MCP servers: {list(mcp_servers.keys())}")
     else:
         print("No MCP servers configured, using built-in tools only")
     options = ClaudeAgentOptions(**options_kwargs)
     # Run the agent query
@@ -216,14 +227,18 @@ async def find_conference_deadlines(conference_name: str) -> None:
                             # Get the tool name from our tracking dict
                             tool_name = tool_names.get(block.tool_use_id, "unknown")
                             # Truncate long results for readability
-                            content_str = str(block.content) if block.content else "(empty)"
                             if len(content_str) > 500:
                                 content_str = content_str[:500] + "... (truncated)"
                             error_indicator = " [ERROR]" if block.is_error else ""
-                            print(f"[result]{error_indicator} {tool_name}: {content_str}")
             elif isinstance(message, ResultMessage):
                 # Print result details
-                if hasattr(message, 'error') and message.error:
                     print(f"[result] ERROR: {message.error}")
                 if message.total_cost_usd and message.total_cost_usd > 0:
                     print(f"\nCost: ${message.total_cost_usd:.4f}")
@@ -249,4 +264,4 @@ if __name__ == "__main__":
     args = parser.parse_args()
     conference_name = args.conference_name
-    asyncio.run(find_conference_deadlines(conference_name))

 # Project root directory: the current working directory when the
 # USE_CWD_AS_PROJECT_ROOT environment variable is set to a non-empty value
 # (for Modal), otherwise the parent of the agents/ directory (for local
 # development). This allows Modal to clone the repo and chdir to it before
 # importing this module.
 PROJECT_ROOT = (
     Path(os.getcwd())
     if os.environ.get("USE_CWD_AS_PROJECT_ROOT")
     else SCRIPT_DIR.parent
 )
 async def read_prompt(filename: str) -> str:
 async def load_conference_data(conference_name: str) -> str:
     """Read the YAML file of one conference and return its text.

     Args:
         conference_name: The name of the conference (e.g., 'neurips', 'aaai');
             it is used as the file stem under ``src/data/conferences``.

     Returns:
         The YAML content as a string, or an empty string (after printing a
         warning) if the file does not exist.
     """
     conferences_dir = PROJECT_ROOT / "src" / "data" / "conferences"
     yaml_path = conferences_dir / f"{conference_name}.yml"

     if yaml_path.exists():
         async with aiofiles.open(yaml_path, "r", encoding="utf-8") as handle:
             return await handle.read()

     print(f"Warning: Conference file not found at {yaml_path}")
     return ""
+def format_user_prompt(
+    template: str, conference_name: str, conference_data: str
+) -> str:
     """Format the user prompt template with conference name and data.
     Args:
         template: The user prompt template with placeholders.
         conference_name: The name of the conference.
         conference_data: The YAML content of the conference data.
     Returns:
         The formatted user prompt.
     """
     return template.format(
         conference_name=conference_name,
+        conference_data=conference_data
+        if conference_data
+        else "No existing data found.",
     )
     # Load conference data from YAML file
     conference_data = await load_conference_data(conference_name)
     # Read app README for system prompt
     app_readme = await read_app_readme()
     # Read and format system prompt
     system_prompt_template = await read_prompt("prompts/system_prompt.md")
     def format_date_verbose(dt: datetime) -> str:
         """Render a date verbosely, e.g. "Tuesday, the 1st of April, 2025"."""
         day = dt.day
         # 11, 12 and 13 take "th" even though they end in 1, 2 and 3.
         if 11 <= day <= 13:
             suffix = "th"
         else:
             suffix = {1: "st", 2: "nd", 3: "rd"}.get(day % 10, "th")
         weekday = dt.strftime("%A")
         month = dt.strftime("%B")
         return f"{weekday}, the {day}{suffix} of {month}, {dt.year}"
     system_prompt = system_prompt_template.format(
         conference_name=conference_name,
         # Fallback to home directory (for Modal non-root user)
         settings_path = Path.home() / ".claude" / "settings.local.json"
     settings_path = str(settings_path)
     # Configure Exa MCP server for web search capabilities (only if API key is available)
     # See: https://docs.exa.ai/reference/exa-mcp
     # Note: On Modal, MCP causes claude-agent-sdk to exit early, so we disable it there
     exa_api_key = os.environ.get("EXA_API_KEY", "")
     disable_mcp = os.environ.get("DISABLE_EXA_MCP", "").lower() in ("1", "true", "yes")
     mcp_servers: dict[str, McpHttpServerConfig] = {}
     if disable_mcp:
         print("Exa MCP disabled via DISABLE_EXA_MCP environment variable")
         print("Using built-in WebSearch tool instead")
         )
     else:
         print("EXA_API_KEY not found, Exa MCP will not be available")
     # Only pass mcp_servers if we have any configured
     # Passing empty dict or MCP servers can cause issues in some environments
     options_kwargs = {
         print(f"Configuring with MCP servers: {list(mcp_servers.keys())}")
     else:
         print("No MCP servers configured, using built-in tools only")
     options = ClaudeAgentOptions(**options_kwargs)
     # Run the agent query
                             # Get the tool name from our tracking dict
                             tool_name = tool_names.get(block.tool_use_id, "unknown")
                             # Truncate long results for readability
+                            content_str = (
+                                str(block.content) if block.content else "(empty)"
+                            )
                             if len(content_str) > 500:
                                 content_str = content_str[:500] + "... (truncated)"
                             error_indicator = " [ERROR]" if block.is_error else ""
+                            print(
+                                f"[result]{error_indicator} {tool_name}: {content_str}"
+                            )
             elif isinstance(message, ResultMessage):
                 # Print result details
+                if hasattr(message, "error") and message.error:
                     print(f"[result] ERROR: {message.error}")
                 if message.total_cost_usd and message.total_cost_usd > 0:
                     print(f"\nCost: ${message.total_cost_usd:.4f}")
     args = parser.parse_args()
     conference_name = args.conference_name
+    asyncio.run(find_conference_deadlines(conference_name))

agents/modal_agent.py CHANGED Viewed

@@ -43,22 +43,21 @@ CONFERENCES_DIR = "src/data/conferences"
 def get_conferences(base_dir: str = REPO_DIR) -> list[str]:
     """Get list of all conferences by reading yml files from the conferences directory.
     Args:
         base_dir: Base directory of the repository.
     Returns:
         Sorted list of conference names (yml filenames without extension).
     """
     conferences_path = Path(base_dir) / CONFERENCES_DIR
     if not conferences_path.exists():
         raise FileNotFoundError(f"Conferences directory not found: {conferences_path}")
-    conferences = [
-        f.stem for f in conferences_path.glob("*.yml")
-    ]
     return sorted(conferences)
 # Define the Modal image with all required dependencies
 image = (
     modal.Image.debian_slim(python_version="3.11")
@@ -160,7 +159,7 @@ def setup_git_and_clone():
 @app.function(timeout=600)
 def process_single_conference(conference_name: str) -> dict:
     """Process a single conference using the Claude Agent SDK.
     The agent will update the conference data and handle git add/commit/push.
     Args:
@@ -181,10 +180,10 @@ def process_single_conference(conference_name: str) -> dict:
     os.environ["HOME"] = agent_user.pw_dir
     os.environ["USER"] = "agent"
     os.environ["LOGNAME"] = "agent"
     # Ensure subprocess inherits correct user context
     os.environ["SHELL"] = "/bin/bash"
     # Disable MCP for now - known issue where MCP causes SDK to exit early on Modal
     # The agent will use built-in WebSearch tool instead
     # See MODAL_DEBUGGING.md for details
@@ -200,7 +199,7 @@ def process_single_conference(conference_name: str) -> dict:
     # Change to repo directory so relative paths work
     os.chdir(REPO_DIR)
     # Tell agent.py to use current working directory as PROJECT_ROOT
     # This ensures conference data is read from the cloned repo, not the mounted app directory
     os.environ["USE_CWD_AS_PROJECT_ROOT"] = "1"
@@ -228,7 +227,7 @@ def process_single_conference(conference_name: str) -> dict:
 @app.function(timeout=43200)  # 12 hours max for all conferences
 def process_all_conferences() -> list[dict]:
     """Process all conferences sequentially.
     Each conference is processed one at a time. The agent handles
     git add/commit/push for each conference via its Bash tool.
@@ -236,16 +235,16 @@ def process_all_conferences() -> list[dict]:
         List of results for each processed conference.
     """
     import pwd
     # Switch to non-root user (required for git operations)
     agent_user = pwd.getpwnam("agent")
     os.setgid(agent_user.pw_gid)
     os.setuid(agent_user.pw_uid)
     os.environ["HOME"] = agent_user.pw_dir
     # Clone repo first to get the list of conferences
     setup_git_and_clone()
     # Get conferences from yml files in the cloned repo
     conferences = get_conferences()
     results = []
@@ -263,11 +262,13 @@ def process_all_conferences() -> list[dict]:
         except Exception as e:
             print(f"Error processing {conference}: {e}")
-            results.append({
-                "conference": conference,
-                "status": "error",
-                "error": str(e),
-            })
     print(f"\n{'=' * 60}")
     print(f"Completed processing {len(conferences)} conferences")
@@ -284,15 +285,15 @@ def scheduled_run():
     """Scheduled weekly run of all conferences."""
     print("Starting scheduled weekly conference update...")
     results = process_all_conferences.remote()
     # Summary
     completed = sum(1 for r in results if r.get("status") == "completed")
     errors = sum(1 for r in results if r.get("status") == "error")
-    print(f"\nWeekly run completed:")
     print(f"  - Completed: {completed}")
     print(f"  - Errors: {errors}")
     return results
@@ -335,13 +336,13 @@ def main(
         print(f"\n{'=' * 60}")
         print("Summary:")
         print(f"{'=' * 60}")
         completed = [r for r in results if r.get("status") == "completed"]
         errors = [r for r in results if r.get("status") == "error"]
         print(f"Completed: {len(completed)}")
         print(f"Errors: {len(errors)}")
         if errors:
             print("\nErrors:")
             for r in errors:

 def get_conferences(base_dir: str = REPO_DIR) -> list[str]:
     """Get list of all conferences by reading yml files from the conferences directory.

     Args:
         base_dir: Base directory of the repository.

     Returns:
         Sorted list of conference names (yml filenames without extension).

     Raises:
         FileNotFoundError: If the conferences directory does not exist under
             ``base_dir``.
     """
     conferences_path = Path(base_dir) / CONFERENCES_DIR
     if not conferences_path.exists():
         raise FileNotFoundError(f"Conferences directory not found: {conferences_path}")
     # Only top-level *.yml files count; the stem is the conference name.
     return sorted(entry.stem for entry in conferences_path.glob("*.yml"))
 # Define the Modal image with all required dependencies
 image = (
     modal.Image.debian_slim(python_version="3.11")
 @app.function(timeout=600)
 def process_single_conference(conference_name: str) -> dict:
     """Process a single conference using the Claude Agent SDK.
     The agent will update the conference data and handle git add/commit/push.
     Args:
     os.environ["HOME"] = agent_user.pw_dir
     os.environ["USER"] = "agent"
     os.environ["LOGNAME"] = "agent"
     # Ensure subprocess inherits correct user context
     os.environ["SHELL"] = "/bin/bash"
     # Disable MCP for now - known issue where MCP causes SDK to exit early on Modal
     # The agent will use built-in WebSearch tool instead
     # See MODAL_DEBUGGING.md for details
     # Change to repo directory so relative paths work
     os.chdir(REPO_DIR)
     # Tell agent.py to use current working directory as PROJECT_ROOT
     # This ensures conference data is read from the cloned repo, not the mounted app directory
     os.environ["USE_CWD_AS_PROJECT_ROOT"] = "1"
 @app.function(timeout=43200)  # 12 hours max for all conferences
 def process_all_conferences() -> list[dict]:
     """Process all conferences sequentially.
     Each conference is processed one at a time. The agent handles
     git add/commit/push for each conference via its Bash tool.
         List of results for each processed conference.
     """
     import pwd
     # Switch to non-root user (required for git operations)
     agent_user = pwd.getpwnam("agent")
     os.setgid(agent_user.pw_gid)
     os.setuid(agent_user.pw_uid)
     os.environ["HOME"] = agent_user.pw_dir
     # Clone repo first to get the list of conferences
     setup_git_and_clone()
     # Get conferences from yml files in the cloned repo
     conferences = get_conferences()
     results = []
         except Exception as e:
             print(f"Error processing {conference}: {e}")
+            results.append(
+                {
+                    "conference": conference,
+                    "status": "error",
+                    "error": str(e),
+                }
+            )
     print(f"\n{'=' * 60}")
     print(f"Completed processing {len(conferences)} conferences")
     """Scheduled weekly run of all conferences."""
     print("Starting scheduled weekly conference update...")
     results = process_all_conferences.remote()
     # Summary
     completed = sum(1 for r in results if r.get("status") == "completed")
     errors = sum(1 for r in results if r.get("status") == "error")
+    print("\nWeekly run completed:")
     print(f"  - Completed: {completed}")
     print(f"  - Errors: {errors}")
     return results
         print(f"\n{'=' * 60}")
         print("Summary:")
         print(f"{'=' * 60}")
         completed = [r for r in results if r.get("status") == "completed"]
         errors = [r for r in results if r.get("status") == "error"]
         print(f"Completed: {len(completed)}")
         print(f"Errors: {len(errors)}")
         if errors:
             print("\nErrors:")
             for r in errors:

pyproject.toml CHANGED Viewed

@@ -7,4 +7,5 @@ requires-python = ">=3.12"
 dependencies = [
     "aiofiles>=25.1.0",
     "claude-agent-sdk>=0.1.18",
 ]

 dependencies = [
     "aiofiles>=25.1.0",
     "claude-agent-sdk>=0.1.18",
+    "ruff>=0.14.10",
 ]

uv.lock CHANGED Viewed

@@ -9,12 +9,14 @@ source = { virtual = "." }
 dependencies = [
     { name = "aiofiles" },
     { name = "claude-agent-sdk" },
 ]
 [package.metadata]
 requires-dist = [
     { name = "aiofiles", specifier = ">=25.1.0" },
     { name = "claude-agent-sdk", specifier = ">=0.1.18" },
 ]
 [[package]]
@@ -571,6 +573,32 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/d0/02/fa464cdfbe6b26e0600b62c528b72d8608f5cc49f96b8d6e38c95d60c676/rpds_py-0.30.0-cp314-cp314t-win_amd64.whl", hash = "sha256:27f4b0e92de5bfbc6f86e43959e6edd1425c33b5e69aab0984a72047f2bcf1e3", size = 226532 },
 ]
 [[package]]
 name = "sse-starlette"
 version = "3.0.4"

 dependencies = [
     { name = "aiofiles" },
     { name = "claude-agent-sdk" },
+    { name = "ruff" },
 ]
 [package.metadata]
 requires-dist = [
     { name = "aiofiles", specifier = ">=25.1.0" },
     { name = "claude-agent-sdk", specifier = ">=0.1.18" },
+    { name = "ruff", specifier = ">=0.14.10" },
 ]
 [[package]]
     { url = "https://files.pythonhosted.org/packages/d0/02/fa464cdfbe6b26e0600b62c528b72d8608f5cc49f96b8d6e38c95d60c676/rpds_py-0.30.0-cp314-cp314t-win_amd64.whl", hash = "sha256:27f4b0e92de5bfbc6f86e43959e6edd1425c33b5e69aab0984a72047f2bcf1e3", size = 226532 },
 ]
+[[package]]
+name = "ruff"
+version = "0.14.10"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/57/08/52232a877978dd8f9cf2aeddce3e611b40a63287dfca29b6b8da791f5e8d/ruff-0.14.10.tar.gz", hash = "sha256:9a2e830f075d1a42cd28420d7809ace390832a490ed0966fe373ba288e77aaf4", size = 5859763 }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/60/01/933704d69f3f05ee16ef11406b78881733c186fe14b6a46b05cfcaf6d3b2/ruff-0.14.10-py3-none-linux_armv6l.whl", hash = "sha256:7a3ce585f2ade3e1f29ec1b92df13e3da262178df8c8bdf876f48fa0e8316c49", size = 13527080 },
+    { url = "https://files.pythonhosted.org/packages/df/58/a0349197a7dfa603ffb7f5b0470391efa79ddc327c1e29c4851e85b09cc5/ruff-0.14.10-py3-none-macosx_10_12_x86_64.whl", hash = "sha256:674f9be9372907f7257c51f1d4fc902cb7cf014b9980152b802794317941f08f", size = 13797320 },
+    { url = "https://files.pythonhosted.org/packages/7b/82/36be59f00a6082e38c23536df4e71cdbc6af8d7c707eade97fcad5c98235/ruff-0.14.10-py3-none-macosx_11_0_arm64.whl", hash = "sha256:d85713d522348837ef9df8efca33ccb8bd6fcfc86a2cde3ccb4bc9d28a18003d", size = 12918434 },
+    { url = "https://files.pythonhosted.org/packages/a6/00/45c62a7f7e34da92a25804f813ebe05c88aa9e0c25e5cb5a7d23dd7450e3/ruff-0.14.10-py3-none-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:6987ebe0501ae4f4308d7d24e2d0fe3d7a98430f5adfd0f1fead050a740a3a77", size = 13371961 },
+    { url = "https://files.pythonhosted.org/packages/40/31/a5906d60f0405f7e57045a70f2d57084a93ca7425f22e1d66904769d1628/ruff-0.14.10-py3-none-manylinux_2_17_armv7l.manylinux2014_armv7l.whl", hash = "sha256:16a01dfb7b9e4eee556fbfd5392806b1b8550c9b4a9f6acd3dbe6812b193c70a", size = 13275629 },
+    { url = "https://files.pythonhosted.org/packages/3e/60/61c0087df21894cf9d928dc04bcd4fb10e8b2e8dca7b1a276ba2155b2002/ruff-0.14.10-py3-none-manylinux_2_17_i686.manylinux2014_i686.whl", hash = "sha256:7165d31a925b7a294465fa81be8c12a0e9b60fb02bf177e79067c867e71f8b1f", size = 14029234 },
+    { url = "https://files.pythonhosted.org/packages/44/84/77d911bee3b92348b6e5dab5a0c898d87084ea03ac5dc708f46d88407def/ruff-0.14.10-py3-none-manylinux_2_17_ppc64.manylinux2014_ppc64.whl", hash = "sha256:c561695675b972effb0c0a45db233f2c816ff3da8dcfbe7dfc7eed625f218935", size = 15449890 },
+    { url = "https://files.pythonhosted.org/packages/e9/36/480206eaefa24a7ec321582dda580443a8f0671fdbf6b1c80e9c3e93a16a/ruff-0.14.10-py3-none-manylinux_2_17_ppc64le.manylinux2014_ppc64le.whl", hash = "sha256:4bb98fcbbc61725968893682fd4df8966a34611239c9fd07a1f6a07e7103d08e", size = 15123172 },
+    { url = "https://files.pythonhosted.org/packages/5c/38/68e414156015ba80cef5473d57919d27dfb62ec804b96180bafdeaf0e090/ruff-0.14.10-py3-none-manylinux_2_17_s390x.manylinux2014_s390x.whl", hash = "sha256:f24b47993a9d8cb858429e97bdf8544c78029f09b520af615c1d261bf827001d", size = 14460260 },
+    { url = "https://files.pythonhosted.org/packages/b3/19/9e050c0dca8aba824d67cc0db69fb459c28d8cd3f6855b1405b3f29cc91d/ruff-0.14.10-py3-none-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:59aabd2e2c4fd614d2862e7939c34a532c04f1084476d6833dddef4afab87e9f", size = 14229978 },
+    { url = "https://files.pythonhosted.org/packages/51/eb/e8dd1dd6e05b9e695aa9dd420f4577debdd0f87a5ff2fedda33c09e9be8c/ruff-0.14.10-py3-none-manylinux_2_31_riscv64.whl", hash = "sha256:213db2b2e44be8625002dbea33bb9c60c66ea2c07c084a00d55732689d697a7f", size = 14338036 },
+    { url = "https://files.pythonhosted.org/packages/6a/12/f3e3a505db7c19303b70af370d137795fcfec136d670d5de5391e295c134/ruff-0.14.10-py3-none-musllinux_1_2_aarch64.whl", hash = "sha256:b914c40ab64865a17a9a5b67911d14df72346a634527240039eb3bd650e5979d", size = 13264051 },
+    { url = "https://files.pythonhosted.org/packages/08/64/8c3a47eaccfef8ac20e0484e68e0772013eb85802f8a9f7603ca751eb166/ruff-0.14.10-py3-none-musllinux_1_2_armv7l.whl", hash = "sha256:1484983559f026788e3a5c07c81ef7d1e97c1c78ed03041a18f75df104c45405", size = 13283998 },
+    { url = "https://files.pythonhosted.org/packages/12/84/534a5506f4074e5cc0529e5cd96cfc01bb480e460c7edf5af70d2bcae55e/ruff-0.14.10-py3-none-musllinux_1_2_i686.whl", hash = "sha256:c70427132db492d25f982fffc8d6c7535cc2fd2c83fc8888f05caaa248521e60", size = 13601891 },
+    { url = "https://files.pythonhosted.org/packages/0d/1e/14c916087d8598917dbad9b2921d340f7884824ad6e9c55de948a93b106d/ruff-0.14.10-py3-none-musllinux_1_2_x86_64.whl", hash = "sha256:5bcf45b681e9f1ee6445d317ce1fa9d6cba9a6049542d1c3d5b5958986be8830", size = 14336660 },
+    { url = "https://files.pythonhosted.org/packages/f2/1c/d7b67ab43f30013b47c12b42d1acd354c195351a3f7a1d67f59e54227ede/ruff-0.14.10-py3-none-win32.whl", hash = "sha256:104c49fc7ab73f3f3a758039adea978869a918f31b73280db175b43a2d9b51d6", size = 13196187 },
+    { url = "https://files.pythonhosted.org/packages/fb/9c/896c862e13886fae2af961bef3e6312db9ebc6adc2b156fe95e615dee8c1/ruff-0.14.10-py3-none-win_amd64.whl", hash = "sha256:466297bd73638c6bdf06485683e812db1c00c7ac96d4ddd0294a338c62fdc154", size = 14661283 },
+    { url = "https://files.pythonhosted.org/packages/74/31/b0e29d572670dca3674eeee78e418f20bdf97fa8aa9ea71380885e175ca0/ruff-0.14.10-py3-none-win_arm64.whl", hash = "sha256:e51d046cf6dda98a4633b8a8a771451107413b0f07183b2bef03f075599e44e6", size = 13729839 },
+]
 [[package]]
 name = "sse-starlette"
 version = "3.0.4"