Spaces:

RoyAalekh
/

hackathon_code4change

Sleeping

RoyAalekh committed on Nov 26, 2025

Commit

efb0735

1 Parent(s): 6a714c3

fix: Add UTF-8 encoding to CSV writers for Windows compatibility

- Fixed Windows 'charmap' codec error with Unicode characters
- Added encoding='utf-8' to all CSV file operations
- Updated EventWriter in scheduler/simulation/events.py
- Updated metrics CSV writer in scheduler/simulation/engine.py
- Fixed interactive mode to work with OutputManager

Changes:
- scheduler/simulation/events.py: UTF-8 encoding for events.csv
- scheduler/simulation/engine.py: UTF-8 encoding for metrics.csv
- court_scheduler_rl.py: Removed output_dir references in interactive mode

This fixes the "'charmap' codec can't encode character '\u2192'" error
that occurred during full pipeline runs on Windows.

Files changed (3)

court_scheduler_rl.py +4 -9
scheduler/simulation/engine.py +35 -5
scheduler/simulation/events.py +2 -2

court_scheduler_rl.py CHANGED Viewed

@@ -531,7 +531,6 @@ def get_interactive_config() -> PipelineConfig:
     # Output
     console.print("\n[bold]Output Options[/bold]")
-    output_dir = Prompt.ask("Output directory", default="data/hackathon_run")
     generate_cause_lists = Confirm.ask("Generate daily cause lists?", default=True)
     generate_visualizations = Confirm.ask("Generate performance visualizations?", default=True)
@@ -558,22 +557,18 @@ def interactive():
     console.print(f"  RL Learning Rate: {config.rl_training.learning_rate}")
     console.print(f"  Simulation: {config.sim_days} days")
     console.print(f"  Policies: {', '.join(config.policies)}")
-    console.print(f"  Output: {config.output_dir}")
     if not Confirm.ask("\nProceed with this configuration?", default=True):
         console.print("Cancelled.")
         return
-    # Save configuration
-    config_file = Path(config.output_dir) / "pipeline_config.json"
-    config_file.parent.mkdir(parents=True, exist_ok=True)
-    with open(config_file, 'w') as f:
-        json.dump(asdict(config), f, indent=2)
-    # Execute pipeline
     pipeline = InteractivePipeline(config)
     start_time = time.time()
     pipeline.run()
     elapsed = time.time() - start_time

     # Output
     console.print("\n[bold]Output Options[/bold]")
     generate_cause_lists = Confirm.ask("Generate daily cause lists?", default=True)
     generate_visualizations = Confirm.ask("Generate performance visualizations?", default=True)
     console.print(f"  RL Learning Rate: {config.rl_training.learning_rate}")
     console.print(f"  Simulation: {config.sim_days} days")
     console.print(f"  Policies: {', '.join(config.policies)}")
+    console.print(f"  Output: outputs/runs/run_<timestamp>/")
     if not Confirm.ask("\nProceed with this configuration?", default=True):
         console.print("Cancelled.")
         return
+    # Execute pipeline (OutputManager handles output structure)
     pipeline = InteractivePipeline(config)
     start_time = time.time()
+    console.print(f"\n[dim]Run directory: {pipeline.output.run_dir}[/dim]\n")
     pipeline.run()
     elapsed = time.time() - start_time

scheduler/simulation/engine.py CHANGED Viewed

@@ -44,10 +44,32 @@ class CourtSimConfig:
     seed: int = 42
     courtrooms: int = COURTROOMS
     daily_capacity: int = DEFAULT_DAILY_CAPACITY
-    policy: str = "readiness"  # fifo|age|readiness
     duration_percentile: str = "median"  # median|p90
     log_dir: Path | None = None  # if set, write metrics and suggestions
     write_suggestions: bool = False  # if True, write daily suggestion CSVs (slow)
 @dataclass
@@ -68,7 +90,15 @@ class CourtSim:
         self.cases = cases
         self.calendar = CourtCalendar()
         self.params = load_parameters()
-        self.policy = get_policy(self.cfg.policy)
         random.seed(self.cfg.seed)
         # month working-days cache
         self._month_working_cache: Dict[tuple, int] = {}
@@ -82,9 +112,9 @@ class CourtSim:
             self._log_dir = Path("data") / "sim_runs" / run_id
         self._log_dir.mkdir(parents=True, exist_ok=True)
         self._metrics_path = self._log_dir / "metrics.csv"
-        with self._metrics_path.open("w", newline="") as f:
             w = csv.writer(f)
-            w.writerow(["date", "total_cases", "scheduled", "heard", "adjourned", "disposals", "utilization"])
         # events
         self._events_path = self._log_dir / "events.csv"
         self._events = EventWriter(self._events_path)
@@ -407,7 +437,7 @@ class CourtSim:
         # write metrics row
         total_cases = sum(1 for c in self.cases if c.status != CaseStatus.DISPOSED)
         util = (day_total / capacity_today) if capacity_today else 0.0
-        with self._metrics_path.open("a", newline="") as f:
             w = csv.writer(f)
             w.writerow([current.isoformat(), total_cases, day_total, day_heard, day_total - day_heard, self._disposals, f"{util:.4f}"])
         if sf:

     seed: int = 42
     courtrooms: int = COURTROOMS
     daily_capacity: int = DEFAULT_DAILY_CAPACITY
+    policy: str = "readiness"  # fifo|age|readiness|rl
     duration_percentile: str = "median"  # median|p90
     log_dir: Path | None = None  # if set, write metrics and suggestions
     write_suggestions: bool = False  # if True, write daily suggestion CSVs (slow)
+    rl_agent_path: Path | None = None  # Required if policy="rl"
+    def __post_init__(self):
+        """Validate configuration parameters."""
+        # Validate RL policy requirements
+        if self.policy == "rl":
+            if self.rl_agent_path is None:
+                raise ValueError(
+                    "RL policy requires 'rl_agent_path' parameter. "
+                    "Train an agent first and pass the model file path."
+                )
+            if not isinstance(self.rl_agent_path, Path):
+                self.rl_agent_path = Path(self.rl_agent_path)
+            if not self.rl_agent_path.exists():
+                raise FileNotFoundError(
+                    f"RL agent model not found at {self.rl_agent_path}. "
+                    "Train the agent first or provide correct path."
+                )
+        # Ensure log_dir is Path if provided
+        if self.log_dir is not None and not isinstance(self.log_dir, Path):
+            self.log_dir = Path(self.log_dir)
 @dataclass
         self.cases = cases
         self.calendar = CourtCalendar()
         self.params = load_parameters()
+        # Initialize policy with RL agent path if needed
+        policy_kwargs = {}
+        if self.cfg.policy == "rl":
+            if not self.cfg.rl_agent_path:
+                raise ValueError("RL policy requires rl_agent_path in CourtSimConfig")
+            policy_kwargs["agent_path"] = self.cfg.rl_agent_path
+        self.policy = get_policy(self.cfg.policy, **policy_kwargs)
         random.seed(self.cfg.seed)
         # month working-days cache
         self._month_working_cache: Dict[tuple, int] = {}
             self._log_dir = Path("data") / "sim_runs" / run_id
         self._log_dir.mkdir(parents=True, exist_ok=True)
         self._metrics_path = self._log_dir / "metrics.csv"
+        with self._metrics_path.open("w", newline="", encoding="utf-8") as f:
             w = csv.writer(f)
+            w.writerow(["date", "total_cases", "scheduled", "heard", "adjourned", "disposals", "utilization"])
         # events
         self._events_path = self._log_dir / "events.csv"
         self._events = EventWriter(self._events_path)
         # write metrics row
         total_cases = sum(1 for c in self.cases if c.status != CaseStatus.DISPOSED)
         util = (day_total / capacity_today) if capacity_today else 0.0
+        with self._metrics_path.open("a", newline="", encoding="utf-8") as f:
             w = csv.writer(f)
             w.writerow([current.isoformat(), total_cases, day_total, day_heard, day_total - day_heard, self._disposals, f"{util:.4f}"])
         if sf:

scheduler/simulation/events.py CHANGED Viewed

@@ -25,7 +25,7 @@ class EventWriter:
         self.path.parent.mkdir(parents=True, exist_ok=True)
         self._buffer = []  # in-memory rows to append
         if not self.path.exists():
-            with self.path.open("w", newline="") as f:
                 w = csv.writer(f)
                 w.writerow([
                     "date", "type", "case_id", "case_type", "stage", "courtroom_id",
@@ -57,7 +57,7 @@ class EventWriter:
     def flush(self) -> None:
         if not self._buffer:
             return
-        with self.path.open("a", newline="") as f:
             w = csv.writer(f)
             w.writerows(self._buffer)
         self._buffer.clear()

         self.path.parent.mkdir(parents=True, exist_ok=True)
         self._buffer = []  # in-memory rows to append
         if not self.path.exists():
+            with self.path.open("w", newline="", encoding="utf-8") as f:
                 w = csv.writer(f)
                 w.writerow([
                     "date", "type", "case_id", "case_type", "stage", "courtroom_id",
     def flush(self) -> None:
         if not self._buffer:
             return
+        with self.path.open("a", newline="", encoding="utf-8") as f:
             w = csv.writer(f)
             w.writerows(self._buffer)
         self._buffer.clear()