Spaces:
Running on T4
Running on T4
Claude committed on
Fix hardcoded values in report: dynamic customer count and eval episode labels
Browse files
layer1/training_logger.py
CHANGED
|
@@ -244,7 +244,7 @@ class ReportGenerator:
|
|
| 244 |
bars = ax2.bar(x, eval_rewards, color=["#e74c3c", "#f39c12", "#27ae60"])
|
| 245 |
ax2.set_xticks(list(x))
|
| 246 |
ax2.set_xticklabels([l.split("(")[1].rstrip(")") for l in labels])
|
| 247 |
-
ax2.set_ylabel("Mean Reward (
|
| 248 |
ax2.set_title("Checkpoint Comparison")
|
| 249 |
ax2.grid(True, alpha=0.3, axis="y")
|
| 250 |
|
|
@@ -383,7 +383,7 @@ class ReportGenerator:
|
|
| 383 |
lines.append("")
|
| 384 |
|
| 385 |
# Example conversations
|
| 386 |
-
lines.append("## Example Conversations (
|
| 387 |
lines.append("")
|
| 388 |
customer_letters = "ABCDEFGHIJ"
|
| 389 |
for ci, cust in enumerate(example_conversations):
|
|
|
|
| 244 |
bars = ax2.bar(x, eval_rewards, color=["#e74c3c", "#f39c12", "#27ae60"])
|
| 245 |
ax2.set_xticks(list(x))
|
| 246 |
ax2.set_xticklabels([l.split("(")[1].rstrip(")") for l in labels])
|
| 247 |
+
ax2.set_ylabel(f"Mean Reward ({checkpoint_evals[0].get('num_episodes', '?')}-episode eval)")
|
| 248 |
ax2.set_title("Checkpoint Comparison")
|
| 249 |
ax2.grid(True, alpha=0.3, axis="y")
|
| 250 |
|
|
|
|
| 383 |
lines.append("")
|
| 384 |
|
| 385 |
# Example conversations
|
| 386 |
+
lines.append(f"## Example Conversations ({len(example_conversations)} Customers x {len(checkpoints)} Agents)")
|
| 387 |
lines.append("")
|
| 388 |
customer_letters = "ABCDEFGHIJ"
|
| 389 |
for ci, cust in enumerate(example_conversations):
|