Somuai12 committed on
Commit
dd5366d
·
1 Parent(s): 47a298a

Final Submission: Aligned ports (8000), synchronized README, and purged workspace logs/caches

Browse files
Files changed (8) hide show
  1. README.md +2 -2
  2. run1.json +0 -1
  3. run1_8b.json +0 -1
  4. run2.json +0 -1
  5. run2_8b.json +0 -1
  6. run_final_1.json +0 -1
  7. run_final_2.json +0 -1
  8. test_result.json +0 -31
README.md CHANGED
@@ -3,7 +3,7 @@ title: PolicyEvolverEnv
3
  colorFrom: blue
4
  colorTo: indigo
5
  sdk: docker
6
- app_port: 7860
7
  base_path: /dashboard/
8
  ---
9
  # PolicyEvolverEnv — Multi-Modal Strategic Governance Sandbox
@@ -140,7 +140,7 @@ pip install -r server/requirements.txt
140
  ### 2. Run the Environment API
141
  Start the FastAPI environment server locally:
142
  ```bash
143
- uvicorn server.app:app --port 7860
144
  ```
145
  This boots all core endpoint paths (`/reset`, `/step`, `/state`, `/tasks`, `/grader`, `/health`).
146
 
 
3
  colorFrom: blue
4
  colorTo: indigo
5
  sdk: docker
6
+ app_port: 8000
7
  base_path: /dashboard/
8
  ---
9
  # PolicyEvolverEnv — Multi-Modal Strategic Governance Sandbox
 
140
  ### 2. Run the Environment API
141
  Start the FastAPI environment server locally:
142
  ```bash
143
+ uvicorn server.app:app --port 8000
144
  ```
145
  This boots all core endpoint paths (`/reset`, `/step`, `/state`, `/tasks`, `/grader`, `/health`).
146
 
run1.json DELETED
@@ -1 +0,0 @@
1
- {"baseline_scores": {"overall_avg": 0.815}, "model": "llama-3.3-70b-versatile", "runtime_seconds": 13.21, "detail": [{"task_id": "task_easy", "reward": 0.745, "steps": 5}, {"task_id": "task_medium", "reward": 0.8, "steps": 5}, {"task_id": "task_hard", "reward": 0.9, "steps": 1}]}
 
 
run1_8b.json DELETED
@@ -1 +0,0 @@
1
- {"baseline_scores": {"overall_avg": 0.945}, "model": "llama-3.1-8b-instant", "runtime_seconds": 5.21, "detail": [{"task_id": "task_easy", "reward": 0.935, "steps": 1}, {"task_id": "task_medium", "reward": 1.0, "steps": 1}, {"task_id": "task_hard", "reward": 0.9, "steps": 1}]}
 
 
run2.json DELETED
@@ -1 +0,0 @@
1
- {"baseline_scores": {"overall_avg": 0.8983}, "model": "llama-3.3-70b-versatile", "runtime_seconds": 9.94, "detail": [{"task_id": "task_easy", "reward": 0.795, "steps": 5}, {"task_id": "task_medium", "reward": 1.0, "steps": 1}, {"task_id": "task_hard", "reward": 0.9, "steps": 1}]}
 
 
run2_8b.json DELETED
@@ -1 +0,0 @@
1
- {"baseline_scores": {"overall_avg": 0.945}, "model": "llama-3.1-8b-instant", "runtime_seconds": 3.86, "detail": [{"task_id": "task_easy", "reward": 0.935, "steps": 1}, {"task_id": "task_medium", "reward": 1.0, "steps": 1}, {"task_id": "task_hard", "reward": 0.9, "steps": 1}]}
 
 
run_final_1.json DELETED
@@ -1 +0,0 @@
1
- {"baseline_scores": {"overall_avg": 0.945}, "model": "llama-3.1-8b-instant", "runtime_seconds": 3.81, "detail": [{"task_id": "task_easy", "reward": 0.935, "steps": 1}, {"task_id": "task_medium", "reward": 1.0, "steps": 1}, {"task_id": "task_hard", "reward": 0.9, "steps": 1}]}
 
 
run_final_2.json DELETED
@@ -1 +0,0 @@
1
- {"baseline_scores": {"overall_avg": 0.945}, "model": "llama-3.1-8b-instant", "runtime_seconds": 3.78, "detail": [{"task_id": "task_easy", "reward": 0.935, "steps": 1}, {"task_id": "task_medium", "reward": 1.0, "steps": 1}, {"task_id": "task_hard", "reward": 0.9, "steps": 1}]}
 
 
test_result.json DELETED
@@ -1,31 +0,0 @@
1
- {
2
- "baseline_scores": {
3
- "task_easy": 0.85,
4
- "task_medium": 0.85,
5
- "task_hard": 0.70,
6
- "overall_avg": 0.80
7
- },
8
- "mode": "llm",
9
- "model": "meta-llama/Llama-3.3-70B-Instruct",
10
- "runtime_seconds": 4.36,
11
- "detail": [
12
- {
13
- "task_id": "task_easy",
14
- "reward": 0.85,
15
- "mode": "llm",
16
- "done": false
17
- },
18
- {
19
- "task_id": "task_medium",
20
- "reward": 0.85,
21
- "mode": "llm",
22
- "done": false
23
- },
24
- {
25
- "task_id": "task_hard",
26
- "reward": 0.70,
27
- "mode": "llm",
28
- "done": false
29
- }
30
- ]
31
- }