Update training.py
Browse files- training.py +2 -2
training.py
CHANGED
|
@@ -175,7 +175,7 @@ def supervised_warmup(model, tokenizer, n_examples=500, epochs=2):
|
|
| 175 |
]
|
| 176 |
last_output = random.choice(last_outputs)
|
| 177 |
# Use same prompt structure as build_prompt
|
| 178 |
-
prompt = f"""You are a code review agent.
|
| 179 |
|
| 180 |
Code:
|
| 181 |
{code}
|
|
@@ -292,7 +292,7 @@ def build_prompt(obs, history_lines: List[str]) -> str:
|
|
| 292 |
# Personality hint (optional but helpful)
|
| 293 |
author_personality = getattr(obs, "author_personality", "defensive") # e.g., from env
|
| 294 |
|
| 295 |
-
prompt = f"""You are an AI code review agent. Your goal is to convince a simulated human developer to accept your proposed fix.
|
| 296 |
|
| 297 |
The developer has a **{author_personality}** personality and will only accept if you provide solid evidence:
|
| 298 |
- Tests pass (high pass ratio)
|
|
|
|
| 175 |
]
|
| 176 |
last_output = random.choice(last_outputs)
|
| 177 |
# Use same prompt structure as build_prompt
|
| 178 |
+
prompt = f"""You are a code review agent and name your proposed fix function fix.
|
| 179 |
|
| 180 |
Code:
|
| 181 |
{code}
|
|
|
|
| 292 |
# Personality hint (optional but helpful)
|
| 293 |
author_personality = getattr(obs, "author_personality", "defensive") # e.g., from env
|
| 294 |
|
| 295 |
+
prompt = f"""You are an AI code review agent. Your goal is to convince a simulated human developer to accept your proposed fix and name your proposed fix function fix.
|
| 296 |
|
| 297 |
The developer has a **{author_personality}** personality and will only accept if you provide solid evidence:
|
| 298 |
- Tests pass (high pass ratio)
|