propagate changes
Browse files
- raw_response -> api_output
- remove flow_run_cache
- CF_CodeCriticWrongAttempt.yaml +1 -1
- CF_CodeCriticWrongAttemptWithPlan.yaml +1 -1
- CF_CodeDebug.yaml +3 -2
- CF_CodeDebugCollab.yaml +3 -2
- CF_CodeDebugCollabWithPlan.yaml +3 -2
- CF_CodeDebugCritic.yaml +3 -3
- CF_CodeDebugCriticWithPlan.yaml +3 -3
- CF_CodeWithPlan.yaml +1 -0
- CF_Plan.yaml +1 -0
- CF_PlanCollab.yaml +4 -2
- CF_PlanCollab_Code.yaml +1 -1
- CF_PlanReflect.yaml +3 -1
- CF_PlanReflect_Code.yaml +1 -1
- CF_Plan_Code.yaml +1 -1
- CodeTesting.py +2 -4
- FixedReply_PlanReflect.yaml +1 -1
- LC_CodeCriticWrongAttempt.yaml +1 -1
- LC_CodeCriticWrongAttemptWithPlan.yaml +1 -1
- LC_CodeDebug.yaml +3 -2
- LC_CodeDebugCollab.yaml +3 -2
- LC_CodeDebugCollabWithPlan.yaml +3 -2
- LC_CodeDebugCritic.yaml +3 -3
- LC_CodeDebugCriticWithPlan.yaml +3 -3
- LC_CodeTesting.yaml +1 -1
- LC_CodeWithPlan.yaml +1 -0
- LC_Plan.yaml +1 -0
- LC_PlanCollab.yaml +4 -2
- LC_PlanCollab_Code.yaml +1 -1
- LC_PlanReflect.yaml +3 -1
- LC_Plan_Code.yaml +1 -1
- src/data_transformations/testing_results_summary_generation.py +1 -1
CF_CodeCriticWrongAttempt.yaml
CHANGED
|
@@ -82,6 +82,6 @@ input_keys:
|
|
| 82 |
output_data_transformations:
|
| 83 |
- _target_: flows.data_transformations.KeyRename
|
| 84 |
old_key2new_key:
|
| 85 |
-
|
| 86 |
output_keys:
|
| 87 |
- "code_feedback"
|
|
|
|
| 82 |
output_data_transformations:
|
| 83 |
- _target_: flows.data_transformations.KeyRename
|
| 84 |
old_key2new_key:
|
| 85 |
+
api_output: "code_feedback"
|
| 86 |
output_keys:
|
| 87 |
- "code_feedback"
|
CF_CodeCriticWrongAttemptWithPlan.yaml
CHANGED
|
@@ -89,6 +89,6 @@ input_keys:
|
|
| 89 |
output_data_transformations:
|
| 90 |
- _target_: flows.data_transformations.KeyRename
|
| 91 |
old_key2new_key:
|
| 92 |
-
|
| 93 |
output_keys:
|
| 94 |
- "code_feedback"
|
|
|
|
| 89 |
output_data_transformations:
|
| 90 |
- _target_: flows.data_transformations.KeyRename
|
| 91 |
old_key2new_key:
|
| 92 |
+
api_output: "code_feedback"
|
| 93 |
output_keys:
|
| 94 |
- "code_feedback"
|
CF_CodeDebug.yaml
CHANGED
|
@@ -17,7 +17,7 @@ input_keys:
|
|
| 17 |
output_data_transformations:
|
| 18 |
- _target_: flows.data_transformations.KeyRename
|
| 19 |
old_key2new_key:
|
| 20 |
-
|
| 21 |
output_keys:
|
| 22 |
- "code"
|
| 23 |
|
|
@@ -46,13 +46,14 @@ subflows_config:
|
|
| 46 |
- _target_: flows.data_transformations.RegexFirstOccurrenceExtractor
|
| 47 |
regex: '(?<=```python)([\s\S]*?)(?=```)'
|
| 48 |
regex_fallback: '(?<=```)([\s\S]*?)(?=```)'
|
| 49 |
-
input_key: "
|
| 50 |
output_key: "code"
|
| 51 |
strip: True
|
| 52 |
assert_unique: True
|
| 53 |
|
| 54 |
- _target_: flows.data_transformations.EndOfInteraction
|
| 55 |
end_of_interaction_string: "Final answer"
|
|
|
|
| 56 |
output_key: "end_of_interaction"
|
| 57 |
|
| 58 |
output_keys:
|
|
|
|
| 17 |
output_data_transformations:
|
| 18 |
- _target_: flows.data_transformations.KeyRename
|
| 19 |
old_key2new_key:
|
| 20 |
+
code: "code"
|
| 21 |
output_keys:
|
| 22 |
- "code"
|
| 23 |
|
|
|
|
| 46 |
- _target_: flows.data_transformations.RegexFirstOccurrenceExtractor
|
| 47 |
regex: '(?<=```python)([\s\S]*?)(?=```)'
|
| 48 |
regex_fallback: '(?<=```)([\s\S]*?)(?=```)'
|
| 49 |
+
input_key: "api_output"
|
| 50 |
output_key: "code"
|
| 51 |
strip: True
|
| 52 |
assert_unique: True
|
| 53 |
|
| 54 |
- _target_: flows.data_transformations.EndOfInteraction
|
| 55 |
end_of_interaction_string: "Final answer"
|
| 56 |
+
input_key: "api_output"
|
| 57 |
output_key: "end_of_interaction"
|
| 58 |
|
| 59 |
output_keys:
|
CF_CodeDebugCollab.yaml
CHANGED
|
@@ -17,7 +17,7 @@ input_keys:
|
|
| 17 |
output_data_transformations:
|
| 18 |
- _target_: flows.data_transformations.KeyRename
|
| 19 |
old_key2new_key:
|
| 20 |
-
|
| 21 |
output_keys:
|
| 22 |
- "code"
|
| 23 |
|
|
@@ -51,13 +51,14 @@ subflows_config:
|
|
| 51 |
- _target_: flows.data_transformations.RegexFirstOccurrenceExtractor
|
| 52 |
regex: '(?<=```python)([\s\S]*?)(?=```)'
|
| 53 |
regex_fallback: '(?<=```)([\s\S]*?)(?=```)'
|
| 54 |
-
input_key: "
|
| 55 |
output_key: "code"
|
| 56 |
strip: True
|
| 57 |
assert_unique: True
|
| 58 |
|
| 59 |
- _target_: flows.data_transformations.EndOfInteraction
|
| 60 |
end_of_interaction_string: "Final answer"
|
|
|
|
| 61 |
output_key: "end_of_interaction"
|
| 62 |
|
| 63 |
output_keys:
|
|
|
|
| 17 |
output_data_transformations:
|
| 18 |
- _target_: flows.data_transformations.KeyRename
|
| 19 |
old_key2new_key:
|
| 20 |
+
code: "code"
|
| 21 |
output_keys:
|
| 22 |
- "code"
|
| 23 |
|
|
|
|
| 51 |
- _target_: flows.data_transformations.RegexFirstOccurrenceExtractor
|
| 52 |
regex: '(?<=```python)([\s\S]*?)(?=```)'
|
| 53 |
regex_fallback: '(?<=```)([\s\S]*?)(?=```)'
|
| 54 |
+
input_key: "api_output"
|
| 55 |
output_key: "code"
|
| 56 |
strip: True
|
| 57 |
assert_unique: True
|
| 58 |
|
| 59 |
- _target_: flows.data_transformations.EndOfInteraction
|
| 60 |
end_of_interaction_string: "Final answer"
|
| 61 |
+
input_key: "api_output"
|
| 62 |
output_key: "end_of_interaction"
|
| 63 |
|
| 64 |
output_keys:
|
CF_CodeDebugCollabWithPlan.yaml
CHANGED
|
@@ -18,7 +18,7 @@ input_keys:
|
|
| 18 |
output_data_transformations:
|
| 19 |
- _target_: flows.data_transformations.KeyRename
|
| 20 |
old_key2new_key:
|
| 21 |
-
|
| 22 |
output_keys:
|
| 23 |
- "code"
|
| 24 |
|
|
@@ -52,13 +52,14 @@ subflows_config:
|
|
| 52 |
- _target_: flows.data_transformations.RegexFirstOccurrenceExtractor
|
| 53 |
regex: '(?<=```python)([\s\S]*?)(?=```)'
|
| 54 |
regex_fallback: '(?<=```)([\s\S]*?)(?=```)'
|
| 55 |
-
input_key: "
|
| 56 |
output_key: "code"
|
| 57 |
strip: True
|
| 58 |
assert_unique: True
|
| 59 |
|
| 60 |
- _target_: flows.data_transformations.EndOfInteraction
|
| 61 |
end_of_interaction_string: "Final answer"
|
|
|
|
| 62 |
output_key: "end_of_interaction"
|
| 63 |
|
| 64 |
output_keys:
|
|
|
|
| 18 |
output_data_transformations:
|
| 19 |
- _target_: flows.data_transformations.KeyRename
|
| 20 |
old_key2new_key:
|
| 21 |
+
code: "code"
|
| 22 |
output_keys:
|
| 23 |
- "code"
|
| 24 |
|
|
|
|
| 52 |
- _target_: flows.data_transformations.RegexFirstOccurrenceExtractor
|
| 53 |
regex: '(?<=```python)([\s\S]*?)(?=```)'
|
| 54 |
regex_fallback: '(?<=```)([\s\S]*?)(?=```)'
|
| 55 |
+
input_key: "api_output"
|
| 56 |
output_key: "code"
|
| 57 |
strip: True
|
| 58 |
assert_unique: True
|
| 59 |
|
| 60 |
- _target_: flows.data_transformations.EndOfInteraction
|
| 61 |
end_of_interaction_string: "Final answer"
|
| 62 |
+
input_key: "api_output"
|
| 63 |
output_key: "end_of_interaction"
|
| 64 |
|
| 65 |
output_keys:
|
CF_CodeDebugCritic.yaml
CHANGED
|
@@ -15,9 +15,9 @@ input_keys:
|
|
| 15 |
output_data_transformations:
|
| 16 |
- _target_: flows.data_transformations.KeyRename
|
| 17 |
old_key2new_key:
|
| 18 |
-
|
| 19 |
-
|
| 20 |
-
|
| 21 |
output_keys:
|
| 22 |
- "testing_results_summary"
|
| 23 |
- "all_tests_passed"
|
|
|
|
| 15 |
output_data_transformations:
|
| 16 |
- _target_: flows.data_transformations.KeyRename
|
| 17 |
old_key2new_key:
|
| 18 |
+
testing_results_summary: "testing_results_summary"
|
| 19 |
+
all_tests_passed: "all_tests_passed"
|
| 20 |
+
code_feedback: "code_feedback"
|
| 21 |
output_keys:
|
| 22 |
- "testing_results_summary"
|
| 23 |
- "all_tests_passed"
|
CF_CodeDebugCriticWithPlan.yaml
CHANGED
|
@@ -16,9 +16,9 @@ input_keys:
|
|
| 16 |
output_data_transformations:
|
| 17 |
- _target_: flows.data_transformations.KeyRename
|
| 18 |
old_key2new_key:
|
| 19 |
-
|
| 20 |
-
|
| 21 |
-
|
| 22 |
output_keys:
|
| 23 |
- "testing_results_summary"
|
| 24 |
- "all_tests_passed"
|
|
|
|
| 16 |
output_data_transformations:
|
| 17 |
- _target_: flows.data_transformations.KeyRename
|
| 18 |
old_key2new_key:
|
| 19 |
+
testing_results_summary: "testing_results_summary"
|
| 20 |
+
all_tests_passed: "all_tests_passed"
|
| 21 |
+
code_feedback: "code_feedback"
|
| 22 |
output_keys:
|
| 23 |
- "testing_results_summary"
|
| 24 |
- "all_tests_passed"
|
CF_CodeWithPlan.yaml
CHANGED
|
@@ -82,6 +82,7 @@ output_data_transformations:
|
|
| 82 |
- _target_: flows.data_transformations.RegexFirstOccurrenceExtractor
|
| 83 |
regex: '(?<=```python)([\s\S]*?)(?=```)'
|
| 84 |
regex_fallback: '(?<=```)([\s\S]*?)(?=```)'
|
|
|
|
| 85 |
output_key: "code"
|
| 86 |
strip: True
|
| 87 |
assert_unique: True
|
|
|
|
| 82 |
- _target_: flows.data_transformations.RegexFirstOccurrenceExtractor
|
| 83 |
regex: '(?<=```python)([\s\S]*?)(?=```)'
|
| 84 |
regex_fallback: '(?<=```)([\s\S]*?)(?=```)'
|
| 85 |
+
input_key: "api_output"
|
| 86 |
output_key: "code"
|
| 87 |
strip: True
|
| 88 |
assert_unique: True
|
CF_Plan.yaml
CHANGED
|
@@ -24,6 +24,7 @@ output_data_transformations:
|
|
| 24 |
regex: '(?<=Conceptual solution)([\s\S]*?)(?=\n\n# [A-Z]|\Z)'
|
| 25 |
regex_fallback:
|
| 26 |
- '(?<=Conceptual solution:)([\s\S]*?)(?=\n\n# [A-Z]|\Z)'
|
|
|
|
| 27 |
output_key: "plan"
|
| 28 |
strip: True
|
| 29 |
assert_unique: True
|
|
|
|
| 24 |
regex: '(?<=Conceptual solution)([\s\S]*?)(?=\n\n# [A-Z]|\Z)'
|
| 25 |
regex_fallback:
|
| 26 |
- '(?<=Conceptual solution:)([\s\S]*?)(?=\n\n# [A-Z]|\Z)'
|
| 27 |
+
input_key: "api_output"
|
| 28 |
output_key: "plan"
|
| 29 |
strip: True
|
| 30 |
assert_unique: True
|
CF_PlanCollab.yaml
CHANGED
|
@@ -16,7 +16,7 @@ input_keys:
|
|
| 16 |
output_data_transformations:
|
| 17 |
- _target_: flows.data_transformations.KeyRename
|
| 18 |
old_key2new_key:
|
| 19 |
-
|
| 20 |
output_keys:
|
| 21 |
- "plan"
|
| 22 |
|
|
@@ -48,12 +48,14 @@ subflows_config:
|
|
| 48 |
regex: '(?<=Conceptual solution)([\s\S]*?)(?=\n\n# [A-Z]|\Z)'
|
| 49 |
regex_fallback:
|
| 50 |
- '(?<=Conceptual solution:)([\s\S]*?)(?=\n\n# [A-Z]|\Z)'
|
|
|
|
| 51 |
output_key: "plan"
|
| 52 |
strip: True
|
| 53 |
assert_unique: True
|
| 54 |
|
| 55 |
- _target_: flows.data_transformations.EndOfInteraction
|
| 56 |
end_of_interaction_string: "Final answer"
|
|
|
|
| 57 |
output_key: "end_of_interaction"
|
| 58 |
|
| 59 |
output_keys:
|
|
@@ -65,4 +67,4 @@ subflows_config:
|
|
| 65 |
output_data_transformations:
|
| 66 |
- _target_: flows.data_transformations.KeyRename
|
| 67 |
old_key2new_key:
|
| 68 |
-
|
|
|
|
| 16 |
output_data_transformations:
|
| 17 |
- _target_: flows.data_transformations.KeyRename
|
| 18 |
old_key2new_key:
|
| 19 |
+
plan: "plan"
|
| 20 |
output_keys:
|
| 21 |
- "plan"
|
| 22 |
|
|
|
|
| 48 |
regex: '(?<=Conceptual solution)([\s\S]*?)(?=\n\n# [A-Z]|\Z)'
|
| 49 |
regex_fallback:
|
| 50 |
- '(?<=Conceptual solution:)([\s\S]*?)(?=\n\n# [A-Z]|\Z)'
|
| 51 |
+
input_key: "api_output"
|
| 52 |
output_key: "plan"
|
| 53 |
strip: True
|
| 54 |
assert_unique: True
|
| 55 |
|
| 56 |
- _target_: flows.data_transformations.EndOfInteraction
|
| 57 |
end_of_interaction_string: "Final answer"
|
| 58 |
+
input_key: "api_output"
|
| 59 |
output_key: "end_of_interaction"
|
| 60 |
|
| 61 |
output_keys:
|
|
|
|
| 67 |
output_data_transformations:
|
| 68 |
- _target_: flows.data_transformations.KeyRename
|
| 69 |
old_key2new_key:
|
| 70 |
+
api_output: "plan_feedback"
|
CF_PlanCollab_Code.yaml
CHANGED
|
@@ -13,7 +13,7 @@ input_keys:
|
|
| 13 |
output_data_transformations:
|
| 14 |
- _target_: flows.data_transformations.KeyRename
|
| 15 |
old_key2new_key:
|
| 16 |
-
|
| 17 |
output_keys:
|
| 18 |
- "code"
|
| 19 |
|
|
|
|
| 13 |
output_data_transformations:
|
| 14 |
- _target_: flows.data_transformations.KeyRename
|
| 15 |
old_key2new_key:
|
| 16 |
+
code: "code"
|
| 17 |
output_keys:
|
| 18 |
- "code"
|
| 19 |
|
CF_PlanReflect.yaml
CHANGED
|
@@ -16,7 +16,7 @@ input_keys:
|
|
| 16 |
output_data_transformations:
|
| 17 |
- _target_: flows.data_transformations.KeyRename
|
| 18 |
old_key2new_key:
|
| 19 |
-
|
| 20 |
output_keys:
|
| 21 |
- "plan"
|
| 22 |
|
|
@@ -34,12 +34,14 @@ subflows_config:
|
|
| 34 |
regex: '(?<=Conceptual solution)([\s\S]*?)(?=\n\n# [A-Z]|\Z)'
|
| 35 |
regex_fallback:
|
| 36 |
- '(?<=Conceptual solution:)([\s\S]*?)(?=\n\n# [A-Z]|\Z)'
|
|
|
|
| 37 |
output_key: "plan"
|
| 38 |
strip: True
|
| 39 |
assert_unique: True
|
| 40 |
|
| 41 |
- _target_: flows.data_transformations.EndOfInteraction
|
| 42 |
end_of_interaction_string: "Final answer"
|
|
|
|
| 43 |
output_key: "end_of_interaction"
|
| 44 |
|
| 45 |
output_keys:
|
|
|
|
| 16 |
output_data_transformations:
|
| 17 |
- _target_: flows.data_transformations.KeyRename
|
| 18 |
old_key2new_key:
|
| 19 |
+
plan: "plan"
|
| 20 |
output_keys:
|
| 21 |
- "plan"
|
| 22 |
|
|
|
|
| 34 |
regex: '(?<=Conceptual solution)([\s\S]*?)(?=\n\n# [A-Z]|\Z)'
|
| 35 |
regex_fallback:
|
| 36 |
- '(?<=Conceptual solution:)([\s\S]*?)(?=\n\n# [A-Z]|\Z)'
|
| 37 |
+
input_key: "api_output"
|
| 38 |
output_key: "plan"
|
| 39 |
strip: True
|
| 40 |
assert_unique: True
|
| 41 |
|
| 42 |
- _target_: flows.data_transformations.EndOfInteraction
|
| 43 |
end_of_interaction_string: "Final answer"
|
| 44 |
+
input_key: "api_output"
|
| 45 |
output_key: "end_of_interaction"
|
| 46 |
|
| 47 |
output_keys:
|
CF_PlanReflect_Code.yaml
CHANGED
|
@@ -13,7 +13,7 @@ input_keys:
|
|
| 13 |
output_data_transformations:
|
| 14 |
- _target_: flows.data_transformations.KeyRename
|
| 15 |
old_key2new_key:
|
| 16 |
-
|
| 17 |
output_keys:
|
| 18 |
- "code"
|
| 19 |
|
|
|
|
| 13 |
output_data_transformations:
|
| 14 |
- _target_: flows.data_transformations.KeyRename
|
| 15 |
old_key2new_key:
|
| 16 |
+
code: "code"
|
| 17 |
output_keys:
|
| 18 |
- "code"
|
| 19 |
|
CF_Plan_Code.yaml
CHANGED
|
@@ -13,7 +13,7 @@ input_keys:
|
|
| 13 |
output_data_transformations:
|
| 14 |
- _target_: flows.data_transformations.KeyRename
|
| 15 |
old_key2new_key:
|
| 16 |
-
|
| 17 |
output_keys:
|
| 18 |
- "code"
|
| 19 |
|
|
|
|
| 13 |
output_data_transformations:
|
| 14 |
- _target_: flows.data_transformations.KeyRename
|
| 15 |
old_key2new_key:
|
| 16 |
+
code: "code"
|
| 17 |
output_keys:
|
| 18 |
- "code"
|
| 19 |
|
CodeTesting.py
CHANGED
|
@@ -33,14 +33,12 @@ class CodeTesting(AtomicFlow):
|
|
| 33 |
return cls(**kwargs)
|
| 34 |
|
| 35 |
def run(self,
|
| 36 |
-
input_data: Dict[str, Any],
|
| 37 |
-
private_keys: Optional[List[str]] = [],
|
| 38 |
-
keys_to_ignore_for_hash: Optional[List[str]] = []) -> Dict[str, Any]:
|
| 39 |
|
| 40 |
# ~~~ Retrieve the test data ~~~
|
| 41 |
test_data = self._get_test_data(input_data)
|
| 42 |
|
| 43 |
# ~~~ Run tests ~~~
|
| 44 |
-
response = self._run_tests(input_data, test_data)
|
| 45 |
|
| 46 |
return response
|
|
|
|
| 33 |
return cls(**kwargs)
|
| 34 |
|
| 35 |
def run(self,
|
| 36 |
+
input_data: Dict[str, Any]) -> Dict[str, Any]:
|
|
|
|
|
|
|
| 37 |
|
| 38 |
# ~~~ Retrieve the test data ~~~
|
| 39 |
test_data = self._get_test_data(input_data)
|
| 40 |
|
| 41 |
# ~~~ Run tests ~~~
|
| 42 |
+
response: Dict[str, Any] = self._run_tests(input_data, test_data)
|
| 43 |
|
| 44 |
return response
|
FixedReply_PlanReflect.yaml
CHANGED
|
@@ -8,7 +8,7 @@ input_keys: []
|
|
| 8 |
output_data_transformations:
|
| 9 |
- _target_: flows.data_transformations.KeyRename
|
| 10 |
old_key2new_key:
|
| 11 |
-
|
| 12 |
output_keys:
|
| 13 |
- "plan_reflect_message"
|
| 14 |
|
|
|
|
| 8 |
output_data_transformations:
|
| 9 |
- _target_: flows.data_transformations.KeyRename
|
| 10 |
old_key2new_key:
|
| 11 |
+
fixed_reply: "plan_reflect_message"
|
| 12 |
output_keys:
|
| 13 |
- "plan_reflect_message"
|
| 14 |
|
LC_CodeCriticWrongAttempt.yaml
CHANGED
|
@@ -83,6 +83,6 @@ input_keys:
|
|
| 83 |
output_data_transformations:
|
| 84 |
- _target_: flows.data_transformations.KeyRename
|
| 85 |
old_key2new_key:
|
| 86 |
-
|
| 87 |
output_keys:
|
| 88 |
- "code_feedback"
|
|
|
|
| 83 |
output_data_transformations:
|
| 84 |
- _target_: flows.data_transformations.KeyRename
|
| 85 |
old_key2new_key:
|
| 86 |
+
api_output: "code_feedback"
|
| 87 |
output_keys:
|
| 88 |
- "code_feedback"
|
LC_CodeCriticWrongAttemptWithPlan.yaml
CHANGED
|
@@ -91,6 +91,6 @@ input_keys:
|
|
| 91 |
output_data_transformations:
|
| 92 |
- _target_: flows.data_transformations.KeyRename
|
| 93 |
old_key2new_key:
|
| 94 |
-
|
| 95 |
output_keys:
|
| 96 |
- "code_feedback"
|
|
|
|
| 91 |
output_data_transformations:
|
| 92 |
- _target_: flows.data_transformations.KeyRename
|
| 93 |
old_key2new_key:
|
| 94 |
+
api_output: "code_feedback"
|
| 95 |
output_keys:
|
| 96 |
- "code_feedback"
|
LC_CodeDebug.yaml
CHANGED
|
@@ -17,7 +17,7 @@ input_keys:
|
|
| 17 |
output_data_transformations:
|
| 18 |
- _target_: flows.data_transformations.KeyRename
|
| 19 |
old_key2new_key:
|
| 20 |
-
|
| 21 |
output_keys:
|
| 22 |
- "code"
|
| 23 |
|
|
@@ -46,13 +46,14 @@ subflows_config:
|
|
| 46 |
- _target_: flows.data_transformations.RegexFirstOccurrenceExtractor
|
| 47 |
regex: '(?<=```python)([\s\S]*?)(?=```)'
|
| 48 |
regex_fallback: '(?<=```)([\s\S]*?)(?=```)'
|
| 49 |
-
input_key: "
|
| 50 |
output_key: "code"
|
| 51 |
strip: True
|
| 52 |
assert_unique: True
|
| 53 |
|
| 54 |
- _target_: flows.data_transformations.EndOfInteraction
|
| 55 |
end_of_interaction_string: "Final answer"
|
|
|
|
| 56 |
output_key: "end_of_interaction"
|
| 57 |
|
| 58 |
output_keys:
|
|
|
|
| 17 |
output_data_transformations:
|
| 18 |
- _target_: flows.data_transformations.KeyRename
|
| 19 |
old_key2new_key:
|
| 20 |
+
code: "code"
|
| 21 |
output_keys:
|
| 22 |
- "code"
|
| 23 |
|
|
|
|
| 46 |
- _target_: flows.data_transformations.RegexFirstOccurrenceExtractor
|
| 47 |
regex: '(?<=```python)([\s\S]*?)(?=```)'
|
| 48 |
regex_fallback: '(?<=```)([\s\S]*?)(?=```)'
|
| 49 |
+
input_key: "api_output"
|
| 50 |
output_key: "code"
|
| 51 |
strip: True
|
| 52 |
assert_unique: True
|
| 53 |
|
| 54 |
- _target_: flows.data_transformations.EndOfInteraction
|
| 55 |
end_of_interaction_string: "Final answer"
|
| 56 |
+
input_key: "api_output"
|
| 57 |
output_key: "end_of_interaction"
|
| 58 |
|
| 59 |
output_keys:
|
LC_CodeDebugCollab.yaml
CHANGED
|
@@ -17,7 +17,7 @@ input_keys:
|
|
| 17 |
output_data_transformations:
|
| 18 |
- _target_: flows.data_transformations.KeyRename
|
| 19 |
old_key2new_key:
|
| 20 |
-
|
| 21 |
output_keys:
|
| 22 |
- "code"
|
| 23 |
|
|
@@ -51,13 +51,14 @@ subflows_config:
|
|
| 51 |
- _target_: flows.data_transformations.RegexFirstOccurrenceExtractor
|
| 52 |
regex: '(?<=```python)([\s\S]*?)(?=```)'
|
| 53 |
regex_fallback: '(?<=```)([\s\S]*?)(?=```)'
|
| 54 |
-
input_key: "
|
| 55 |
output_key: "code"
|
| 56 |
strip: True
|
| 57 |
assert_unique: True
|
| 58 |
|
| 59 |
- _target_: flows.data_transformations.EndOfInteraction
|
| 60 |
end_of_interaction_string: "Final answer"
|
|
|
|
| 61 |
output_key: "end_of_interaction"
|
| 62 |
|
| 63 |
output_keys:
|
|
|
|
| 17 |
output_data_transformations:
|
| 18 |
- _target_: flows.data_transformations.KeyRename
|
| 19 |
old_key2new_key:
|
| 20 |
+
code: "code"
|
| 21 |
output_keys:
|
| 22 |
- "code"
|
| 23 |
|
|
|
|
| 51 |
- _target_: flows.data_transformations.RegexFirstOccurrenceExtractor
|
| 52 |
regex: '(?<=```python)([\s\S]*?)(?=```)'
|
| 53 |
regex_fallback: '(?<=```)([\s\S]*?)(?=```)'
|
| 54 |
+
input_key: "api_output"
|
| 55 |
output_key: "code"
|
| 56 |
strip: True
|
| 57 |
assert_unique: True
|
| 58 |
|
| 59 |
- _target_: flows.data_transformations.EndOfInteraction
|
| 60 |
end_of_interaction_string: "Final answer"
|
| 61 |
+
input_key: "api_output"
|
| 62 |
output_key: "end_of_interaction"
|
| 63 |
|
| 64 |
output_keys:
|
LC_CodeDebugCollabWithPlan.yaml
CHANGED
|
@@ -18,7 +18,7 @@ input_keys:
|
|
| 18 |
output_data_transformations:
|
| 19 |
- _target_: flows.data_transformations.KeyRename
|
| 20 |
old_key2new_key:
|
| 21 |
-
|
| 22 |
output_keys:
|
| 23 |
- "code"
|
| 24 |
|
|
@@ -52,13 +52,14 @@ subflows_config:
|
|
| 52 |
- _target_: flows.data_transformations.RegexFirstOccurrenceExtractor
|
| 53 |
regex: '(?<=```python)([\s\S]*?)(?=```)'
|
| 54 |
regex_fallback: '(?<=```)([\s\S]*?)(?=```)'
|
| 55 |
-
input_key: "
|
| 56 |
output_key: "code"
|
| 57 |
strip: True
|
| 58 |
assert_unique: True
|
| 59 |
|
| 60 |
- _target_: flows.data_transformations.EndOfInteraction
|
| 61 |
end_of_interaction_string: "Final answer"
|
|
|
|
| 62 |
output_key: "end_of_interaction"
|
| 63 |
|
| 64 |
output_keys:
|
|
|
|
| 18 |
output_data_transformations:
|
| 19 |
- _target_: flows.data_transformations.KeyRename
|
| 20 |
old_key2new_key:
|
| 21 |
+
code: "code"
|
| 22 |
output_keys:
|
| 23 |
- "code"
|
| 24 |
|
|
|
|
| 52 |
- _target_: flows.data_transformations.RegexFirstOccurrenceExtractor
|
| 53 |
regex: '(?<=```python)([\s\S]*?)(?=```)'
|
| 54 |
regex_fallback: '(?<=```)([\s\S]*?)(?=```)'
|
| 55 |
+
input_key: "api_output"
|
| 56 |
output_key: "code"
|
| 57 |
strip: True
|
| 58 |
assert_unique: True
|
| 59 |
|
| 60 |
- _target_: flows.data_transformations.EndOfInteraction
|
| 61 |
end_of_interaction_string: "Final answer"
|
| 62 |
+
input_key: "api_output"
|
| 63 |
output_key: "end_of_interaction"
|
| 64 |
|
| 65 |
output_keys:
|
LC_CodeDebugCritic.yaml
CHANGED
|
@@ -15,9 +15,9 @@ input_keys:
|
|
| 15 |
output_data_transformations:
|
| 16 |
- _target_: flows.data_transformations.KeyRename
|
| 17 |
old_key2new_key:
|
| 18 |
-
|
| 19 |
-
|
| 20 |
-
|
| 21 |
output_keys:
|
| 22 |
- "testing_results_summary"
|
| 23 |
- "all_tests_passed"
|
|
|
|
| 15 |
output_data_transformations:
|
| 16 |
- _target_: flows.data_transformations.KeyRename
|
| 17 |
old_key2new_key:
|
| 18 |
+
testing_results_summary: "testing_results_summary"
|
| 19 |
+
all_tests_passed: "all_tests_passed"
|
| 20 |
+
code_feedback: "code_feedback"
|
| 21 |
output_keys:
|
| 22 |
- "testing_results_summary"
|
| 23 |
- "all_tests_passed"
|
LC_CodeDebugCriticWithPlan.yaml
CHANGED
|
@@ -16,9 +16,9 @@ input_keys:
|
|
| 16 |
output_data_transformations:
|
| 17 |
- _target_: flows.data_transformations.KeyRename
|
| 18 |
old_key2new_key:
|
| 19 |
-
|
| 20 |
-
|
| 21 |
-
|
| 22 |
output_keys:
|
| 23 |
- "testing_results_summary"
|
| 24 |
- "all_tests_passed"
|
|
|
|
| 16 |
output_data_transformations:
|
| 17 |
- _target_: flows.data_transformations.KeyRename
|
| 18 |
old_key2new_key:
|
| 19 |
+
testing_results_summary: "testing_results_summary"
|
| 20 |
+
all_tests_passed: "all_tests_passed"
|
| 21 |
+
code_feedback: "code_feedback"
|
| 22 |
output_keys:
|
| 23 |
- "testing_results_summary"
|
| 24 |
- "all_tests_passed"
|
LC_CodeTesting.yaml
CHANGED
|
@@ -12,7 +12,7 @@ output_keys:
|
|
| 12 |
- "testing_results_summary"
|
| 13 |
output_data_transformations:
|
| 14 |
- _target_: .src.data_transformations.CorrectnessFlag
|
| 15 |
-
input_key: "
|
| 16 |
output_key: "all_tests_passed"
|
| 17 |
- _target_: .src.data_transformations.TestingResultsSummaryGeneration
|
| 18 |
output_key: "testing_results_summary"
|
|
|
|
| 12 |
- "testing_results_summary"
|
| 13 |
output_data_transformations:
|
| 14 |
- _target_: .src.data_transformations.CorrectnessFlag
|
| 15 |
+
input_key: "public_tests_results"
|
| 16 |
output_key: "all_tests_passed"
|
| 17 |
- _target_: .src.data_transformations.TestingResultsSummaryGeneration
|
| 18 |
output_key: "testing_results_summary"
|
LC_CodeWithPlan.yaml
CHANGED
|
@@ -83,6 +83,7 @@ output_data_transformations:
|
|
| 83 |
- _target_: flows.data_transformations.RegexFirstOccurrenceExtractor
|
| 84 |
regex: '(?<=```python)([\s\S]*?)(?=```)'
|
| 85 |
regex_fallback: '(?<=```)([\s\S]*?)(?=```)'
|
|
|
|
| 86 |
output_key: "code"
|
| 87 |
strip: True
|
| 88 |
assert_unique: True
|
|
|
|
| 83 |
- _target_: flows.data_transformations.RegexFirstOccurrenceExtractor
|
| 84 |
regex: '(?<=```python)([\s\S]*?)(?=```)'
|
| 85 |
regex_fallback: '(?<=```)([\s\S]*?)(?=```)'
|
| 86 |
+
input_key: "api_output"
|
| 87 |
output_key: "code"
|
| 88 |
strip: True
|
| 89 |
assert_unique: True
|
LC_Plan.yaml
CHANGED
|
@@ -23,6 +23,7 @@ output_data_transformations:
|
|
| 23 |
regex: '(?<=Conceptual solution)([\s\S]*?)(?=\n\n# [A-Z]|\Z)'
|
| 24 |
regex_fallback:
|
| 25 |
- '(?<=Conceptual solution:)([\s\S]*?)(?=\n\n# [A-Z]|\Z)'
|
|
|
|
| 26 |
output_key: "plan"
|
| 27 |
strip: True
|
| 28 |
assert_unique: True
|
|
|
|
| 23 |
regex: '(?<=Conceptual solution)([\s\S]*?)(?=\n\n# [A-Z]|\Z)'
|
| 24 |
regex_fallback:
|
| 25 |
- '(?<=Conceptual solution:)([\s\S]*?)(?=\n\n# [A-Z]|\Z)'
|
| 26 |
+
input_key: "api_output"
|
| 27 |
output_key: "plan"
|
| 28 |
strip: True
|
| 29 |
assert_unique: True
|
LC_PlanCollab.yaml
CHANGED
|
@@ -16,7 +16,7 @@ input_keys:
|
|
| 16 |
output_data_transformations:
|
| 17 |
- _target_: flows.data_transformations.KeyRename
|
| 18 |
old_key2new_key:
|
| 19 |
-
|
| 20 |
output_keys:
|
| 21 |
- "plan"
|
| 22 |
|
|
@@ -48,12 +48,14 @@ subflows_config:
|
|
| 48 |
regex: '(?<=Conceptual solution)([\s\S]*?)(?=\n\n# [A-Z]|\Z)'
|
| 49 |
regex_fallback:
|
| 50 |
- '(?<=Conceptual solution:)([\s\S]*?)(?=\n\n# [A-Z]|\Z)'
|
|
|
|
| 51 |
output_key: "plan"
|
| 52 |
strip: True
|
| 53 |
assert_unique: True
|
| 54 |
|
| 55 |
- _target_: flows.data_transformations.EndOfInteraction
|
| 56 |
end_of_interaction_string: "Final answer"
|
|
|
|
| 57 |
output_key: "end_of_interaction"
|
| 58 |
|
| 59 |
output_keys:
|
|
@@ -65,4 +67,4 @@ subflows_config:
|
|
| 65 |
output_data_transformations:
|
| 66 |
- _target_: flows.data_transformations.KeyRename
|
| 67 |
old_key2new_key:
|
| 68 |
-
|
|
|
|
| 16 |
output_data_transformations:
|
| 17 |
- _target_: flows.data_transformations.KeyRename
|
| 18 |
old_key2new_key:
|
| 19 |
+
plan: "plan"
|
| 20 |
output_keys:
|
| 21 |
- "plan"
|
| 22 |
|
|
|
|
| 48 |
regex: '(?<=Conceptual solution)([\s\S]*?)(?=\n\n# [A-Z]|\Z)'
|
| 49 |
regex_fallback:
|
| 50 |
- '(?<=Conceptual solution:)([\s\S]*?)(?=\n\n# [A-Z]|\Z)'
|
| 51 |
+
input_key: "api_output"
|
| 52 |
output_key: "plan"
|
| 53 |
strip: True
|
| 54 |
assert_unique: True
|
| 55 |
|
| 56 |
- _target_: flows.data_transformations.EndOfInteraction
|
| 57 |
end_of_interaction_string: "Final answer"
|
| 58 |
+
input_key: "api_output"
|
| 59 |
output_key: "end_of_interaction"
|
| 60 |
|
| 61 |
output_keys:
|
|
|
|
| 67 |
output_data_transformations:
|
| 68 |
- _target_: flows.data_transformations.KeyRename
|
| 69 |
old_key2new_key:
|
| 70 |
+
api_output: "plan_feedback"
|
LC_PlanCollab_Code.yaml
CHANGED
|
@@ -13,7 +13,7 @@ input_keys:
|
|
| 13 |
output_data_transformations:
|
| 14 |
- _target_: flows.data_transformations.KeyRename
|
| 15 |
old_key2new_key:
|
| 16 |
-
|
| 17 |
output_keys:
|
| 18 |
- "code"
|
| 19 |
|
|
|
|
| 13 |
output_data_transformations:
|
| 14 |
- _target_: flows.data_transformations.KeyRename
|
| 15 |
old_key2new_key:
|
| 16 |
+
code: "code"
|
| 17 |
output_keys:
|
| 18 |
- "code"
|
| 19 |
|
LC_PlanReflect.yaml
CHANGED
|
@@ -15,7 +15,7 @@ input_keys:
|
|
| 15 |
output_data_transformations:
|
| 16 |
- _target_: flows.data_transformations.KeyRename
|
| 17 |
old_key2new_key:
|
| 18 |
-
|
| 19 |
output_keys:
|
| 20 |
- "plan"
|
| 21 |
|
|
@@ -33,12 +33,14 @@ subflows_config:
|
|
| 33 |
regex: '(?<=Conceptual solution)([\s\S]*?)(?=\n\n# [A-Z]|\Z)'
|
| 34 |
regex_fallback:
|
| 35 |
- '(?<=Conceptual solution:)([\s\S]*?)(?=\n\n# [A-Z]|\Z)'
|
|
|
|
| 36 |
output_key: "plan"
|
| 37 |
strip: True
|
| 38 |
assert_unique: True
|
| 39 |
|
| 40 |
- _target_: flows.data_transformations.EndOfInteraction
|
| 41 |
end_of_interaction_string: "Final answer"
|
|
|
|
| 42 |
output_key: "end_of_interaction"
|
| 43 |
|
| 44 |
output_keys:
|
|
|
|
| 15 |
output_data_transformations:
|
| 16 |
- _target_: flows.data_transformations.KeyRename
|
| 17 |
old_key2new_key:
|
| 18 |
+
plan: "plan"
|
| 19 |
output_keys:
|
| 20 |
- "plan"
|
| 21 |
|
|
|
|
| 33 |
regex: '(?<=Conceptual solution)([\s\S]*?)(?=\n\n# [A-Z]|\Z)'
|
| 34 |
regex_fallback:
|
| 35 |
- '(?<=Conceptual solution:)([\s\S]*?)(?=\n\n# [A-Z]|\Z)'
|
| 36 |
+
input_key: "api_output"
|
| 37 |
output_key: "plan"
|
| 38 |
strip: True
|
| 39 |
assert_unique: True
|
| 40 |
|
| 41 |
- _target_: flows.data_transformations.EndOfInteraction
|
| 42 |
end_of_interaction_string: "Final answer"
|
| 43 |
+
input_key: "api_output"
|
| 44 |
output_key: "end_of_interaction"
|
| 45 |
|
| 46 |
output_keys:
|
LC_Plan_Code.yaml
CHANGED
|
@@ -13,7 +13,7 @@ input_keys:
|
|
| 13 |
output_data_transformations:
|
| 14 |
- _target_: flows.data_transformations.KeyRename
|
| 15 |
old_key2new_key:
|
| 16 |
-
|
| 17 |
output_keys:
|
| 18 |
- "code"
|
| 19 |
|
|
|
|
| 13 |
output_data_transformations:
|
| 14 |
- _target_: flows.data_transformations.KeyRename
|
| 15 |
old_key2new_key:
|
| 16 |
+
code: "code"
|
| 17 |
output_keys:
|
| 18 |
- "code"
|
| 19 |
|
src/data_transformations/testing_results_summary_generation.py
CHANGED
|
@@ -17,7 +17,7 @@ class TestingResultsSummaryGeneration(DataTransformation):
|
|
| 17 |
data_dict[self.output_key] = self.params["no_error_template"]
|
| 18 |
return data_dict
|
| 19 |
|
| 20 |
-
test_data = unflatten_dict(data_dict)
|
| 21 |
|
| 22 |
if not test_data["compilation_status"]:
|
| 23 |
# compilation error occurred
|
|
|
|
| 17 |
data_dict[self.output_key] = self.params["no_error_template"]
|
| 18 |
return data_dict
|
| 19 |
|
| 20 |
+
test_data = unflatten_dict(data_dict)
|
| 21 |
|
| 22 |
if not test_data["compilation_status"]:
|
| 23 |
# compilation error occurred
|