yeeef committed on
Commit
ae49f4f
1 Parent(s): dca49e6

propagate changes

Browse files

- raw_response -> api_output
- remove flow_run_cache

CF_CodeCriticWrongAttempt.yaml CHANGED
@@ -82,6 +82,6 @@ input_keys:
82
  output_data_transformations:
83
  - _target_: flows.data_transformations.KeyRename
84
  old_key2new_key:
85
- raw_response: "code_feedback"
86
  output_keys:
87
  - "code_feedback"
 
82
  output_data_transformations:
83
  - _target_: flows.data_transformations.KeyRename
84
  old_key2new_key:
85
+ api_output: "code_feedback"
86
  output_keys:
87
  - "code_feedback"
CF_CodeCriticWrongAttemptWithPlan.yaml CHANGED
@@ -89,6 +89,6 @@ input_keys:
89
  output_data_transformations:
90
  - _target_: flows.data_transformations.KeyRename
91
  old_key2new_key:
92
- raw_response: "code_feedback"
93
  output_keys:
94
  - "code_feedback"
 
89
  output_data_transformations:
90
  - _target_: flows.data_transformations.KeyRename
91
  old_key2new_key:
92
+ api_output: "code_feedback"
93
  output_keys:
94
  - "code_feedback"
CF_CodeDebug.yaml CHANGED
@@ -17,7 +17,7 @@ input_keys:
17
  output_data_transformations:
18
  - _target_: flows.data_transformations.KeyRename
19
  old_key2new_key:
20
- raw_response.code: "code"
21
  output_keys:
22
  - "code"
23
 
@@ -46,13 +46,14 @@ subflows_config:
46
  - _target_: flows.data_transformations.RegexFirstOccurrenceExtractor
47
  regex: '(?<=```python)([\s\S]*?)(?=```)'
48
  regex_fallback: '(?<=```)([\s\S]*?)(?=```)'
49
- input_key: "raw_response"
50
  output_key: "code"
51
  strip: True
52
  assert_unique: True
53
 
54
  - _target_: flows.data_transformations.EndOfInteraction
55
  end_of_interaction_string: "Final answer"
 
56
  output_key: "end_of_interaction"
57
 
58
  output_keys:
 
17
  output_data_transformations:
18
  - _target_: flows.data_transformations.KeyRename
19
  old_key2new_key:
20
+ code: "code"
21
  output_keys:
22
  - "code"
23
 
 
46
  - _target_: flows.data_transformations.RegexFirstOccurrenceExtractor
47
  regex: '(?<=```python)([\s\S]*?)(?=```)'
48
  regex_fallback: '(?<=```)([\s\S]*?)(?=```)'
49
+ input_key: "api_output"
50
  output_key: "code"
51
  strip: True
52
  assert_unique: True
53
 
54
  - _target_: flows.data_transformations.EndOfInteraction
55
  end_of_interaction_string: "Final answer"
56
+ input_key: "api_output"
57
  output_key: "end_of_interaction"
58
 
59
  output_keys:
CF_CodeDebugCollab.yaml CHANGED
@@ -17,7 +17,7 @@ input_keys:
17
  output_data_transformations:
18
  - _target_: flows.data_transformations.KeyRename
19
  old_key2new_key:
20
- raw_response.code: "code"
21
  output_keys:
22
  - "code"
23
 
@@ -51,13 +51,14 @@ subflows_config:
51
  - _target_: flows.data_transformations.RegexFirstOccurrenceExtractor
52
  regex: '(?<=```python)([\s\S]*?)(?=```)'
53
  regex_fallback: '(?<=```)([\s\S]*?)(?=```)'
54
- input_key: "raw_response"
55
  output_key: "code"
56
  strip: True
57
  assert_unique: True
58
 
59
  - _target_: flows.data_transformations.EndOfInteraction
60
  end_of_interaction_string: "Final answer"
 
61
  output_key: "end_of_interaction"
62
 
63
  output_keys:
 
17
  output_data_transformations:
18
  - _target_: flows.data_transformations.KeyRename
19
  old_key2new_key:
20
+ code: "code"
21
  output_keys:
22
  - "code"
23
 
 
51
  - _target_: flows.data_transformations.RegexFirstOccurrenceExtractor
52
  regex: '(?<=```python)([\s\S]*?)(?=```)'
53
  regex_fallback: '(?<=```)([\s\S]*?)(?=```)'
54
+ input_key: "api_output"
55
  output_key: "code"
56
  strip: True
57
  assert_unique: True
58
 
59
  - _target_: flows.data_transformations.EndOfInteraction
60
  end_of_interaction_string: "Final answer"
61
+ input_key: "api_output"
62
  output_key: "end_of_interaction"
63
 
64
  output_keys:
CF_CodeDebugCollabWithPlan.yaml CHANGED
@@ -18,7 +18,7 @@ input_keys:
18
  output_data_transformations:
19
  - _target_: flows.data_transformations.KeyRename
20
  old_key2new_key:
21
- raw_response.code: "code"
22
  output_keys:
23
  - "code"
24
 
@@ -52,13 +52,14 @@ subflows_config:
52
  - _target_: flows.data_transformations.RegexFirstOccurrenceExtractor
53
  regex: '(?<=```python)([\s\S]*?)(?=```)'
54
  regex_fallback: '(?<=```)([\s\S]*?)(?=```)'
55
- input_key: "raw_response"
56
  output_key: "code"
57
  strip: True
58
  assert_unique: True
59
 
60
  - _target_: flows.data_transformations.EndOfInteraction
61
  end_of_interaction_string: "Final answer"
 
62
  output_key: "end_of_interaction"
63
 
64
  output_keys:
 
18
  output_data_transformations:
19
  - _target_: flows.data_transformations.KeyRename
20
  old_key2new_key:
21
+ code: "code"
22
  output_keys:
23
  - "code"
24
 
 
52
  - _target_: flows.data_transformations.RegexFirstOccurrenceExtractor
53
  regex: '(?<=```python)([\s\S]*?)(?=```)'
54
  regex_fallback: '(?<=```)([\s\S]*?)(?=```)'
55
+ input_key: "api_output"
56
  output_key: "code"
57
  strip: True
58
  assert_unique: True
59
 
60
  - _target_: flows.data_transformations.EndOfInteraction
61
  end_of_interaction_string: "Final answer"
62
+ input_key: "api_output"
63
  output_key: "end_of_interaction"
64
 
65
  output_keys:
CF_CodeDebugCritic.yaml CHANGED
@@ -15,9 +15,9 @@ input_keys:
15
  output_data_transformations:
16
  - _target_: flows.data_transformations.KeyRename
17
  old_key2new_key:
18
- raw_response.testing_results_summary: "testing_results_summary"
19
- raw_response.all_tests_passed: "all_tests_passed"
20
- raw_response.code_feedback: "code_feedback"
21
  output_keys:
22
  - "testing_results_summary"
23
  - "all_tests_passed"
 
15
  output_data_transformations:
16
  - _target_: flows.data_transformations.KeyRename
17
  old_key2new_key:
18
+ testing_results_summary: "testing_results_summary"
19
+ all_tests_passed: "all_tests_passed"
20
+ code_feedback: "code_feedback"
21
  output_keys:
22
  - "testing_results_summary"
23
  - "all_tests_passed"
CF_CodeDebugCriticWithPlan.yaml CHANGED
@@ -16,9 +16,9 @@ input_keys:
16
  output_data_transformations:
17
  - _target_: flows.data_transformations.KeyRename
18
  old_key2new_key:
19
- raw_response.testing_results_summary: "testing_results_summary"
20
- raw_response.all_tests_passed: "all_tests_passed"
21
- raw_response.code_feedback: "code_feedback"
22
  output_keys:
23
  - "testing_results_summary"
24
  - "all_tests_passed"
 
16
  output_data_transformations:
17
  - _target_: flows.data_transformations.KeyRename
18
  old_key2new_key:
19
+ testing_results_summary: "testing_results_summary"
20
+ all_tests_passed: "all_tests_passed"
21
+ code_feedback: "code_feedback"
22
  output_keys:
23
  - "testing_results_summary"
24
  - "all_tests_passed"
CF_CodeTesting.yaml CHANGED
@@ -10,7 +10,7 @@ output_keys:
10
  - "testing_results_summary"
11
  output_data_transformations:
12
  - _target_: martinjosifoski.CC_flows.src.data_transformations.CorrectnessFlag # ToDo: This import style would not work if the flow is synced in the current implementation (the outer directory is a hash and not the name; figure out how to do the import robustly; e.g., using relative imports)
13
- input_key: "raw_response.public_tests_results"
14
  output_key: "all_tests_passed"
15
  - _target_: martinjosifoski.CC_flows.src.data_transformations.TestingResultsSummaryGeneration
16
  output_key: "testing_results_summary"
 
10
  - "testing_results_summary"
11
  output_data_transformations:
12
  - _target_: martinjosifoski.CC_flows.src.data_transformations.CorrectnessFlag # ToDo: This import style would not work if the flow is synced in the current implementation (the outer directory is a hash and not the name; figure out how to do the import robustly; e.g., using relative imports)
13
+ input_key: "public_tests_results"
14
  output_key: "all_tests_passed"
15
  - _target_: martinjosifoski.CC_flows.src.data_transformations.TestingResultsSummaryGeneration
16
  output_key: "testing_results_summary"
CF_CodeWithPlan.yaml CHANGED
@@ -82,6 +82,7 @@ output_data_transformations:
82
  - _target_: flows.data_transformations.RegexFirstOccurrenceExtractor
83
  regex: '(?<=```python)([\s\S]*?)(?=```)'
84
  regex_fallback: '(?<=```)([\s\S]*?)(?=```)'
 
85
  output_key: "code"
86
  strip: True
87
  assert_unique: True
 
82
  - _target_: flows.data_transformations.RegexFirstOccurrenceExtractor
83
  regex: '(?<=```python)([\s\S]*?)(?=```)'
84
  regex_fallback: '(?<=```)([\s\S]*?)(?=```)'
85
+ input_key: "api_output"
86
  output_key: "code"
87
  strip: True
88
  assert_unique: True
CF_Plan.yaml CHANGED
@@ -24,6 +24,7 @@ output_data_transformations:
24
  regex: '(?<=Conceptual solution)([\s\S]*?)(?=\n\n# [A-Z]|\Z)'
25
  regex_fallback:
26
  - '(?<=Conceptual solution:)([\s\S]*?)(?=\n\n# [A-Z]|\Z)'
 
27
  output_key: "plan"
28
  strip: True
29
  assert_unique: True
 
24
  regex: '(?<=Conceptual solution)([\s\S]*?)(?=\n\n# [A-Z]|\Z)'
25
  regex_fallback:
26
  - '(?<=Conceptual solution:)([\s\S]*?)(?=\n\n# [A-Z]|\Z)'
27
+ input_key: "api_output"
28
  output_key: "plan"
29
  strip: True
30
  assert_unique: True
CF_PlanCollab.yaml CHANGED
@@ -16,7 +16,7 @@ input_keys:
16
  output_data_transformations:
17
  - _target_: flows.data_transformations.KeyRename
18
  old_key2new_key:
19
- raw_response.plan: "plan"
20
  output_keys:
21
  - "plan"
22
 
@@ -48,12 +48,14 @@ subflows_config:
48
  regex: '(?<=Conceptual solution)([\s\S]*?)(?=\n\n# [A-Z]|\Z)'
49
  regex_fallback:
50
  - '(?<=Conceptual solution:)([\s\S]*?)(?=\n\n# [A-Z]|\Z)'
 
51
  output_key: "plan"
52
  strip: True
53
  assert_unique: True
54
 
55
  - _target_: flows.data_transformations.EndOfInteraction
56
  end_of_interaction_string: "Final answer"
 
57
  output_key: "end_of_interaction"
58
 
59
  output_keys:
@@ -65,4 +67,4 @@ subflows_config:
65
  output_data_transformations:
66
  - _target_: flows.data_transformations.KeyRename
67
  old_key2new_key:
68
- raw_response: "plan_feedback"
 
16
  output_data_transformations:
17
  - _target_: flows.data_transformations.KeyRename
18
  old_key2new_key:
19
+ plan: "plan"
20
  output_keys:
21
  - "plan"
22
 
 
48
  regex: '(?<=Conceptual solution)([\s\S]*?)(?=\n\n# [A-Z]|\Z)'
49
  regex_fallback:
50
  - '(?<=Conceptual solution:)([\s\S]*?)(?=\n\n# [A-Z]|\Z)'
51
+ input_key: "api_output"
52
  output_key: "plan"
53
  strip: True
54
  assert_unique: True
55
 
56
  - _target_: flows.data_transformations.EndOfInteraction
57
  end_of_interaction_string: "Final answer"
58
+ input_key: "api_output"
59
  output_key: "end_of_interaction"
60
 
61
  output_keys:
 
67
  output_data_transformations:
68
  - _target_: flows.data_transformations.KeyRename
69
  old_key2new_key:
70
+ api_output: "plan_feedback"
CF_PlanCollab_Code.yaml CHANGED
@@ -13,7 +13,7 @@ input_keys:
13
  output_data_transformations:
14
  - _target_: flows.data_transformations.KeyRename
15
  old_key2new_key:
16
- raw_response.code: "code"
17
  output_keys:
18
  - "code"
19
 
 
13
  output_data_transformations:
14
  - _target_: flows.data_transformations.KeyRename
15
  old_key2new_key:
16
+ code: "code"
17
  output_keys:
18
  - "code"
19
 
CF_PlanReflect.yaml CHANGED
@@ -16,7 +16,7 @@ input_keys:
16
  output_data_transformations:
17
  - _target_: flows.data_transformations.KeyRename
18
  old_key2new_key:
19
- raw_response.plan: "plan"
20
  output_keys:
21
  - "plan"
22
 
@@ -34,12 +34,14 @@ subflows_config:
34
  regex: '(?<=Conceptual solution)([\s\S]*?)(?=\n\n# [A-Z]|\Z)'
35
  regex_fallback:
36
  - '(?<=Conceptual solution:)([\s\S]*?)(?=\n\n# [A-Z]|\Z)'
 
37
  output_key: "plan"
38
  strip: True
39
  assert_unique: True
40
 
41
  - _target_: flows.data_transformations.EndOfInteraction
42
  end_of_interaction_string: "Final answer"
 
43
  output_key: "end_of_interaction"
44
 
45
  output_keys:
 
16
  output_data_transformations:
17
  - _target_: flows.data_transformations.KeyRename
18
  old_key2new_key:
19
+ plan: "plan"
20
  output_keys:
21
  - "plan"
22
 
 
34
  regex: '(?<=Conceptual solution)([\s\S]*?)(?=\n\n# [A-Z]|\Z)'
35
  regex_fallback:
36
  - '(?<=Conceptual solution:)([\s\S]*?)(?=\n\n# [A-Z]|\Z)'
37
+ input_key: "api_output"
38
  output_key: "plan"
39
  strip: True
40
  assert_unique: True
41
 
42
  - _target_: flows.data_transformations.EndOfInteraction
43
  end_of_interaction_string: "Final answer"
44
+ input_key: "api_output"
45
  output_key: "end_of_interaction"
46
 
47
  output_keys:
CF_PlanReflect_Code.yaml CHANGED
@@ -13,7 +13,7 @@ input_keys:
13
  output_data_transformations:
14
  - _target_: flows.data_transformations.KeyRename
15
  old_key2new_key:
16
- raw_response.code: "code"
17
  output_keys:
18
  - "code"
19
 
 
13
  output_data_transformations:
14
  - _target_: flows.data_transformations.KeyRename
15
  old_key2new_key:
16
+ code: "code"
17
  output_keys:
18
  - "code"
19
 
CF_Plan_Code.yaml CHANGED
@@ -13,7 +13,7 @@ input_keys:
13
  output_data_transformations:
14
  - _target_: flows.data_transformations.KeyRename
15
  old_key2new_key:
16
- raw_response.code: "code"
17
  output_keys:
18
  - "code"
19
 
 
13
  output_data_transformations:
14
  - _target_: flows.data_transformations.KeyRename
15
  old_key2new_key:
16
+ code: "code"
17
  output_keys:
18
  - "code"
19
 
CodeTesting.py CHANGED
@@ -33,14 +33,12 @@ class CodeTesting(AtomicFlow):
33
  return cls(**kwargs)
34
 
35
  def run(self,
36
- input_data: Dict[str, Any],
37
- private_keys: Optional[List[str]] = [],
38
- keys_to_ignore_for_hash: Optional[List[str]] = []) -> Dict[str, Any]:
39
 
40
  # ~~~ Retrieve the test data ~~~
41
  test_data = self._get_test_data(input_data)
42
 
43
  # ~~~ Run tests ~~~
44
- response = self._run_tests(input_data, test_data)
45
 
46
  return response
 
33
  return cls(**kwargs)
34
 
35
  def run(self,
36
+ input_data: Dict[str, Any]) -> Dict[str, Any]:
 
 
37
 
38
  # ~~~ Retrieve the test data ~~~
39
  test_data = self._get_test_data(input_data)
40
 
41
  # ~~~ Run tests ~~~
42
+ response: Dict[str, Any] = self._run_tests(input_data, test_data)
43
 
44
  return response
FixedReply_PlanReflect.yaml CHANGED
@@ -8,7 +8,7 @@ input_keys: []
8
  output_data_transformations:
9
  - _target_: flows.data_transformations.KeyRename
10
  old_key2new_key:
11
- raw_response: "plan_reflect_message"
12
  output_keys:
13
  - "plan_reflect_message"
14
 
 
8
  output_data_transformations:
9
  - _target_: flows.data_transformations.KeyRename
10
  old_key2new_key:
11
+ fixed_reply: "plan_reflect_message"
12
  output_keys:
13
  - "plan_reflect_message"
14
 
LC_CodeCriticWrongAttempt.yaml CHANGED
@@ -83,6 +83,6 @@ input_keys:
83
  output_data_transformations:
84
  - _target_: flows.data_transformations.KeyRename
85
  old_key2new_key:
86
- raw_response: "code_feedback"
87
  output_keys:
88
  - "code_feedback"
 
83
  output_data_transformations:
84
  - _target_: flows.data_transformations.KeyRename
85
  old_key2new_key:
86
+ api_output: "code_feedback"
87
  output_keys:
88
  - "code_feedback"
LC_CodeCriticWrongAttemptWithPlan.yaml CHANGED
@@ -91,6 +91,6 @@ input_keys:
91
  output_data_transformations:
92
  - _target_: flows.data_transformations.KeyRename
93
  old_key2new_key:
94
- raw_response: "code_feedback"
95
  output_keys:
96
  - "code_feedback"
 
91
  output_data_transformations:
92
  - _target_: flows.data_transformations.KeyRename
93
  old_key2new_key:
94
+ api_output: "code_feedback"
95
  output_keys:
96
  - "code_feedback"
LC_CodeDebug.yaml CHANGED
@@ -17,7 +17,7 @@ input_keys:
17
  output_data_transformations:
18
  - _target_: flows.data_transformations.KeyRename
19
  old_key2new_key:
20
- raw_response.code: "code"
21
  output_keys:
22
  - "code"
23
 
@@ -46,13 +46,14 @@ subflows_config:
46
  - _target_: flows.data_transformations.RegexFirstOccurrenceExtractor
47
  regex: '(?<=```python)([\s\S]*?)(?=```)'
48
  regex_fallback: '(?<=```)([\s\S]*?)(?=```)'
49
- input_key: "raw_response"
50
  output_key: "code"
51
  strip: True
52
  assert_unique: True
53
 
54
  - _target_: flows.data_transformations.EndOfInteraction
55
  end_of_interaction_string: "Final answer"
 
56
  output_key: "end_of_interaction"
57
 
58
  output_keys:
 
17
  output_data_transformations:
18
  - _target_: flows.data_transformations.KeyRename
19
  old_key2new_key:
20
+ code: "code"
21
  output_keys:
22
  - "code"
23
 
 
46
  - _target_: flows.data_transformations.RegexFirstOccurrenceExtractor
47
  regex: '(?<=```python)([\s\S]*?)(?=```)'
48
  regex_fallback: '(?<=```)([\s\S]*?)(?=```)'
49
+ input_key: "api_output"
50
  output_key: "code"
51
  strip: True
52
  assert_unique: True
53
 
54
  - _target_: flows.data_transformations.EndOfInteraction
55
  end_of_interaction_string: "Final answer"
56
+ input_key: "api_output"
57
  output_key: "end_of_interaction"
58
 
59
  output_keys:
LC_CodeDebugCollab.yaml CHANGED
@@ -17,7 +17,7 @@ input_keys:
17
  output_data_transformations:
18
  - _target_: flows.data_transformations.KeyRename
19
  old_key2new_key:
20
- raw_response.code: "code"
21
  output_keys:
22
  - "code"
23
 
@@ -51,13 +51,14 @@ subflows_config:
51
  - _target_: flows.data_transformations.RegexFirstOccurrenceExtractor
52
  regex: '(?<=```python)([\s\S]*?)(?=```)'
53
  regex_fallback: '(?<=```)([\s\S]*?)(?=```)'
54
- input_key: "raw_response"
55
  output_key: "code"
56
  strip: True
57
  assert_unique: True
58
 
59
  - _target_: flows.data_transformations.EndOfInteraction
60
  end_of_interaction_string: "Final answer"
 
61
  output_key: "end_of_interaction"
62
 
63
  output_keys:
 
17
  output_data_transformations:
18
  - _target_: flows.data_transformations.KeyRename
19
  old_key2new_key:
20
+ code: "code"
21
  output_keys:
22
  - "code"
23
 
 
51
  - _target_: flows.data_transformations.RegexFirstOccurrenceExtractor
52
  regex: '(?<=```python)([\s\S]*?)(?=```)'
53
  regex_fallback: '(?<=```)([\s\S]*?)(?=```)'
54
+ input_key: "api_output"
55
  output_key: "code"
56
  strip: True
57
  assert_unique: True
58
 
59
  - _target_: flows.data_transformations.EndOfInteraction
60
  end_of_interaction_string: "Final answer"
61
+ input_key: "api_output"
62
  output_key: "end_of_interaction"
63
 
64
  output_keys:
LC_CodeDebugCollabWithPlan.yaml CHANGED
@@ -18,7 +18,7 @@ input_keys:
18
  output_data_transformations:
19
  - _target_: flows.data_transformations.KeyRename
20
  old_key2new_key:
21
- raw_response.code: "code"
22
  output_keys:
23
  - "code"
24
 
@@ -52,13 +52,14 @@ subflows_config:
52
  - _target_: flows.data_transformations.RegexFirstOccurrenceExtractor
53
  regex: '(?<=```python)([\s\S]*?)(?=```)'
54
  regex_fallback: '(?<=```)([\s\S]*?)(?=```)'
55
- input_key: "raw_response"
56
  output_key: "code"
57
  strip: True
58
  assert_unique: True
59
 
60
  - _target_: flows.data_transformations.EndOfInteraction
61
  end_of_interaction_string: "Final answer"
 
62
  output_key: "end_of_interaction"
63
 
64
  output_keys:
 
18
  output_data_transformations:
19
  - _target_: flows.data_transformations.KeyRename
20
  old_key2new_key:
21
+ code: "code"
22
  output_keys:
23
  - "code"
24
 
 
52
  - _target_: flows.data_transformations.RegexFirstOccurrenceExtractor
53
  regex: '(?<=```python)([\s\S]*?)(?=```)'
54
  regex_fallback: '(?<=```)([\s\S]*?)(?=```)'
55
+ input_key: "api_output"
56
  output_key: "code"
57
  strip: True
58
  assert_unique: True
59
 
60
  - _target_: flows.data_transformations.EndOfInteraction
61
  end_of_interaction_string: "Final answer"
62
+ input_key: "api_output"
63
  output_key: "end_of_interaction"
64
 
65
  output_keys:
LC_CodeDebugCritic.yaml CHANGED
@@ -15,9 +15,9 @@ input_keys:
15
  output_data_transformations:
16
  - _target_: flows.data_transformations.KeyRename
17
  old_key2new_key:
18
- raw_response.testing_results_summary: "testing_results_summary"
19
- raw_response.all_tests_passed: "all_tests_passed"
20
- raw_response.code_feedback: "code_feedback"
21
  output_keys:
22
  - "testing_results_summary"
23
  - "all_tests_passed"
 
15
  output_data_transformations:
16
  - _target_: flows.data_transformations.KeyRename
17
  old_key2new_key:
18
+ testing_results_summary: "testing_results_summary"
19
+ all_tests_passed: "all_tests_passed"
20
+ code_feedback: "code_feedback"
21
  output_keys:
22
  - "testing_results_summary"
23
  - "all_tests_passed"
LC_CodeDebugCriticWithPlan.yaml CHANGED
@@ -16,9 +16,9 @@ input_keys:
16
  output_data_transformations:
17
  - _target_: flows.data_transformations.KeyRename
18
  old_key2new_key:
19
- raw_response.testing_results_summary: "testing_results_summary"
20
- raw_response.all_tests_passed: "all_tests_passed"
21
- raw_response.code_feedback: "code_feedback"
22
  output_keys:
23
  - "testing_results_summary"
24
  - "all_tests_passed"
 
16
  output_data_transformations:
17
  - _target_: flows.data_transformations.KeyRename
18
  old_key2new_key:
19
+ testing_results_summary: "testing_results_summary"
20
+ all_tests_passed: "all_tests_passed"
21
+ code_feedback: "code_feedback"
22
  output_keys:
23
  - "testing_results_summary"
24
  - "all_tests_passed"
LC_CodeTesting.yaml CHANGED
@@ -12,7 +12,7 @@ output_keys:
12
  - "testing_results_summary"
13
  output_data_transformations:
14
  - _target_: .src.data_transformations.CorrectnessFlag
15
- input_key: "raw_response.public_tests_results"
16
  output_key: "all_tests_passed"
17
  - _target_: .src.data_transformations.TestingResultsSummaryGeneration
18
  output_key: "testing_results_summary"
 
12
  - "testing_results_summary"
13
  output_data_transformations:
14
  - _target_: .src.data_transformations.CorrectnessFlag
15
+ input_key: "public_tests_results"
16
  output_key: "all_tests_passed"
17
  - _target_: .src.data_transformations.TestingResultsSummaryGeneration
18
  output_key: "testing_results_summary"
LC_CodeWithPlan.yaml CHANGED
@@ -83,6 +83,7 @@ output_data_transformations:
83
  - _target_: flows.data_transformations.RegexFirstOccurrenceExtractor
84
  regex: '(?<=```python)([\s\S]*?)(?=```)'
85
  regex_fallback: '(?<=```)([\s\S]*?)(?=```)'
 
86
  output_key: "code"
87
  strip: True
88
  assert_unique: True
 
83
  - _target_: flows.data_transformations.RegexFirstOccurrenceExtractor
84
  regex: '(?<=```python)([\s\S]*?)(?=```)'
85
  regex_fallback: '(?<=```)([\s\S]*?)(?=```)'
86
+ input_key: "api_output"
87
  output_key: "code"
88
  strip: True
89
  assert_unique: True
LC_Plan.yaml CHANGED
@@ -23,6 +23,7 @@ output_data_transformations:
23
  regex: '(?<=Conceptual solution)([\s\S]*?)(?=\n\n# [A-Z]|\Z)'
24
  regex_fallback:
25
  - '(?<=Conceptual solution:)([\s\S]*?)(?=\n\n# [A-Z]|\Z)'
 
26
  output_key: "plan"
27
  strip: True
28
  assert_unique: True
 
23
  regex: '(?<=Conceptual solution)([\s\S]*?)(?=\n\n# [A-Z]|\Z)'
24
  regex_fallback:
25
  - '(?<=Conceptual solution:)([\s\S]*?)(?=\n\n# [A-Z]|\Z)'
26
+ input_key: "api_output"
27
  output_key: "plan"
28
  strip: True
29
  assert_unique: True
LC_PlanCollab.yaml CHANGED
@@ -16,7 +16,7 @@ input_keys:
16
  output_data_transformations:
17
  - _target_: flows.data_transformations.KeyRename
18
  old_key2new_key:
19
- raw_response.plan: "plan"
20
  output_keys:
21
  - "plan"
22
 
@@ -48,12 +48,14 @@ subflows_config:
48
  regex: '(?<=Conceptual solution)([\s\S]*?)(?=\n\n# [A-Z]|\Z)'
49
  regex_fallback:
50
  - '(?<=Conceptual solution:)([\s\S]*?)(?=\n\n# [A-Z]|\Z)'
 
51
  output_key: "plan"
52
  strip: True
53
  assert_unique: True
54
 
55
  - _target_: flows.data_transformations.EndOfInteraction
56
  end_of_interaction_string: "Final answer"
 
57
  output_key: "end_of_interaction"
58
 
59
  output_keys:
@@ -65,4 +67,4 @@ subflows_config:
65
  output_data_transformations:
66
  - _target_: flows.data_transformations.KeyRename
67
  old_key2new_key:
68
- raw_response: "plan_feedback"
 
16
  output_data_transformations:
17
  - _target_: flows.data_transformations.KeyRename
18
  old_key2new_key:
19
+ plan: "plan"
20
  output_keys:
21
  - "plan"
22
 
 
48
  regex: '(?<=Conceptual solution)([\s\S]*?)(?=\n\n# [A-Z]|\Z)'
49
  regex_fallback:
50
  - '(?<=Conceptual solution:)([\s\S]*?)(?=\n\n# [A-Z]|\Z)'
51
+ input_key: "api_output"
52
  output_key: "plan"
53
  strip: True
54
  assert_unique: True
55
 
56
  - _target_: flows.data_transformations.EndOfInteraction
57
  end_of_interaction_string: "Final answer"
58
+ input_key: "api_output"
59
  output_key: "end_of_interaction"
60
 
61
  output_keys:
 
67
  output_data_transformations:
68
  - _target_: flows.data_transformations.KeyRename
69
  old_key2new_key:
70
+ api_output: "plan_feedback"
LC_PlanCollab_Code.yaml CHANGED
@@ -13,7 +13,7 @@ input_keys:
13
  output_data_transformations:
14
  - _target_: flows.data_transformations.KeyRename
15
  old_key2new_key:
16
- raw_response.code: "code"
17
  output_keys:
18
  - "code"
19
 
 
13
  output_data_transformations:
14
  - _target_: flows.data_transformations.KeyRename
15
  old_key2new_key:
16
+ code: "code"
17
  output_keys:
18
  - "code"
19
 
LC_PlanReflect.yaml CHANGED
@@ -15,7 +15,7 @@ input_keys:
15
  output_data_transformations:
16
  - _target_: flows.data_transformations.KeyRename
17
  old_key2new_key:
18
- raw_response.plan: "plan"
19
  output_keys:
20
  - "plan"
21
 
@@ -33,12 +33,14 @@ subflows_config:
33
  regex: '(?<=Conceptual solution)([\s\S]*?)(?=\n\n# [A-Z]|\Z)'
34
  regex_fallback:
35
  - '(?<=Conceptual solution:)([\s\S]*?)(?=\n\n# [A-Z]|\Z)'
 
36
  output_key: "plan"
37
  strip: True
38
  assert_unique: True
39
 
40
  - _target_: flows.data_transformations.EndOfInteraction
41
  end_of_interaction_string: "Final answer"
 
42
  output_key: "end_of_interaction"
43
 
44
  output_keys:
 
15
  output_data_transformations:
16
  - _target_: flows.data_transformations.KeyRename
17
  old_key2new_key:
18
+ plan: "plan"
19
  output_keys:
20
  - "plan"
21
 
 
33
  regex: '(?<=Conceptual solution)([\s\S]*?)(?=\n\n# [A-Z]|\Z)'
34
  regex_fallback:
35
  - '(?<=Conceptual solution:)([\s\S]*?)(?=\n\n# [A-Z]|\Z)'
36
+ input_key: "api_output"
37
  output_key: "plan"
38
  strip: True
39
  assert_unique: True
40
 
41
  - _target_: flows.data_transformations.EndOfInteraction
42
  end_of_interaction_string: "Final answer"
43
+ input_key: "api_output"
44
  output_key: "end_of_interaction"
45
 
46
  output_keys:
LC_Plan_Code.yaml CHANGED
@@ -13,7 +13,7 @@ input_keys:
13
  output_data_transformations:
14
  - _target_: flows.data_transformations.KeyRename
15
  old_key2new_key:
16
- raw_response.code: "code"
17
  output_keys:
18
  - "code"
19
 
 
13
  output_data_transformations:
14
  - _target_: flows.data_transformations.KeyRename
15
  old_key2new_key:
16
+ code: "code"
17
  output_keys:
18
  - "code"
19
 
src/data_transformations/testing_results_summary_generation.py CHANGED
@@ -17,7 +17,7 @@ class TestingResultsSummaryGeneration(DataTransformation):
17
  data_dict[self.output_key] = self.params["no_error_template"]
18
  return data_dict
19
 
20
- test_data = unflatten_dict(data_dict)["raw_response"]
21
 
22
  if not test_data["compilation_status"]:
23
  # compilation error occurred
 
17
  data_dict[self.output_key] = self.params["no_error_template"]
18
  return data_dict
19
 
20
+ test_data = unflatten_dict(data_dict)
21
 
22
  if not test_data["compilation_status"]:
23
  # compilation error occurred