-
Notifications
You must be signed in to change notification settings - Fork 0
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
- Loading branch information
1 parent
b15156f
commit de2b833
Showing
206 changed files
with
13,467 additions
and
48,429 deletions.
There are no files selected for viewing
96 changes: 37 additions & 59 deletions
96
....5-Sonnet/babyai/BabyAI-MixedTrainLocal-v0/goto/BabyAI-MixedTrainLocal-v0/goto_run_00.csv
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -1,63 +1,41 @@ | ||
Step,Observation,Action,Reasoning,Reward,Done | ||
0,"a wall 1 step right | ||
a grey ball 3 steps left and 3 steps forward | ||
a blue key 3 steps left and 1 step forward | ||
a grey ball 2 steps left and 1 step forward | ||
a green key 2 steps left | ||
a blue key 3 steps forward",turn left,,0,False | ||
1,"a wall 1 step right | ||
a grey ball 3 steps left and 2 steps forward | ||
a blue key 3 steps left | ||
a grey ball 2 steps left | ||
a blue key 2 steps forward",go forward,,0,False | ||
2,"a wall 1 step right | ||
a grey ball 3 steps left and 1 step forward | ||
a blue key 1 step forward",go forward,,0,False | ||
3,"a wall 1 step right | ||
a grey ball 3 steps left and 1 step forward | ||
a blue key 1 step forward",go forward,,0,False | ||
4,"a wall 1 step right | ||
a grey ball 3 steps left and 1 step forward | ||
a blue key 1 step forward",toggle,,0,False | ||
5,"You carry a blue key | ||
a wall 2 steps forward | ||
a wall 1 step right | ||
a grey ball 3 steps left and 1 step forward",pick up,,0,False | ||
6,"You carry a blue key | ||
a wall 6 steps forward | ||
Step,Action,Reasoning,Observation,Reward,Done | ||
0,turn left,,"a wall 4 steps forward | ||
a wall 2 steps right | ||
a green key 2 steps left and 4 steps forward | ||
a green key 2 steps left and 2 steps forward | ||
a blue ball 1 step left and 5 steps forward | ||
a blue key 1 step left and 3 steps forward | ||
a grey ball 1 step left and 2 steps forward | ||
a grey ball 1 step right and 5 steps forward | ||
a grey ball 1 step right and 3 steps forward",turn left,,0,False | ||
7,"You carry a blue key | ||
a wall 5 steps forward | ||
a grey ball 1 step right and 2 steps forward",0,False | ||
1,go forward,,"a wall 3 steps forward | ||
a wall 2 steps right | ||
a green key 2 steps left and 3 steps forward | ||
a green key 2 steps left and 1 step forward | ||
a blue ball 1 step left and 4 steps forward | ||
a blue key 1 step left and 2 steps forward | ||
a grey ball 1 step left and 1 step forward | ||
a grey ball 1 step right and 4 steps forward | ||
a grey ball 1 step right and 2 steps forward",go forward,,0,False | ||
8,"You carry a blue key | ||
a wall 4 steps forward | ||
a grey ball 1 step right and 1 step forward",0,False | ||
2,turn right,,"a wall 2 steps forward | ||
a wall 3 steps left | ||
a grey ball 1 step left and 1 step forward",0,False | ||
3,turn left,,"a wall 3 steps forward | ||
a wall 2 steps right | ||
a grey ball 1 step right and 1 step forward",0,False | ||
4,turn right,,"a wall 2 steps forward | ||
a wall 3 steps left | ||
a grey ball 1 step left and 1 step forward",0,False | ||
5,turn left,,"a wall 3 steps forward | ||
a wall 2 steps right | ||
a grey ball 1 step right and 1 step forward",0,False | ||
6,turn right,,"a wall 2 steps forward | ||
a wall 3 steps left | ||
a grey ball 1 step left and 1 step forward",0,False | ||
7,turn left,,"a wall 3 steps forward | ||
a wall 2 steps right | ||
a grey ball 1 step right and 1 step forward",0,False | ||
8,turn right,,"a wall 2 steps forward | ||
a wall 3 steps left | ||
a grey ball 1 step left and 1 step forward",0,False | ||
9,turn left,,"a wall 3 steps forward | ||
a wall 2 steps right | ||
a green key 2 steps left and 2 steps forward | ||
a green key 2 steps left | ||
a blue ball 1 step left and 3 steps forward | ||
a blue key 1 step left and 1 step forward | ||
a grey ball 1 step left | ||
a grey ball 1 step right and 3 steps forward | ||
a grey ball 1 step right and 1 step forward",go forward,,0,False | ||
9,"You carry a blue key | ||
a grey ball 1 step right and 1 step forward",0,False | ||
10,turn right,,"a wall 2 steps forward | ||
a wall 3 steps left | ||
a green key 2 steps forward | ||
a grey ball 1 step forward | ||
a blue key 1 step right and 1 step forward | ||
a purple ball 2 steps right and 4 steps forward | ||
a green key 2 steps right and 2 steps forward | ||
a blue ball 3 steps right and 1 step forward",turn left,,0.859375,True | ||
a grey ball 1 step left and 1 step forward",0,False | ||
11,turn left,,"a wall 3 steps forward | ||
a wall 2 steps right | ||
a grey ball 1 step right and 1 step forward",0,False | ||
12,go forward,,"a wall 2 steps forward | ||
a grey ball 1 step right",0,False | ||
13,turn right,,"a wall 2 steps left | ||
a grey ball 1 step forward",0.803125,True |
27 changes: 14 additions & 13 deletions
27
...5-Sonnet/babyai/BabyAI-MixedTrainLocal-v0/goto/BabyAI-MixedTrainLocal-v0/goto_run_00.json
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -1,39 +1,40 @@ | ||
{ | ||
"task": "BabyAI-MixedTrainLocal-v0/goto", | ||
"action_frequency": { | ||
"turn left": 3, | ||
"go forward": 5, | ||
"toggle": 1, | ||
"pick up": 1 | ||
"turn left": 6, | ||
"go forward": 2, | ||
"turn right": 6 | ||
}, | ||
"input_tokens": 5503, | ||
"output_tokens": 86, | ||
"input_tokens": 9926, | ||
"output_tokens": 70, | ||
"done": true, | ||
"episode_return": 0.859375, | ||
"num_steps": 10, | ||
"episode_return": 0.803125, | ||
"num_steps": 14, | ||
"failed_candidates": [], | ||
"mission": "go to a grey ball", | ||
"mission": "go to the grey ball", | ||
"progression": 1.0, | ||
"process_num": "ForkProcess-1", | ||
"seed": 587100551, | ||
"seed": 917751506, | ||
"agent": { | ||
"type": "naive", | ||
"remember_cot": true, | ||
"max_history": 16, | ||
"max_image_history": 0, | ||
"max_cot_history": 1, | ||
"max_icl_history": 1000, | ||
"cache_icl": false | ||
}, | ||
"client": { | ||
"client_name": "claude", | ||
"model_id": "claude-3-5-sonnet-20240620", | ||
"base_url": "http://localhost:8000/v1", | ||
"model_id": "claude-3-5-sonnet-latest", | ||
"base_url": "http://localhost:8080/v1", | ||
"generate_kwargs": { | ||
"temperature": 0.0, | ||
"max_tokens": 1024 | ||
}, | ||
"timeout": 60, | ||
"max_retries": 5, | ||
"delay": 2 | ||
"delay": 2, | ||
"alternate_roles": false | ||
} | ||
} |
65 changes: 38 additions & 27 deletions
65
....5-Sonnet/babyai/BabyAI-MixedTrainLocal-v0/goto/BabyAI-MixedTrainLocal-v0/goto_run_01.csv
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -1,29 +1,40 @@ | ||
Step,Observation,Action,Reasoning,Reward,Done | ||
0,"a wall 5 steps forward | ||
Step,Action,Reasoning,Observation,Reward,Done | ||
0,turn left,,"a wall 6 steps forward | ||
a wall 3 steps right | ||
a purple box 3 steps left and 2 steps forward | ||
a red box 3 steps left and 1 step forward | ||
a yellow key 2 steps left and 4 steps forward | ||
a red ball 1 step left and 4 steps forward | ||
a green ball 1 step left and 2 steps forward | ||
a green box 1 step left and 1 step forward | ||
a red ball 1 step right and 2 steps forward | ||
a yellow key 2 steps right and 4 steps forward",turn right,,0,False | ||
1,"a wall 4 steps forward | ||
a grey ball 2 steps right and 1 step forward",0,False | ||
1,turn right,,"a wall 3 steps forward | ||
a wall 1 step right | ||
a grey ball 1 step left and 2 steps forward",0,False | ||
2,turn left,,"a wall 6 steps forward | ||
a wall 3 steps right | ||
a purple box 3 steps left and 1 step forward | ||
a red box 3 steps left | ||
a yellow key 2 steps left and 3 steps forward | ||
a red ball 1 step left and 3 steps forward | ||
a green ball 1 step left and 1 step forward | ||
a green box 1 step left | ||
a red ball 1 step right and 1 step forward | ||
a yellow key 2 steps right and 3 steps forward",go forward,,0,False | ||
2,"a wall 3 steps left | ||
a green ball 2 steps left and 3 steps forward | ||
a red box 3 steps forward | ||
a green box 1 step forward | ||
a purple box 1 step right and 3 steps forward | ||
a green ball 1 step right and 1 step forward | ||
a yellow key 3 steps right and 2 steps forward | ||
a red ball 3 steps right and 1 step forward",turn left,,0.9578125,True | ||
a grey ball 2 steps right and 1 step forward",0,False | ||
3,turn right,,"a wall 3 steps forward | ||
a wall 1 step right | ||
a grey ball 1 step left and 2 steps forward",0,False | ||
4,turn left,,"a wall 6 steps forward | ||
a wall 3 steps right | ||
a grey ball 2 steps right and 1 step forward",0,False | ||
5,turn right,,"a wall 3 steps forward | ||
a wall 1 step right | ||
a grey ball 1 step left and 2 steps forward",0,False | ||
6,turn left,,"a wall 6 steps forward | ||
a wall 3 steps right | ||
a grey ball 2 steps right and 1 step forward",0,False | ||
7,turn right,,"a wall 3 steps forward | ||
a wall 1 step right | ||
a grey ball 1 step left and 2 steps forward",0,False | ||
8,turn left,,"a wall 6 steps forward | ||
a wall 3 steps right | ||
a grey ball 2 steps right and 1 step forward",0,False | ||
9,turn right,,"a wall 3 steps forward | ||
a wall 1 step right | ||
a grey ball 1 step left and 2 steps forward",0,False | ||
10,turn left,,"a wall 6 steps forward | ||
a wall 3 steps right | ||
a grey ball 2 steps right and 1 step forward",0,False | ||
11,go forward,,"a wall 5 steps forward | ||
a grey ball 2 steps right",0,False | ||
12,turn right,,"a wall 2 steps right | ||
a grey ball 2 steps forward",0,False | ||
13,go forward,,"a wall 2 steps right | ||
a grey ball 1 step forward",0.803125,True |
26 changes: 14 additions & 12 deletions
26
...5-Sonnet/babyai/BabyAI-MixedTrainLocal-v0/goto/BabyAI-MixedTrainLocal-v0/goto_run_01.json
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -1,38 +1,40 @@ | ||
{ | ||
"task": "BabyAI-MixedTrainLocal-v0/goto", | ||
"action_frequency": { | ||
"turn right": 1, | ||
"go forward": 1, | ||
"turn left": 1 | ||
"turn left": 6, | ||
"turn right": 6, | ||
"go forward": 2 | ||
}, | ||
"input_tokens": 1356, | ||
"output_tokens": 31, | ||
"input_tokens": 9898, | ||
"output_tokens": 70, | ||
"done": true, | ||
"episode_return": 0.9578125, | ||
"num_steps": 3, | ||
"episode_return": 0.803125, | ||
"num_steps": 14, | ||
"failed_candidates": [], | ||
"mission": "go to the green box", | ||
"mission": "go to the grey ball", | ||
"progression": 1.0, | ||
"process_num": "ForkProcess-2", | ||
"seed": 68573331, | ||
"seed": 3943674400, | ||
"agent": { | ||
"type": "naive", | ||
"remember_cot": true, | ||
"max_history": 16, | ||
"max_image_history": 0, | ||
"max_cot_history": 1, | ||
"max_icl_history": 1000, | ||
"cache_icl": false | ||
}, | ||
"client": { | ||
"client_name": "claude", | ||
"model_id": "claude-3-5-sonnet-20240620", | ||
"base_url": "http://localhost:8000/v1", | ||
"model_id": "claude-3-5-sonnet-latest", | ||
"base_url": "http://localhost:8080/v1", | ||
"generate_kwargs": { | ||
"temperature": 0.0, | ||
"max_tokens": 1024 | ||
}, | ||
"timeout": 60, | ||
"max_retries": 5, | ||
"delay": 2 | ||
"delay": 2, | ||
"alternate_roles": false | ||
} | ||
} |
Oops, something went wrong.