Skip to content

Commit

Permalink
fix: babyai fix
Browse files Browse the repository at this point in the history
  • Loading branch information
DavidePaglieri committed Dec 9, 2024
1 parent b15156f commit de2b833
Show file tree
Hide file tree
Showing 206 changed files with 13,467 additions and 48,429 deletions.
Original file line number Diff line number Diff line change
@@ -1,63 +1,41 @@
Step,Observation,Action,Reasoning,Reward,Done
0,"a wall 1 step right
a grey ball 3 steps left and 3 steps forward
a blue key 3 steps left and 1 step forward
a grey ball 2 steps left and 1 step forward
a green key 2 steps left
a blue key 3 steps forward",turn left,,0,False
1,"a wall 1 step right
a grey ball 3 steps left and 2 steps forward
a blue key 3 steps left
a grey ball 2 steps left
a blue key 2 steps forward",go forward,,0,False
2,"a wall 1 step right
a grey ball 3 steps left and 1 step forward
a blue key 1 step forward",go forward,,0,False
3,"a wall 1 step right
a grey ball 3 steps left and 1 step forward
a blue key 1 step forward",go forward,,0,False
4,"a wall 1 step right
a grey ball 3 steps left and 1 step forward
a blue key 1 step forward",toggle,,0,False
5,"You carry a blue key
a wall 2 steps forward
a wall 1 step right
a grey ball 3 steps left and 1 step forward",pick up,,0,False
6,"You carry a blue key
a wall 6 steps forward
Step,Action,Reasoning,Observation,Reward,Done
0,turn left,,"a wall 4 steps forward
a wall 2 steps right
a green key 2 steps left and 4 steps forward
a green key 2 steps left and 2 steps forward
a blue ball 1 step left and 5 steps forward
a blue key 1 step left and 3 steps forward
a grey ball 1 step left and 2 steps forward
a grey ball 1 step right and 5 steps forward
a grey ball 1 step right and 3 steps forward",turn left,,0,False
7,"You carry a blue key
a wall 5 steps forward
a grey ball 1 step right and 2 steps forward",0,False
1,go forward,,"a wall 3 steps forward
a wall 2 steps right
a green key 2 steps left and 3 steps forward
a green key 2 steps left and 1 step forward
a blue ball 1 step left and 4 steps forward
a blue key 1 step left and 2 steps forward
a grey ball 1 step left and 1 step forward
a grey ball 1 step right and 4 steps forward
a grey ball 1 step right and 2 steps forward",go forward,,0,False
8,"You carry a blue key
a wall 4 steps forward
a grey ball 1 step right and 1 step forward",0,False
2,turn right,,"a wall 2 steps forward
a wall 3 steps left
a grey ball 1 step left and 1 step forward",0,False
3,turn left,,"a wall 3 steps forward
a wall 2 steps right
a grey ball 1 step right and 1 step forward",0,False
4,turn right,,"a wall 2 steps forward
a wall 3 steps left
a grey ball 1 step left and 1 step forward",0,False
5,turn left,,"a wall 3 steps forward
a wall 2 steps right
a grey ball 1 step right and 1 step forward",0,False
6,turn right,,"a wall 2 steps forward
a wall 3 steps left
a grey ball 1 step left and 1 step forward",0,False
7,turn left,,"a wall 3 steps forward
a wall 2 steps right
a grey ball 1 step right and 1 step forward",0,False
8,turn right,,"a wall 2 steps forward
a wall 3 steps left
a grey ball 1 step left and 1 step forward",0,False
9,turn left,,"a wall 3 steps forward
a wall 2 steps right
a green key 2 steps left and 2 steps forward
a green key 2 steps left
a blue ball 1 step left and 3 steps forward
a blue key 1 step left and 1 step forward
a grey ball 1 step left
a grey ball 1 step right and 3 steps forward
a grey ball 1 step right and 1 step forward",go forward,,0,False
9,"You carry a blue key
a grey ball 1 step right and 1 step forward",0,False
10,turn right,,"a wall 2 steps forward
a wall 3 steps left
a green key 2 steps forward
a grey ball 1 step forward
a blue key 1 step right and 1 step forward
a purple ball 2 steps right and 4 steps forward
a green key 2 steps right and 2 steps forward
a blue ball 3 steps right and 1 step forward",turn left,,0.859375,True
a grey ball 1 step left and 1 step forward",0,False
11,turn left,,"a wall 3 steps forward
a wall 2 steps right
a grey ball 1 step right and 1 step forward",0,False
12,go forward,,"a wall 2 steps forward
a grey ball 1 step right",0,False
13,turn right,,"a wall 2 steps left
a grey ball 1 step forward",0.803125,True
Original file line number Diff line number Diff line change
@@ -1,39 +1,40 @@
{
"task": "BabyAI-MixedTrainLocal-v0/goto",
"action_frequency": {
"turn left": 3,
"go forward": 5,
"toggle": 1,
"pick up": 1
"turn left": 6,
"go forward": 2,
"turn right": 6
},
"input_tokens": 5503,
"output_tokens": 86,
"input_tokens": 9926,
"output_tokens": 70,
"done": true,
"episode_return": 0.859375,
"num_steps": 10,
"episode_return": 0.803125,
"num_steps": 14,
"failed_candidates": [],
"mission": "go to a grey ball",
"mission": "go to the grey ball",
"progression": 1.0,
"process_num": "ForkProcess-1",
"seed": 587100551,
"seed": 917751506,
"agent": {
"type": "naive",
"remember_cot": true,
"max_history": 16,
"max_image_history": 0,
"max_cot_history": 1,
"max_icl_history": 1000,
"cache_icl": false
},
"client": {
"client_name": "claude",
"model_id": "claude-3-5-sonnet-20240620",
"base_url": "http://localhost:8000/v1",
"model_id": "claude-3-5-sonnet-latest",
"base_url": "http://localhost:8080/v1",
"generate_kwargs": {
"temperature": 0.0,
"max_tokens": 1024
},
"timeout": 60,
"max_retries": 5,
"delay": 2
"delay": 2,
"alternate_roles": false
}
}
Original file line number Diff line number Diff line change
@@ -1,29 +1,40 @@
Step,Observation,Action,Reasoning,Reward,Done
0,"a wall 5 steps forward
Step,Action,Reasoning,Observation,Reward,Done
0,turn left,,"a wall 6 steps forward
a wall 3 steps right
a purple box 3 steps left and 2 steps forward
a red box 3 steps left and 1 step forward
a yellow key 2 steps left and 4 steps forward
a red ball 1 step left and 4 steps forward
a green ball 1 step left and 2 steps forward
a green box 1 step left and 1 step forward
a red ball 1 step right and 2 steps forward
a yellow key 2 steps right and 4 steps forward",turn right,,0,False
1,"a wall 4 steps forward
a grey ball 2 steps right and 1 step forward",0,False
1,turn right,,"a wall 3 steps forward
a wall 1 step right
a grey ball 1 step left and 2 steps forward",0,False
2,turn left,,"a wall 6 steps forward
a wall 3 steps right
a purple box 3 steps left and 1 step forward
a red box 3 steps left
a yellow key 2 steps left and 3 steps forward
a red ball 1 step left and 3 steps forward
a green ball 1 step left and 1 step forward
a green box 1 step left
a red ball 1 step right and 1 step forward
a yellow key 2 steps right and 3 steps forward",go forward,,0,False
2,"a wall 3 steps left
a green ball 2 steps left and 3 steps forward
a red box 3 steps forward
a green box 1 step forward
a purple box 1 step right and 3 steps forward
a green ball 1 step right and 1 step forward
a yellow key 3 steps right and 2 steps forward
a red ball 3 steps right and 1 step forward",turn left,,0.9578125,True
a grey ball 2 steps right and 1 step forward",0,False
3,turn right,,"a wall 3 steps forward
a wall 1 step right
a grey ball 1 step left and 2 steps forward",0,False
4,turn left,,"a wall 6 steps forward
a wall 3 steps right
a grey ball 2 steps right and 1 step forward",0,False
5,turn right,,"a wall 3 steps forward
a wall 1 step right
a grey ball 1 step left and 2 steps forward",0,False
6,turn left,,"a wall 6 steps forward
a wall 3 steps right
a grey ball 2 steps right and 1 step forward",0,False
7,turn right,,"a wall 3 steps forward
a wall 1 step right
a grey ball 1 step left and 2 steps forward",0,False
8,turn left,,"a wall 6 steps forward
a wall 3 steps right
a grey ball 2 steps right and 1 step forward",0,False
9,turn right,,"a wall 3 steps forward
a wall 1 step right
a grey ball 1 step left and 2 steps forward",0,False
10,turn left,,"a wall 6 steps forward
a wall 3 steps right
a grey ball 2 steps right and 1 step forward",0,False
11,go forward,,"a wall 5 steps forward
a grey ball 2 steps right",0,False
12,turn right,,"a wall 2 steps right
a grey ball 2 steps forward",0,False
13,go forward,,"a wall 2 steps right
a grey ball 1 step forward",0.803125,True
Original file line number Diff line number Diff line change
@@ -1,38 +1,40 @@
{
"task": "BabyAI-MixedTrainLocal-v0/goto",
"action_frequency": {
"turn right": 1,
"go forward": 1,
"turn left": 1
"turn left": 6,
"turn right": 6,
"go forward": 2
},
"input_tokens": 1356,
"output_tokens": 31,
"input_tokens": 9898,
"output_tokens": 70,
"done": true,
"episode_return": 0.9578125,
"num_steps": 3,
"episode_return": 0.803125,
"num_steps": 14,
"failed_candidates": [],
"mission": "go to the green box",
"mission": "go to the grey ball",
"progression": 1.0,
"process_num": "ForkProcess-2",
"seed": 68573331,
"seed": 3943674400,
"agent": {
"type": "naive",
"remember_cot": true,
"max_history": 16,
"max_image_history": 0,
"max_cot_history": 1,
"max_icl_history": 1000,
"cache_icl": false
},
"client": {
"client_name": "claude",
"model_id": "claude-3-5-sonnet-20240620",
"base_url": "http://localhost:8000/v1",
"model_id": "claude-3-5-sonnet-latest",
"base_url": "http://localhost:8080/v1",
"generate_kwargs": {
"temperature": 0.0,
"max_tokens": 1024
},
"timeout": 60,
"max_retries": 5,
"delay": 2
"delay": 2,
"alternate_roles": false
}
}
Loading

0 comments on commit de2b833

Please sign in to comment.