Spaces:
Running
Running
{ | |
"12172380859428428757": { | |
"episode_goal": "Open a new Chrome private window", | |
"steps": [ | |
{ | |
"step_id": 0, | |
"screenshot_path": "./aitw_gemini_images/episode_12172380859428428757_step_0.png", | |
"action_history": "", | |
"ground_truth_format": "mcq", | |
"questions": { | |
"question": "Based on the goal and screen, what is the precise next action to perform?", | |
"options": [ | |
"Type: 'search'", | |
"Swipe: Down", | |
"Tap: [382, 838]", | |
"Button: Press Back" | |
], | |
"correct_answer_index": 2 | |
} | |
}, | |
{ | |
"step_id": 1, | |
"screenshot_path": "./aitw_gemini_images/episode_12172380859428428757_step_1.png", | |
"action_history": "Step 0: Tapped at pixel coordinates (x,y): [382, 838]", | |
"ground_truth_format": "mcq", | |
"questions": { | |
"question": "Based on the goal and screen, what is the precise next action to perform?", | |
"options": [ | |
"Button: Press Back", | |
"Tap: [120, 625]", | |
"Swipe: Down", | |
"Tap: [224, 776]" | |
], | |
"correct_answer_index": 3 | |
} | |
}, | |
{ | |
"step_id": 2, | |
"screenshot_path": "./aitw_gemini_images/episode_12172380859428428757_step_2.png", | |
"action_history": "Step 0: Tapped at pixel coordinates (x,y): [382, 838]\nStep 1: Tapped at pixel coordinates (x,y): [224, 776]", | |
"ground_truth_format": "mcq", | |
"questions": { | |
"question": "Based on the goal and screen, what is the precise next action to perform?", | |
"options": [ | |
"Tap: [500, 420]", | |
"Tap: [160, 775]", | |
"Button: Press Back", | |
"Tap: [420, 775]" | |
], | |
"correct_answer_index": 3 | |
} | |
}, | |
{ | |
"step_id": 3, | |
"screenshot_path": "./aitw_gemini_images/episode_12172380859428428757_step_3.png", | |
"action_history": "Step 0: Tapped at pixel coordinates (x,y): [382, 838]\nStep 1: Tapped at pixel coordinates (x,y): [224, 776]\nStep 2: Tapped at pixel coordinates (x,y): [420, 775]", | |
"ground_truth_format": "mcq", | |
"questions": { | |
"question": "Based on the goal and screen, what is the precise next action to perform?", | |
"options": [ | |
"Tap: [468, 64]", | |
"Tap: [513, 64]", | |
"Tap: [518, 526]", | |
"Type: 'new incognito tab'" | |
], | |
"correct_answer_index": 0 | |
} | |
}, | |
{ | |
"step_id": 4, | |
"screenshot_path": "./aitw_gemini_images/episode_12172380859428428757_step_4.png", | |
"action_history": "Step 0: Tapped at pixel coordinates (x,y): [382, 838]\nStep 1: Tapped at pixel coordinates (x,y): [224, 776]\nStep 2: Tapped at pixel coordinates (x,y): [420, 775]\nStep 3: Tapped at pixel coordinates (x,y): [468, 64]", | |
"ground_truth_format": "mcq", | |
"questions": { | |
"question": "Based on the goal and screen, what is the precise next action to perform?", | |
"options": [ | |
"Swipe: Right", | |
"Tap: [44, 78]", | |
"Type: 'search'", | |
"Button: Press Enter" | |
], | |
"correct_answer_index": 1 | |
} | |
}, | |
{ | |
"step_id": 5, | |
"screenshot_path": "./aitw_gemini_images/episode_12172380859428428757_step_5.png", | |
"action_history": "Step 0: Tapped at pixel coordinates (x,y): [382, 838]\nStep 1: Tapped at pixel coordinates (x,y): [224, 776]\nStep 2: Tapped at pixel coordinates (x,y): [420, 775]\nStep 3: Tapped at pixel coordinates (x,y): [468, 64]\nStep 4: Tapped at pixel coordinates (x,y): [44, 78]", | |
"ground_truth_format": "mcq", | |
"questions": { | |
"question": "Based on the goal and screen, what is the precise next action to perform?", | |
"options": [ | |
"Type: 'new private window'", | |
"Tap: [515, 522]", | |
"Tap: [515, 62]", | |
"Tap: [467, 62]" | |
], | |
"correct_answer_index": 3 | |
} | |
}, | |
{ | |
"step_id": 6, | |
"screenshot_path": "./aitw_gemini_images/episode_12172380859428428757_step_6.png", | |
"action_history": "Step 0: Tapped at pixel coordinates (x,y): [382, 838]\nStep 1: Tapped at pixel coordinates (x,y): [224, 776]\nStep 2: Tapped at pixel coordinates (x,y): [420, 775]\nStep 3: Tapped at pixel coordinates (x,y): [468, 64]\nStep 4: Tapped at pixel coordinates (x,y): [44, 78]\nStep 5: Tapped at pixel coordinates (x,y): [467, 62]", | |
"ground_truth_format": "mcq", | |
"questions": { | |
"question": "Based on the goal and screen, what is the precise next action to perform?", | |
"options": [ | |
"Tap: [490, 114]", | |
"Swipe: Down", | |
"Tap: [150, 78]", | |
"Tap: [514, 64]" | |
], | |
"correct_answer_index": 3 | |
} | |
}, | |
{ | |
"step_id": 7, | |
"screenshot_path": "./aitw_gemini_images/episode_12172380859428428757_step_7.png", | |
"action_history": "Step 0: Tapped at pixel coordinates (x,y): [382, 838]\nStep 1: Tapped at pixel coordinates (x,y): [224, 776]\nStep 2: Tapped at pixel coordinates (x,y): [420, 775]\nStep 3: Tapped at pixel coordinates (x,y): [468, 64]\nStep 4: Tapped at pixel coordinates (x,y): [44, 78]\nStep 5: Tapped at pixel coordinates (x,y): [467, 62]\nStep 6: Tapped at pixel coordinates (x,y): [514, 64]", | |
"ground_truth_format": "mcq", | |
"questions": { | |
"question": "Based on the goal and screen, what is the precise next action to perform?", | |
"options": [ | |
"Tap: [370, 127]", | |
"Tap: [370, 298]", | |
"Button: Press Back", | |
"Tap: [370, 70]" | |
], | |
"correct_answer_index": 0 | |
} | |
}, | |
{ | |
"step_id": 8, | |
"screenshot_path": "./aitw_gemini_images/episode_12172380859428428757_step_8.png", | |
"action_history": "Step 0: Tapped at pixel coordinates (x,y): [382, 838]\nStep 1: Tapped at pixel coordinates (x,y): [224, 776]\nStep 2: Tapped at pixel coordinates (x,y): [420, 775]\nStep 3: Tapped at pixel coordinates (x,y): [468, 64]\nStep 4: Tapped at pixel coordinates (x,y): [44, 78]\nStep 5: Tapped at pixel coordinates (x,y): [467, 62]\nStep 6: Tapped at pixel coordinates (x,y): [514, 64]\nStep 7: Tapped at pixel coordinates (x,y): [370, 127]", | |
"ground_truth_format": "mcq", | |
"questions": { | |
"question": "Based on the goal and screen, what is the precise next action to perform?", | |
"options": [ | |
"Tap: [270, 80]", | |
"Button: Press Back", | |
"Tap: [450, 80]", | |
"Button: Unknown" | |
], | |
"correct_answer_index": 3 | |
} | |
} | |
] | |
}, | |
"9027843537045096280": { | |
"episode_goal": "Open a new Chrome window", | |
"steps": [ | |
{ | |
"step_id": 0, | |
"screenshot_path": "./aitw_gemini_images/episode_9027843537045096280_step_0.png", | |
"action_history": "", | |
"ground_truth_format": "mcq", | |
"questions": { | |
"question": "Based on the goal and screen, what is the precise next action to perform?", | |
"options": [ | |
"Button: Press Back", | |
"Type: 'search'", | |
"Swipe: Left", | |
"Button: Press Home" | |
], | |
"correct_answer_index": 3 | |
} | |
}, | |
{ | |
"step_id": 1, | |
"screenshot_path": "./aitw_gemini_images/episode_9027843537045096280_step_1.png", | |
"action_history": "Step 0: Pressed Button: Press Home", | |
"ground_truth_format": "mcq", | |
"questions": { | |
"question": "Based on the goal and screen, what is the precise next action to perform?", | |
"options": [ | |
"Tap: [90, 960]", | |
"Tap: [278, 826]", | |
"Tap: [365, 826]", | |
"Swipe: Up" | |
], | |
"correct_answer_index": 2 | |
} | |
}, | |
{ | |
"step_id": 2, | |
"screenshot_path": "./aitw_gemini_images/episode_9027843537045096280_step_2.png", | |
"action_history": "Step 0: Pressed Button: Press Home\nStep 1: Tapped at pixel coordinates (x,y): [365, 826]", | |
"ground_truth_format": "mcq", | |
"questions": { | |
"question": "Based on the goal and screen, what is the precise next action to perform?", | |
"options": [ | |
"Tap: [46, 86]", | |
"Type: 'new tab'", | |
"Button: Unknown", | |
"Button: Press Back" | |
], | |
"correct_answer_index": 2 | |
} | |
} | |
] | |
}, | |
"2247237893045084693": { | |
"episode_goal": "Open the calendar and show me this week's events?", | |
"steps": [ | |
{ | |
"step_id": 0, | |
"screenshot_path": "./aitw_gemini_images/episode_2247237893045084693_step_0.png", | |
"action_history": "", | |
"ground_truth_format": "mcq", | |
"questions": { | |
"question": "Based on the goal and screen, what is the precise next action to perform?", | |
"options": [ | |
"Swipe: Swipe Down", | |
"Swipe: Swipe Up", | |
"Tap: [270, 880]", | |
"Tap: [114, 153]" | |
], | |
"correct_answer_index": 1 | |
} | |
}, | |
{ | |
"step_id": 1, | |
"screenshot_path": "./aitw_gemini_images/episode_2247237893045084693_step_1.png", | |
"action_history": "Step 0: Swiped: Swipe Up", | |
"ground_truth_format": "mcq", | |
"questions": { | |
"question": "Based on the goal and screen, what is the precise next action to perform?", | |
"options": [ | |
"Tap: [379, 183]", | |
"Tap: [75, 345]", | |
"Tap: [275, 183]", | |
"Type: 'Calendar'" | |
], | |
"correct_answer_index": 0 | |
} | |
}, | |
{ | |
"step_id": 2, | |
"screenshot_path": "./aitw_gemini_images/episode_2247237893045084693_step_2.png", | |
"action_history": "Step 0: Swiped: Swipe Up\nStep 1: Tapped at pixel coordinates (x,y): [379, 183]", | |
"ground_truth_format": "mcq", | |
"questions": { | |
"question": "Based on the goal and screen, what is the precise next action to perform?", | |
"options": [ | |
"Tap: [270, 315]", | |
"Tap: [440, 976]", | |
"Swipe: Left", | |
"Tap: [499, 976]" | |
], | |
"correct_answer_index": 3 | |
} | |
}, | |
{ | |
"step_id": 3, | |
"screenshot_path": "./aitw_gemini_images/episode_2247237893045084693_step_3.png", | |
"action_history": "Step 0: Swiped: Swipe Up\nStep 1: Tapped at pixel coordinates (x,y): [379, 183]\nStep 2: Tapped at pixel coordinates (x,y): [499, 976]", | |
"ground_truth_format": "mcq", | |
"questions": { | |
"question": "Based on the goal and screen, what is the precise next action to perform?", | |
"options": [ | |
"Tap: [302, 950]", | |
"Swipe: Down", | |
"Tap: [425, 950]", | |
"Tap: [270, 600]" | |
], | |
"correct_answer_index": 0 | |
} | |
}, | |
{ | |
"step_id": 4, | |
"screenshot_path": "./aitw_gemini_images/episode_2247237893045084693_step_4.png", | |
"action_history": "Step 0: Swiped: Swipe Up\nStep 1: Tapped at pixel coordinates (x,y): [379, 183]\nStep 2: Tapped at pixel coordinates (x,y): [499, 976]\nStep 3: Tapped at pixel coordinates (x,y): [302, 950]", | |
"ground_truth_format": "mcq", | |
"questions": { | |
"question": "Based on the goal and screen, what is the precise next action to perform?", | |
"options": [ | |
"Swipe: Right", | |
"Tap: [453, 86]", | |
"Tap: [140, 184]", | |
"Button: Unknown" | |
], | |
"correct_answer_index": 3 | |
} | |
} | |
] | |
}, | |
"12224608131504749719": { | |
"episode_goal": "How much does a 2x4x8 board cost at Lowes?", | |
"steps": [ | |
{ | |
"step_id": 0, | |
"screenshot_path": "./aitw_gemini_images/episode_12224608131504749719_step_0.png", | |
"action_history": "", | |
"ground_truth_format": "mcq", | |
"questions": { | |
"question": "Based on the goal and screen, what is the precise next action to perform?", | |
"options": [ | |
"Tap: [375, 790]", | |
"Swipe: Swipe Up", | |
"Tap: [270, 882]", | |
"Swipe: Swipe Down" | |
], | |
"correct_answer_index": 1 | |
} | |
}, | |
{ | |
"step_id": 1, | |
"screenshot_path": "./aitw_gemini_images/episode_12224608131504749719_step_1.png", | |
"action_history": "Step 0: Swiped: Swipe Up", | |
"ground_truth_format": "mcq", | |
"questions": { | |
"question": "Based on the goal and screen, what is the precise next action to perform?", | |
"options": [ | |
"Button: Press Back", | |
"Button: Press Home", | |
"Type: 'how much does a 2x4x8 board cost at lowes'", | |
"Tap: [337, 362]" | |
], | |
"correct_answer_index": 1 | |
} | |
}, | |
{ | |
"step_id": 2, | |
"screenshot_path": "./aitw_gemini_images/episode_12224608131504749719_step_2.png", | |
"action_history": "Step 0: Swiped: Swipe Up\nStep 1: Pressed Button: Press Home", | |
"ground_truth_format": "mcq", | |
"questions": { | |
"question": "Based on the goal and screen, what is the precise next action to perform?", | |
"options": [ | |
"Tap: [405, 853]", | |
"Type: 'How much does a 2x4x8 board cost at Lowes?'", | |
"Tap: [475, 950]", | |
"Tap: [289, 950]" | |
], | |
"correct_answer_index": 3 | |
} | |
}, | |
{ | |
"step_id": 3, | |
"screenshot_path": "./aitw_gemini_images/episode_12224608131504749719_step_3.png", | |
"action_history": "Step 0: Swiped: Swipe Up\nStep 1: Pressed Button: Press Home\nStep 2: Tapped at pixel coordinates (x,y): [289, 950]", | |
"ground_truth_format": "mcq", | |
"questions": { | |
"question": "Based on the goal and screen, what is the precise next action to perform?", | |
"options": [ | |
"Tap: [495, 85]", | |
"Type: 'how much does a 2 bedroom apartment rent for in house'", | |
"Type: 'How much does a 2x4x8 board cost at Lowes?'", | |
"Button: Press Back" | |
], | |
"correct_answer_index": 2 | |
} | |
}, | |
{ | |
"step_id": 4, | |
"screenshot_path": "./aitw_gemini_images/episode_12224608131504749719_step_4.png", | |
"action_history": "Step 0: Swiped: Swipe Up\nStep 1: Pressed Button: Press Home\nStep 2: Tapped at pixel coordinates (x,y): [289, 950]\nStep 3: Typed: 'How much does a 2x4x8 board cost at Lowes?'", | |
"ground_truth_format": "mcq", | |
"questions": { | |
"question": "Based on the goal and screen, what is the precise next action to perform?", | |
"options": [ | |
"Tap: [280, 198]", | |
"Tap: [504, 82]", | |
"Button: Press Enter", | |
"Tap: [286, 129]" | |
], | |
"correct_answer_index": 3 | |
} | |
}, | |
{ | |
"step_id": 5, | |
"screenshot_path": "./aitw_gemini_images/episode_12224608131504749719_step_5.png", | |
"action_history": "Step 0: Swiped: Swipe Up\nStep 1: Pressed Button: Press Home\nStep 2: Tapped at pixel coordinates (x,y): [289, 950]\nStep 3: Typed: 'How much does a 2x4x8 board cost at Lowes?'\nStep 4: Tapped at pixel coordinates (x,y): [286, 129]", | |
"ground_truth_format": "mcq", | |
"questions": { | |
"question": "Based on the goal and screen, what is the precise next action to perform?", | |
"options": [ | |
"Swipe: Down", | |
"Tap: [270, 830]", | |
"Tap: [490, 129]", | |
"Button: Unknown" | |
], | |
"correct_answer_index": 3 | |
} | |
} | |
] | |
}, | |
"1307957808436696980": { | |
"episode_goal": "Google the capital of Mexico", | |
"steps": [ | |
{ | |
"step_id": 0, | |
"screenshot_path": "./aitw_gemini_images/episode_1307957808436696980_step_0.png", | |
"action_history": "", | |
"ground_truth_format": "mcq", | |
"questions": { | |
"question": "Based on the goal and screen, what is the precise next action to perform?", | |
"options": [ | |
"Tap: [175, 178]", | |
"Button: Press Back", | |
"Button: Press Home", | |
"Tap: [52, 83]" | |
], | |
"correct_answer_index": 2 | |
} | |
}, | |
{ | |
"step_id": 1, | |
"screenshot_path": "./aitw_gemini_images/episode_1307957808436696980_step_1.png", | |
"action_history": "Step 0: Pressed Button: Press Home", | |
"ground_truth_format": "mcq", | |
"questions": { | |
"question": "Based on the goal and screen, what is the precise next action to perform?", | |
"options": [ | |
"Tap: [270, 915]", | |
"Swipe: Swipe Down", | |
"Tap: [373, 801]", | |
"Swipe: Swipe Up" | |
], | |
"correct_answer_index": 3 | |
} | |
}, | |
{ | |
"step_id": 2, | |
"screenshot_path": "./aitw_gemini_images/episode_1307957808436696980_step_2.png", | |
"action_history": "Step 0: Pressed Button: Press Home\nStep 1: Swiped: Swipe Up", | |
"ground_truth_format": "mcq", | |
"questions": { | |
"question": "Based on the goal and screen, what is the precise next action to perform?", | |
"options": [ | |
"Button: Press Home", | |
"Type: 'capital of Mexico'", | |
"Button: Press Back", | |
"Tap: [270, 100]" | |
], | |
"correct_answer_index": 0 | |
} | |
}, | |
{ | |
"step_id": 3, | |
"screenshot_path": "./aitw_gemini_images/episode_1307957808436696980_step_3.png", | |
"action_history": "Step 0: Pressed Button: Press Home\nStep 1: Swiped: Swipe Up\nStep 2: Pressed Button: Press Home", | |
"ground_truth_format": "mcq", | |
"questions": { | |
"question": "Based on the goal and screen, what is the precise next action to perform?", | |
"options": [ | |
"Type: 'capital of Mexico'", | |
"Swipe: Up", | |
"Tap: [320, 974]", | |
"Tap: [398, 866]" | |
], | |
"correct_answer_index": 2 | |
} | |
}, | |
{ | |
"step_id": 4, | |
"screenshot_path": "./aitw_gemini_images/episode_1307957808436696980_step_4.png", | |
"action_history": "Step 0: Pressed Button: Press Home\nStep 1: Swiped: Swipe Up\nStep 2: Pressed Button: Press Home\nStep 3: Tapped at pixel coordinates (x,y): [320, 974]", | |
"ground_truth_format": "mcq", | |
"questions": { | |
"question": "Based on the goal and screen, what is the precise next action to perform?", | |
"options": [ | |
"Button: Press Back", | |
"Type: 'Google the capital of Mexico'", | |
"Tap: [484, 86]", | |
"Type: 'Mexico City'" | |
], | |
"correct_answer_index": 1 | |
} | |
}, | |
{ | |
"step_id": 5, | |
"screenshot_path": "./aitw_gemini_images/episode_1307957808436696980_step_5.png", | |
"action_history": "Step 0: Pressed Button: Press Home\nStep 1: Swiped: Swipe Up\nStep 2: Pressed Button: Press Home\nStep 3: Tapped at pixel coordinates (x,y): [320, 974]\nStep 4: Typed: 'Google the capital of Mexico'", | |
"ground_truth_format": "mcq", | |
"questions": { | |
"question": "Based on the goal and screen, what is the precise next action to perform?", | |
"options": [ | |
"Button: Press Enter", | |
"Swipe: Up", | |
"Type: 'search'", | |
"Tap: [185, 114]" | |
], | |
"correct_answer_index": 3 | |
} | |
}, | |
{ | |
"step_id": 6, | |
"screenshot_path": "./aitw_gemini_images/episode_1307957808436696980_step_6.png", | |
"action_history": "Step 0: Pressed Button: Press Home\nStep 1: Swiped: Swipe Up\nStep 2: Pressed Button: Press Home\nStep 3: Tapped at pixel coordinates (x,y): [320, 974]\nStep 4: Typed: 'Google the capital of Mexico'\nStep 5: Tapped at pixel coordinates (x,y): [185, 114]", | |
"ground_truth_format": "mcq", | |
"questions": { | |
"question": "Based on the goal and screen, what is the precise next action to perform?", | |
"options": [ | |
"Type: 'search'", | |
"Button: Press Enter", | |
"Button: Unknown", | |
"Swipe: Left" | |
], | |
"correct_answer_index": 2 | |
} | |
} | |
] | |
} | |
} |