diff --git "a/eval_milebench/ActionPrediction/pred.json" "b/eval_milebench/ActionPrediction/pred.json" new file mode 100644--- /dev/null +++ "b/eval_milebench/ActionPrediction/pred.json" @@ -0,0 +1,2402 @@ +[ + { + "sample_id": 0, + "question": "Infer the next action of the person from the presented images. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the pillow.\nB. Open the door.\nC. Take the book.\nD. Open the closet/cabinet.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Put down the pillow.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "A" + }, + { + "sample_id": 56, + "question": "Infer the next action of the person from the presented images. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Tidy up the clothes.\nB. Eat the sandwich.\nC. Put down the phone/camera.\nD. Throw the pillow.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Throw the pillow.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "D" + }, + { + "sample_id": 1, + "question": "Analyze the provided visuals and forecast the individual's subsequent move. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Sit on the floor.\nB. Put down the cup/glass/bottle.\nC. Take the book.\nD. Open the book.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Open the book.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "D" + }, + { + "sample_id": 16, + "question": "Evaluate the given images and infer the individual's next step. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the towel.\nB. Close the laptop.\nC. Close the door.\nD. Hold the book.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Close the laptop.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "C" + }, + { + "sample_id": 33, + "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the door.\nB. Take the laptop.\nC. Take the cup/glass/bottle.\nD. Throw the food.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Take the laptop.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "B" + }, + { + "sample_id": 2, + "question": "Analyze the provided visuals and forecast the individual's subsequent move. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the cup/glass/bottle.\nB. Take the book.\nC. Eat the sandwich.\nD. Put down the dish.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Take the book.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "B" + }, + { + "sample_id": 23, + "question": "Based on the given images, prediction the person's next action You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the laptop.\nB. Lie on the sofa/couch.\nC. Close the box.\nD. Take the phone/camera.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Open the laptop.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "A" + }, + { + "sample_id": 25, + "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Close the box.\nB. Put down the food.\nC. Take the paper/notebook.\nD. Open the bag.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Open the bag.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "D" + }, + { + "sample_id": 28, + "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next with the dish?\nChoice list: \nA. Wash.\nB. Put down.\nC. Hold.\nD. Take.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Put down.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "B" + }, + { + "sample_id": 3, + "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Tidy up the broom.\nB. Put down the clothes.\nC. Put down the food.\nD. Throw the blanket.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Throw the blanket.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "D" + }, + { + "sample_id": 18, + "question": "Based on the given images, prediction the person's next action You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the door.\nB. Sit at the table.\nC. Take the food.\nD. Take the dish.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Sit at the table.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "C" + }, + { + "sample_id": 37, + "question": "Infer the next action of the person from the presented images. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the food.\nB. Close the door.\nC. Close the window.\nD. Open the window.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Close the window.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "C" + }, + { + "sample_id": 42, + "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the dish.\nB. Take the food.\nC. Throw the pillow.\nD. Eat the medicine.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Throw the pillow.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "C" + }, + { + "sample_id": 4, + "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Tidy up the table.\nB. Open the box.\nC. Tidy up the closet/cabinet.\nD. Hold the dish.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Tidy up the closet/cabinet.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "C" + }, + { + "sample_id": 14, + "question": "With the given visuals as your guide, infer the individual's impending action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Eat the sandwich.\nB. Take the phone/camera.\nC. Take the blanket.\nD. Eat the medicine.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Take the blanket.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "C" + }, + { + "sample_id": 21, + "question": "Infer the next action of the person from the presented images. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Hold the laptop.\nB. Sit on the sofa/couch.\nC. Take the shoe.\nD. Take the phone/camera.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Take the shoe.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "C" + }, + { + "sample_id": 38, + "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Throw the bag.\nB. Put down the towel.\nC. Eat the sandwich.\nD. Sit at the table.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Throw the bag.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "A" + }, + { + "sample_id": 50, + "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the picture.\nB. Put down the phone/camera.\nC. Hold the box.\nD. Take the blanket.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Take the picture.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "A" + }, + { + "sample_id": 57, + "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Eat the medicine.\nB. Put down the towel.\nC. Put down the paper/notebook.\nD. Open the refrigerator.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Eat the medicine.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "A" + }, + { + "sample_id": 75, + "question": "Infer the next action of the person from the presented images. You must choose your answer from the Choice List.\nWhat will the person do next with the shoe?\nChoice list: \nA. Sit on.\nB. Take.\nC. Throw.\nD. Put down.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Put down.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "B" + }, + { + "sample_id": 5, + "question": "With the given visuals as your guide, infer the individual's impending action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the shoe.\nB. Sit on the table.\nC. Take the paper/notebook.\nD. Throw the clothes.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Take the paper/notebook.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "C" + }, + { + "sample_id": 43, + "question": "With the given visuals as your guide, infer the individual's impending action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the picture.\nB. Sit on the sofa/couch.\nC. Throw the clothes.\nD. Put down the cup/glass/bottle.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Put down the cup/glass/bottle.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "D" + }, + { + "sample_id": 60, + "question": "Infer the next action of the person from the presented images. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the box.\nB. Put down the broom.\nC. Put down the towel.\nD. Take the clothes.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Put down the towel.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "C" + }, + { + "sample_id": 6, + "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next with the sofa/couch?\nChoice list: \nA. Take.\nB. Sit on.\nC. Tidy up.\nD. Lie on.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Lie on.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "B" + }, + { + "sample_id": 29, + "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Close the door.\nB. Take the picture.\nC. Lie on the sofa/couch.\nD. Open the door.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Lie on the sofa/couch.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "C" + }, + { + "sample_id": 7, + "question": "Study the provided images and predict the individual's forthcoming behavior. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the clothes.\nB. Put down the bag.\nC. Sit on the table.\nD. Take the book.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Take the clothes.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "A" + }, + { + "sample_id": 8, + "question": "Using the given pictures as a reference, anticipate the person's upcoming action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Throw the shoe.\nB. Put down the laptop.\nC. Put down the dish.\nD. Open the bag.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Put down the laptop.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "B" + }, + { + "sample_id": 47, + "question": "Evaluate the given images and infer the individual's next step. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the picture.\nB. Take the book.\nC. Put down the blanket.\nD. Sit on the floor.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Put down the blanket.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "C" + }, + { + "sample_id": 9, + "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Close the closet/cabinet.\nB. Tidy up the broom.\nC. Throw the pillow.\nD. Take the bag.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Take the bag.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "D" + }, + { + "sample_id": 10, + "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the bag.\nB. Take the food.\nC. Take the phone/camera.\nD. Put down the shoe.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Put down the bag.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "A" + }, + { + "sample_id": 11, + "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the picture.\nB. Eat the medicine.\nC. Tidy up the table.\nD. Close the closet/cabinet.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Take the picture.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "A" + }, + { + "sample_id": 12, + "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the broom.\nB. Open the bag.\nC. Take the cup/glass/bottle.\nD. Put down the paper/notebook.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Put down the paper/notebook.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "D" + }, + { + "sample_id": 13, + "question": "Using the given pictures as a reference, anticipate the person's upcoming action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the bag.\nB. Wash the window.\nC. Tidy up the blanket.\nD. Sit on the sofa/couch.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Wash the window.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "A" + }, + { + "sample_id": 15, + "question": "Evaluate the given images and infer the individual's next step. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the shoe.\nB. Open the book.\nC. Take the shoe.\nD. Open the box.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Open the box.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "B" + }, + { + "sample_id": 85, + "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the book.\nB. Take the bag.\nC. Put down the paper/notebook.\nD. Open the laptop.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Open the laptop.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "B" + }, + { + "sample_id": 17, + "question": "Infer the next action of the person from the presented images. You must choose your answer from the Choice List.\nWhat will the person do next with the blanket?\nChoice list: \nA. Tidy up.\nB. Sit on.\nC. Put down.\nD. Take.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Put down.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "B" + }, + { + "sample_id": 22, + "question": "Based on the given images, prediction the person's next action You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Close the box.\nB. Put down the towel.\nC. Take the laptop.\nD. Close the closet/cabinet.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Put down the towel.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "B" + }, + { + "sample_id": 24, + "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the closet/cabinet.\nB. Put down the phone/camera.\nC. Open the book.\nD. Open the bag.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Put down the phone/camera.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "B" + }, + { + "sample_id": 26, + "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the closet/cabinet.\nB. Open the door.\nC. Close the closet/cabinet.\nD. Tidy up the clothes.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Close the closet/cabinet.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "B" + }, + { + "sample_id": 31, + "question": "Evaluate the given images and infer the individual's next step. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Close the window.\nB. Close the refrigerator.\nC. Sit on the sofa/couch.\nD. Open the closet/cabinet.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Sit on the sofa/couch.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "C" + }, + { + "sample_id": 34, + "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the cup/glass/bottle.\nB. Put down the broom.\nC. Open the bag.\nD. Lie on the sofa/couch.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Open the bag.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "C" + }, + { + "sample_id": 35, + "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Sit on the floor.\nB. Open the bag.\nC. Lie on the bed.\nD. Tidy up the table.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Sit on the floor.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "A" + }, + { + "sample_id": 51, + "question": "Evaluate the given images and infer the individual's next step. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Wash the window.\nB. Sit at the table.\nC. Throw the book.\nD. Throw the pillow.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Throw the book.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "D" + }, + { + "sample_id": 58, + "question": "With the given visuals as your guide, infer the individual's impending action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Throw the blanket.\nB. Take the phone/camera.\nC. Close the door.\nD. Open the closet/cabinet.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Take the phone/camera.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "B" + }, + { + "sample_id": 65, + "question": "Infer the next action of the person from the presented images. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the door.\nB. Take the shoe.\nC. Take the book.\nD. Eat the sandwich.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Eat the sandwich.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "D" + }, + { + "sample_id": 67, + "question": "Study the provided images and predict the individual's forthcoming behavior. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Wash the mirror.\nB. Close the box.\nC. Put down the towel.\nD. Open the door.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Put down the towel.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "C" + }, + { + "sample_id": 68, + "question": "Study the provided images and predict the individual's forthcoming behavior. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the closet/cabinet.\nB. Eat the medicine.\nC. Tidy up the table.\nD. Put down the shoe.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Put down the shoe.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "D" + }, + { + "sample_id": 20, + "question": "Study the provided images and predict the individual's forthcoming behavior. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Wash the table.\nB. Lie on the floor.\nC. Put down the towel.\nD. Take the box.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Wash the table.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "D" + }, + { + "sample_id": 27, + "question": "Evaluate the given images and infer the individual's next step. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Close the refrigerator.\nB. Open the refrigerator.\nC. Throw the clothes.\nD. Close the closet/cabinet.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Close the refrigerator.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "A" + }, + { + "sample_id": 32, + "question": "Evaluate the given images and infer the individual's next step. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Close the closet/cabinet.\nB. Put down the paper/notebook.\nC. Take the dish.\nD. Take the food.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Put down the paper/notebook.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "B" + }, + { + "sample_id": 36, + "question": "Based on the given images, prediction the person's next action You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Close the laptop.\nB. Open the book.\nC. Sit on the bed.\nD. Put down the paper/notebook.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Close the laptop.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "A" + }, + { + "sample_id": 41, + "question": "Using the given pictures as a reference, anticipate the person's upcoming action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Throw the blanket.\nB. Eat the medicine.\nC. Lie on the sofa/couch.\nD. Put down the box.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Throw the blanket.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "A" + }, + { + "sample_id": 44, + "question": "Using the given pictures as a reference, anticipate the person's upcoming action. You must choose your answer from the Choice List.\nWhat will the person do next with the blanket?\nChoice list: \nA. Put down.\nB. Take.\nC. Hold.\nD. Throw.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Put down.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "B" + }, + { + "sample_id": 46, + "question": "With the given visuals as your guide, infer the individual's impending action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the clothes.\nB. Tidy up the clothes.\nC. Take the bag.\nD. Lie on the sofa/couch.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Lie on the sofa/couch.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "D" + }, + { + "sample_id": 49, + "question": "Based on the given images, prediction the person's next action You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Lie on the sofa/couch.\nB. Close the box.\nC. Lie on the floor.\nD. Hold the book.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Lie on the sofa/couch.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "A" + }, + { + "sample_id": 52, + "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the pillow.\nB. Lie on the bed.\nC. Close the window.\nD. Wash the cup/glass/bottle.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Close the window.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "C" + }, + { + "sample_id": 53, + "question": "Study the provided images and predict the individual's forthcoming behavior. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Throw the towel.\nB. Eat the sandwich.\nC. Put down the broom.\nD. Open the book.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Throw the towel.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "A" + }, + { + "sample_id": 59, + "question": "With the given visuals as your guide, infer the individual's impending action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Wash the cup/glass/bottle.\nB. Take the bag.\nC. Throw the pillow.\nD. Take the food.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Take the bag.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "D" + }, + { + "sample_id": 61, + "question": "Study the provided images and predict the individual's forthcoming behavior. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Wash the table.\nB. Eat the medicine.\nC. Throw the shoe.\nD. Take the blanket.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Take the blanket.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "D" + }, + { + "sample_id": 70, + "question": "Infer the next action of the person from the presented images. You must choose your answer from the Choice List.\nWhat will the person do next with the cup/glass/bottle?\nChoice list: \nA. Put down.\nB. Wash.\nC. Close.\nD. Take.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Put down.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "A" + }, + { + "sample_id": 141, + "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the clothes.\nB. Wash the mirror.\nC. Take the bag.\nD. Put down the phone/camera.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Put down the phone/camera.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "D" + }, + { + "sample_id": 82, + "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Close the refrigerator.\nB. Take the book.\nC. Open the bag.\nD. Tidy up the blanket.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Close the refrigerator.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "A" + }, + { + "sample_id": 89, + "question": "Using the given pictures as a reference, anticipate the person's upcoming action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the bag.\nB. Throw the shoe.\nC. Put down the cup/glass/bottle.\nD. Put down the towel.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Put down the towel.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "D" + }, + { + "sample_id": 98, + "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Tidy up the towel.\nB. Hold the blanket.\nC. Eat the sandwich.\nD. Take the dish.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Eat the sandwich.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "C" + }, + { + "sample_id": 111, + "question": "Analyze the provided visuals and forecast the individual's subsequent move. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the clothes.\nB. Put down the picture.\nC. Tidy up the blanket.\nD. Open the bag.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Open the bag.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "D" + }, + { + "sample_id": 133, + "question": "Based on the given images, prediction the person's next action You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Close the refrigerator.\nB. Open the door.\nC. Tidy up the clothes.\nD. Take the book.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Close the refrigerator.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "A" + }, + { + "sample_id": 134, + "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Close the book.\nB. Take the pillow.\nC. Put down the picture.\nD. Close the box.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Take the pillow.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "B" + }, + { + "sample_id": 138, + "question": "Based on the given images, prediction the person's next action You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the laptop.\nB. Take the phone/camera.\nC. Take the clothes.\nD. Open the laptop.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Put down the laptop.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "B" + }, + { + "sample_id": 150, + "question": "Using the given pictures as a reference, anticipate the person's upcoming action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the closet/cabinet.\nB. Wash the clothes.\nC. Take the book.\nD. Open the book.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Take the book.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "C" + }, + { + "sample_id": 158, + "question": "Evaluate the given images and infer the individual's next step. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the box.\nB. Take the dish.\nC. Put down the sandwich.\nD. Sit on the sofa/couch.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Sit on the sofa/couch.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "D" + }, + { + "sample_id": 164, + "question": "Study the provided images and predict the individual's forthcoming behavior. You must choose your answer from the Choice List.\nWhat will the person do next with the bed?\nChoice list: \nA. Eat.\nB. Take.\nC. Lie on.\nD. Sit on.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Lie on.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "C" + }, + { + "sample_id": 171, + "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Eat the medicine.\nB. Put down the food.\nC. Close the book.\nD. Put down the book.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Close the book.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "D" + }, + { + "sample_id": 174, + "question": "With the given visuals as your guide, infer the individual's impending action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Lie on the floor.\nB. Close the refrigerator.\nC. Open the box.\nD. Take the book.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Close the refrigerator.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "B" + }, + { + "sample_id": 194, + "question": "Using the given pictures as a reference, anticipate the person's upcoming action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the dish.\nB. Eat the medicine.\nC. Put down the clothes.\nD. Take the paper/notebook.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Take the dish.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "C" + }, + { + "sample_id": 62, + "question": "With the given visuals as your guide, infer the individual's impending action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Eat the medicine.\nB. Take the box.\nC. Take the book.\nD. Take the dish.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Take the box.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "A" + }, + { + "sample_id": 40, + "question": "Study the provided images and predict the individual's forthcoming behavior. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Eat the medicine.\nB. Take the shoe.\nC. Take the clothes.\nD. Throw the food.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Take the shoe.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "B" + }, + { + "sample_id": 64, + "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the phone/camera.\nB. Close the book.\nC. Take the towel.\nD. Throw the food.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Take the towel.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "C" + }, + { + "sample_id": 30, + "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the bag.\nB. Put down the shoe.\nC. Wash the dish.\nD. Sit on the sofa/couch.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Put down the shoe.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "B" + }, + { + "sample_id": 63, + "question": "With the given visuals as your guide, infer the individual's impending action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the book.\nB. Take the sandwich.\nC. Open the closet/cabinet.\nD. Hold the food.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Put down the book.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "A" + }, + { + "sample_id": 99, + "question": "Infer the next action of the person from the presented images. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Close the laptop.\nB. Put down the book.\nC. Throw the clothes.\nD. Lie on the sofa/couch.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Close the laptop.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "A" + }, + { + "sample_id": 45, + "question": "Analyze the provided visuals and forecast the individual's subsequent move. You must choose your answer from the Choice List.\nWhat will the person do next with the blanket?\nChoice list: \nA. Put down.\nB. Tidy up.\nC. Hold.\nD. Take.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Tidy up.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "A" + }, + { + "sample_id": 55, + "question": "Based on the given images, prediction the person's next action You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the box.\nB. Throw the food.\nC. Tidy up the towel.\nD. Sit on the sofa/couch.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Take the box.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "A" + }, + { + "sample_id": 81, + "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the book.\nB. Sit on the table.\nC. Take the food.\nD. Put down the box.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Put down the box.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "A" + }, + { + "sample_id": 94, + "question": "Using the given pictures as a reference, anticipate the person's upcoming action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the sandwich.\nB. Open the bag.\nC. Take the towel.\nD. Take the food.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Open the bag.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "D" + }, + { + "sample_id": 79, + "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the towel.\nB. Open the laptop.\nC. Wash the clothes.\nD. Sit on the bed.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Sit on the bed.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "D" + }, + { + "sample_id": 95, + "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the pillow.\nB. Take the book.\nC. Open the book.\nD. Open the closet/cabinet.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Take the pillow.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "B" + }, + { + "sample_id": 104, + "question": "Evaluate the given images and infer the individual's next step. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Sit on the sofa/couch.\nB. Take the phone/camera.\nC. Put down the box.\nD. Tidy up the clothes.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Put down the box.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "C" + }, + { + "sample_id": 106, + "question": "Infer the next action of the person from the presented images. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the sandwich.\nB. Open the refrigerator.\nC. Put down the phone/camera.\nD. Wash the window.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Take the sandwich.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "C" + }, + { + "sample_id": 108, + "question": "Study the provided images and predict the individual's forthcoming behavior. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the shoe.\nB. Take the food.\nC. Close the door.\nD. Put down the cup/glass/bottle.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Take the food.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "B" + }, + { + "sample_id": 116, + "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the bag.\nB. Put down the phone/camera.\nC. Put down the food.\nD. Close the book.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Put down the phone/camera.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "B" + }, + { + "sample_id": 122, + "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Sit on the bed.\nB. Sit on the sofa/couch.\nC. Throw the blanket.\nD. Take the paper/notebook.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Take the paper/notebook.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "D" + }, + { + "sample_id": 76, + "question": "Study the provided images and predict the individual's forthcoming behavior. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the broom.\nB. Put down the blanket.\nC. Close the refrigerator.\nD. Put down the bag.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Close the refrigerator.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "C" + }, + { + "sample_id": 84, + "question": "Infer the next action of the person from the presented images. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the cup/glass/bottle.\nB. Open the closet/cabinet.\nC. Put down the paper/notebook.\nD. Put down the phone/camera.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Put down the paper/notebook.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "C" + }, + { + "sample_id": 113, + "question": "Using the given pictures as a reference, anticipate the person's upcoming action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Throw the book.\nB. Wash the table.\nC. Throw the pillow.\nD. Take the food.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Throw the pillow.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "C" + }, + { + "sample_id": 127, + "question": "Infer the next action of the person from the presented images. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the book.\nB. Take the clothes.\nC. Eat the medicine.\nD. Close the closet/cabinet.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Take the clothes.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "B" + }, + { + "sample_id": 72, + "question": "Analyze the provided visuals and forecast the individual's subsequent move. You must choose your answer from the Choice List.\nWhat will the person do next with the food?\nChoice list: \nA. Open.\nB. Put down.\nC. Throw.\nD. Take.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Put down.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "D" + }, + { + "sample_id": 48, + "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Close the window.\nB. Take the towel.\nC. Take the shoe.\nD. Take the food.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Close the window.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "C" + }, + { + "sample_id": 73, + "question": "Study the provided images and predict the individual's forthcoming behavior. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the pillow.\nB. Tidy up the clothes.\nC. Take the box.\nD. Put down the dish.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Take the box.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "B" + }, + { + "sample_id": 120, + "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next with the bed?\nChoice list: \nA. Put down.\nB. Throw.\nC. Sit on.\nD. Lie on.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Sit on.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "C" + }, + { + "sample_id": 54, + "question": "Using the given pictures as a reference, anticipate the person's upcoming action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the laptop.\nB. Put down the dish.\nC. Sit on the floor.\nD. Take the box.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Put down the laptop.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "A" + }, + { + "sample_id": 135, + "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the blanket.\nB. Take the blanket.\nC. Wash the clothes.\nD. Put down the sandwich.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Put down the sandwich.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "D" + }, + { + "sample_id": 19, + "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Wash the window.\nB. Throw the clothes.\nC. Open the box.\nD. Put down the book.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Open the box.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "C" + }, + { + "sample_id": 121, + "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the dish.\nB. Take the clothes.\nC. Lie on the sofa/couch.\nD. Put down the pillow.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Take the clothes.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "A" + }, + { + "sample_id": 74, + "question": "Analyze the provided visuals and forecast the individual's subsequent move. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Eat the sandwich.\nB. Take the box.\nC. Put down the blanket.\nD. Put down the bag.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Put down the blanket.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "C" + }, + { + "sample_id": 77, + "question": "With the given visuals as your guide, infer the individual's impending action. You must choose your answer from the Choice List.\nWhat will the person do next with the table?\nChoice list: \nA. Take.\nB. Tidy up.\nC. Sit at.\nD. Wash.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Sit at.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "C" + }, + { + "sample_id": 80, + "question": "Analyze the provided visuals and forecast the individual's subsequent move. You must choose your answer from the Choice List.\nWhat will the person do next with the sofa/couch?\nChoice list: \nA. Put down.\nB. Lie on.\nC. Throw.\nD. Sit on.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Sit on.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "D" + }, + { + "sample_id": 83, + "question": "Based on the given images, prediction the person's next action You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the book.\nB. Open the closet/cabinet.\nC. Take the sandwich.\nD. Take the food.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Open the book.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "A" + }, + { + "sample_id": 88, + "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the shoe.\nB. Lie on the floor.\nC. Close the box.\nD. Tidy up the blanket.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Tidy up the blanket.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "A" + }, + { + "sample_id": 90, + "question": "Analyze the provided visuals and forecast the individual's subsequent move. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Tidy up the clothes.\nB. Take the pillow.\nC. Take the laptop.\nD. Take the box.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Take the laptop.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "B" + }, + { + "sample_id": 91, + "question": "With the given visuals as your guide, infer the individual's impending action. You must choose your answer from the Choice List.\nWhat will the person do next with the cup/glass/bottle?\nChoice list: \nA. Take.\nB. Eat.\nC. Put down.\nD. Wash.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Put down.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "A" + }, + { + "sample_id": 93, + "question": "Analyze the provided visuals and forecast the individual's subsequent move. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the phone/camera.\nB. Open the bag.\nC. Put down the blanket.\nD. Throw the food.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Put down the blanket.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "B" + }, + { + "sample_id": 97, + "question": "Infer the next action of the person from the presented images. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the sandwich.\nB. Put down the blanket.\nC. Take the cup/glass/bottle.\nD. Eat the sandwich.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Take the sandwich.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "D" + }, + { + "sample_id": 100, + "question": "Based on the given images, prediction the person's next action You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the book.\nB. Close the closet/cabinet.\nC. Put down the bag.\nD. Put down the paper/notebook.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Open the book.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "A" + }, + { + "sample_id": 103, + "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the box.\nB. Tidy up the blanket.\nC. Close the laptop.\nD. Put down the paper/notebook.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Close the laptop.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "C" + }, + { + "sample_id": 107, + "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Tidy up the blanket.\nB. Open the refrigerator.\nC. Open the closet/cabinet.\nD. Throw the box.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Open the refrigerator.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "B" + }, + { + "sample_id": 39, + "question": "Using the given pictures as a reference, anticipate the person's upcoming action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the cup/glass/bottle.\nB. Tidy up the blanket.\nC. Take the pillow.\nD. Put down the dish.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Take the pillow.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "C" + }, + { + "sample_id": 180, + "question": "Evaluate the given images and infer the individual's next step. You must choose your answer from the Choice List.\nWhat will the person do next with the cup/glass/bottle?\nChoice list: \nA. Take.\nB. Put down.\nC. Wash.\nD. Lie on.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Put down.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "A" + }, + { + "sample_id": 71, + "question": "Infer the next action of the person from the presented images. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the clothes.\nB. Lie on the floor.\nC. Sit on the table.\nD. Put down the towel.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Put down the towel.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "D" + }, + { + "sample_id": 145, + "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Throw the clothes.\nB. Close the window.\nC. Put down the food.\nD. Wash the clothes.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Throw the clothes.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "A" + }, + { + "sample_id": 117, + "question": "Study the provided images and predict the individual's forthcoming behavior. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the cup/glass/bottle.\nB. Wash the mirror.\nC. Open the box.\nD. Open the door.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Open the door.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "D" + }, + { + "sample_id": 195, + "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Throw the book.\nB. Take the towel.\nC. Close the door.\nD. Put down the book.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Put down the book.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "D" + }, + { + "sample_id": 149, + "question": "Infer the next action of the person from the presented images. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the sandwich.\nB. Take the dish.\nC. Wash the dish.\nD. Close the laptop.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Put down the sandwich.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "B" + }, + { + "sample_id": 163, + "question": "Based on the given images, prediction the person's next action You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Throw the food.\nB. Take the box.\nC. Put down the broom.\nD. Close the closet/cabinet.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Put down the broom.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "C" + }, + { + "sample_id": 137, + "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next with the food?\nChoice list: \nA. Hold.\nB. Throw.\nC. Take.\nD. Put down.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Put down.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "C" + }, + { + "sample_id": 185, + "question": "With the given visuals as your guide, infer the individual's impending action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the clothes.\nB. Put down the clothes.\nC. Put down the broom.\nD. Put down the picture.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Put down the broom.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "C" + }, + { + "sample_id": 129, + "question": "Study the provided images and predict the individual's forthcoming behavior. You must choose your answer from the Choice List.\nWhat will the person do next with the food?\nChoice list: \nA. Put down.\nB. Hold.\nC. Take.\nD. Throw.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Put down.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "C" + }, + { + "sample_id": 69, + "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the clothes.\nB. Take the dish.\nC. Hold the picture.\nD. Take the bag.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Take the bag.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "D" + }, + { + "sample_id": 87, + "question": "Evaluate the given images and infer the individual's next step. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Sit at the table.\nB. Close the window.\nC. Take the cup/glass/bottle.\nD. Eat the sandwich.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Eat the sandwich.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "D" + }, + { + "sample_id": 131, + "question": "Based on the given images, prediction the person's next action You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the food.\nB. Take the blanket.\nC. Eat the medicine.\nD. Open the refrigerator.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Take the blanket.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "A" + }, + { + "sample_id": 132, + "question": "Based on the given images, prediction the person's next action You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Wash the cup/glass/bottle.\nB. Put down the laptop.\nC. Put down the cup/glass/bottle.\nD. Put down the shoe.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Put down the shoe.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "D" + }, + { + "sample_id": 155, + "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the shoe.\nB. Take the book.\nC. Sit on the table.\nD. Take the box.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Take the shoe.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "A" + }, + { + "sample_id": 101, + "question": "Using the given pictures as a reference, anticipate the person's upcoming action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the door.\nB. Open the refrigerator.\nC. Tidy up the towel.\nD. Lie on the bed.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Open the refrigerator.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "B" + }, + { + "sample_id": 102, + "question": "Study the provided images and predict the individual's forthcoming behavior. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the cup/glass/bottle.\nB. Close the box.\nC. Put down the cup/glass/bottle.\nD. Open the laptop.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Open the laptop.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "D" + }, + { + "sample_id": 112, + "question": "Evaluate the given images and infer the individual's next step. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Lie on the bed.\nB. Put down the dish.\nC. Throw the clothes.\nD. Sit on the table.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Throw the clothes.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "C" + }, + { + "sample_id": 118, + "question": "Study the provided images and predict the individual's forthcoming behavior. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the book.\nB. Eat the sandwich.\nC. Open the door.\nD. Throw the blanket.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Take the book.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "A" + }, + { + "sample_id": 126, + "question": "Analyze the provided visuals and forecast the individual's subsequent move. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Close the book.\nB. Put down the pillow.\nC. Open the bag.\nD. Tidy up the clothes.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Put down the pillow.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "D" + }, + { + "sample_id": 128, + "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next with the food?\nChoice list: \nA. Hold.\nB. Put down.\nC. Take.\nD. Throw.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Put down.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "C" + }, + { + "sample_id": 130, + "question": "Using the given pictures as a reference, anticipate the person's upcoming action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Tidy up the closet/cabinet.\nB. Take the food.\nC. Close the refrigerator.\nD. Close the laptop.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Close the refrigerator.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "C" + }, + { + "sample_id": 148, + "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the box.\nB. Tidy up the clothes.\nC. Take the phone/camera.\nD. Open the bag.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Tidy up the clothes.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "D" + }, + { + "sample_id": 152, + "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Lie on the floor.\nB. Put down the shoe.\nC. Take the paper/notebook.\nD. Take the book.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Put down the shoe.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "B" + }, + { + "sample_id": 153, + "question": "Study the provided images and predict the individual's forthcoming behavior. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the clothes.\nB. Take the food.\nC. Close the book.\nD. Throw the box.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Close the book.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "C" + }, + { + "sample_id": 86, + "question": "Study the provided images and predict the individual's forthcoming behavior. You must choose your answer from the Choice List.\nWhat will the person do next with the table?\nChoice list: \nA. Close.\nB. Sit at.\nC. Tidy up.\nD. Wash.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Sit at.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "B" + }, + { + "sample_id": 96, + "question": "Analyze the provided visuals and forecast the individual's subsequent move. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the book.\nB. Eat the sandwich.\nC. Lie on the bed.\nD. Take the box.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Eat the sandwich.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "B" + }, + { + "sample_id": 146, + "question": "Evaluate the given images and infer the individual's next step. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the laptop.\nB. Put down the paper/notebook.\nC. Put down the picture.\nD. Hold the blanket.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Put down the picture.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "C" + }, + { + "sample_id": 78, + "question": "Analyze the provided visuals and forecast the individual's subsequent move. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Close the box.\nB. Take the phone/camera.\nC. Put down the book.\nD. Throw the clothes.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Close the box.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "A" + }, + { + "sample_id": 144, + "question": "With the given visuals as your guide, infer the individual's impending action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Lie on the sofa/couch.\nB. Open the door.\nC. Sit on the bed.\nD. Close the laptop.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Sit on the bed.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "C" + }, + { + "sample_id": 151, + "question": "Based on the given images, prediction the person's next action You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Lie on the sofa/couch.\nB. Put down the bag.\nC. Take the shoe.\nD. Take the towel.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Take the shoe.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "C" + }, + { + "sample_id": 161, + "question": "Based on the given images, prediction the person's next action You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the phone/camera.\nB. Take the clothes.\nC. Sit on the sofa/couch.\nD. Take the box.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Take the clothes.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "B" + }, + { + "sample_id": 66, + "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the cup/glass/bottle.\nB. Eat the sandwich.\nC. Lie on the floor.\nD. Open the closet/cabinet.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Open the closet/cabinet.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "D" + }, + { + "sample_id": 140, + "question": "Analyze the provided visuals and forecast the individual's subsequent move. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Close the door.\nB. Close the closet/cabinet.\nC. Tidy up the table.\nD. Take the dish.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Take the dish.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "D" + }, + { + "sample_id": 109, + "question": "Evaluate the given images and infer the individual's next step. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the box.\nB. Sit at the table.\nC. Take the sandwich.\nD. Lie on the sofa/couch.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Open the box.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "A" + }, + { + "sample_id": 110, + "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Throw the book.\nB. Throw the clothes.\nC. Wash the table.\nD. Open the door.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Throw the clothes.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "A" + }, + { + "sample_id": 114, + "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the bag.\nB. Hold the box.\nC. Throw the blanket.\nD. Sit on the sofa/couch.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Throw the blanket.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "C" + }, + { + "sample_id": 119, + "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the shoe.\nB. Throw the clothes.\nC. Open the book.\nD. Throw the bag.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Put down the shoe.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "A" + }, + { + "sample_id": 123, + "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Wash the dish.\nB. Open the closet/cabinet.\nC. Take the food.\nD. Throw the towel.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Throw the towel.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "B" + }, + { + "sample_id": 124, + "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next with the pillow?\nChoice list: \nA. Tidy up.\nB. Throw.\nC. Put down.\nD. Take.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Put down.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "D" + }, + { + "sample_id": 125, + "question": "Analyze the provided visuals and forecast the individual's subsequent move. You must choose your answer from the Choice List.\nWhat will the person do next with the blanket?\nChoice list: \nA. Put down.\nB. Throw.\nC. Lie on.\nD. Tidy up.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Tidy up.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "A" + }, + { + "sample_id": 136, + "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the door.\nB. Sit at the table.\nC. Lie on the sofa/couch.\nD. Throw the food.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Sit at the table.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "D" + }, + { + "sample_id": 142, + "question": "Analyze the provided visuals and forecast the individual's subsequent move. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the window.\nB. Open the book.\nC. Wash the mirror.\nD. Close the door.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Wash the mirror.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "C" + }, + { + "sample_id": 143, + "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the box.\nB. Take the book.\nC. Tidy up the broom.\nD. Put down the bag.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Put down the bag.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "D" + }, + { + "sample_id": 154, + "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Throw the box.\nB. Take the bag.\nC. Lie on the bed.\nD. Sit on the floor.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Lie on the bed.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "A" + }, + { + "sample_id": 182, + "question": "Based on the given images, prediction the person's next action You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the paper/notebook.\nB. Hold the phone/camera.\nC. Throw the blanket.\nD. Close the window.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Close the window.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "D" + }, + { + "sample_id": 139, + "question": "Study the provided images and predict the individual's forthcoming behavior. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the bag.\nB. Throw the bag.\nC. Open the door.\nD. Put down the pillow.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Put down the pillow.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "D" + }, + { + "sample_id": 179, + "question": "Using the given pictures as a reference, anticipate the person's upcoming action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the bag.\nB. Take the shoe.\nC. Put down the phone/camera.\nD. Throw the towel.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Put down the phone/camera.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "C" + }, + { + "sample_id": 186, + "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the box.\nB. Sit on the table.\nC. Close the refrigerator.\nD. Wash the cup/glass/bottle.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Open the box.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "A" + }, + { + "sample_id": 160, + "question": "Study the provided images and predict the individual's forthcoming behavior. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the food.\nB. Throw the blanket.\nC. Open the door.\nD. Tidy up the closet/cabinet.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Put down the food.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "A" + }, + { + "sample_id": 92, + "question": "Based on the given images, prediction the person's next action You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the phone/camera.\nB. Put down the bag.\nC. Throw the clothes.\nD. Open the closet/cabinet.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Throw the clothes.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "C" + }, + { + "sample_id": 199, + "question": "Evaluate the given images and infer the individual's next step. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Tidy up the clothes.\nB. Take the blanket.\nC. Open the door.\nD. Sit on the bed.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Tidy up the clothes.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "C" + }, + { + "sample_id": 157, + "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Wash the clothes.\nB. Put down the cup/glass/bottle.\nC. Take the food.\nD. Take the book.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Take the book.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "D" + }, + { + "sample_id": 183, + "question": "Evaluate the given images and infer the individual's next step. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Wash the window.\nB. Take the laptop.\nC. Close the box.\nD. Eat the medicine.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Take the laptop.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "D" + }, + { + "sample_id": 191, + "question": "Study the provided images and predict the individual's forthcoming behavior. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Wash the cup/glass/bottle.\nB. Put down the sandwich.\nC. Put down the shoe.\nD. Throw the book.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Throw the book.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "D" + }, + { + "sample_id": 147, + "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the box.\nB. Open the bag.\nC. Close the door.\nD. Throw the towel.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Open the bag.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "B" + }, + { + "sample_id": 167, + "question": "Using the given pictures as a reference, anticipate the person's upcoming action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the phone/camera.\nB. Close the door.\nC. Close the refrigerator.\nD. Throw the bag.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Take the phone/camera.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "A" + }, + { + "sample_id": 187, + "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the towel.\nB. Open the door.\nC. Put down the dish.\nD. Throw the broom.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Put down the towel.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "A" + }, + { + "sample_id": 168, + "question": "Evaluate the given images and infer the individual's next step. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the door.\nB. Close the door.\nC. Sit on the table.\nD. Put down the sandwich.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Put down the sandwich.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "D" + }, + { + "sample_id": 170, + "question": "Study the provided images and predict the individual's forthcoming behavior. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the phone/camera.\nB. Throw the bag.\nC. Put down the food.\nD. Open the laptop.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Open the laptop.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "D" + }, + { + "sample_id": 173, + "question": "Based on the given images, prediction the person's next action You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Close the laptop.\nB. Sit on the table.\nC. Throw the clothes.\nD. Take the dish.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Throw the clothes.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "C" + }, + { + "sample_id": 176, + "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Lie on the sofa/couch.\nB. Throw the clothes.\nC. Take the clothes.\nD. Close the closet/cabinet.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Take the clothes.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "C" + }, + { + "sample_id": 177, + "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Wash the mirror.\nB. Close the box.\nC. Throw the clothes.\nD. Take the sandwich.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Take the sandwich.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "D" + }, + { + "sample_id": 190, + "question": "With the given visuals as your guide, infer the individual's impending action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the book.\nB. Put down the cup/glass/bottle.\nC. Open the door.\nD. Close the door.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Put down the book.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "A" + }, + { + "sample_id": 115, + "question": "Using the given pictures as a reference, anticipate the person's upcoming action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the sandwich.\nB. Put down the book.\nC. Lie on the floor.\nD. Take the dish.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Put down the sandwich.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "B" + }, + { + "sample_id": 169, + "question": "Infer the next action of the person from the presented images. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the window.\nB. Take the food.\nC. Put down the clothes.\nD. Open the book.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Put down the clothes.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "C" + }, + { + "sample_id": 192, + "question": "Analyze the provided visuals and forecast the individual's subsequent move. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the box.\nB. Take the bag.\nC. Wash the table.\nD. Put down the dish.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Take the bag.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "B" + }, + { + "sample_id": 105, + "question": "Using the given pictures as a reference, anticipate the person's upcoming action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the dish.\nB. Take the book.\nC. Eat the sandwich.\nD. Throw the box.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Take the book.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "B" + }, + { + "sample_id": 165, + "question": "Evaluate the given images and infer the individual's next step. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Throw the bag.\nB. Take the book.\nC. Put down the phone/camera.\nD. Open the refrigerator.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Open the refrigerator.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "D" + }, + { + "sample_id": 198, + "question": "Using the given pictures as a reference, anticipate the person's upcoming action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the clothes.\nB. Close the door.\nC. Tidy up the table.\nD. Wash the clothes.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Take the clothes.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "A" + }, + { + "sample_id": 197, + "question": "Evaluate the given images and infer the individual's next step. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the cup/glass/bottle.\nB. Close the box.\nC. Put down the blanket.\nD. Take the pillow.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Put down the blanket.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "C" + }, + { + "sample_id": 156, + "question": "Using the given pictures as a reference, anticipate the person's upcoming action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Eat the sandwich.\nB. Close the refrigerator.\nC. Take the bag.\nD. Sit on the sofa/couch.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Take the bag.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "C" + }, + { + "sample_id": 159, + "question": "Evaluate the given images and infer the individual's next step. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the cup/glass/bottle.\nB. Put down the bag.\nC. Put down the cup/glass/bottle.\nD. Take the clothes.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Put down the bag.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "B" + }, + { + "sample_id": 162, + "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next with the floor?\nChoice list: \nA. Take.\nB. Sit on.\nC. Lie on.\nD. Close.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Sit on.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "B" + }, + { + "sample_id": 166, + "question": "With the given visuals as your guide, infer the individual's impending action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Tidy up the table.\nB. Take the sandwich.\nC. Throw the blanket.\nD. Open the bag.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Throw the blanket.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "C" + }, + { + "sample_id": 172, + "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the food.\nB. Take the paper/notebook.\nC. Lie on the bed.\nD. Sit on the sofa/couch.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Take the paper/notebook.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "B" + }, + { + "sample_id": 175, + "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the paper/notebook.\nB. Take the cup/glass/bottle.\nC. Eat the sandwich.\nD. Open the window.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Take the paper/notebook.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "A" + }, + { + "sample_id": 178, + "question": "Analyze the provided visuals and forecast the individual's subsequent move. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the box.\nB. Open the window.\nC. Open the refrigerator.\nD. Sit at the table.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Sit at the table.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "A" + }, + { + "sample_id": 181, + "question": "Infer the next action of the person from the presented images. You must choose your answer from the Choice List.\nWhat will the person do next with the blanket?\nChoice list: \nA. Sit at.\nB. Throw.\nC. Tidy up.\nD. Put down.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Put down.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "D" + }, + { + "sample_id": 184, + "question": "Infer the next action of the person from the presented images. You must choose your answer from the Choice List.\nWhat will the person do next with the clothes?\nChoice list: \nA. Put down.\nB. Take.\nC. Throw.\nD. Wash.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Put down.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "A" + }, + { + "sample_id": 188, + "question": "Based on the given images, prediction the person's next action You must choose your answer from the Choice List.\nWhat will the person do next with the floor?\nChoice list: \nA. Put down.\nB. Lie on.\nC. Sit on.\nD. Eat.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Sit on.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "C" + }, + { + "sample_id": 193, + "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the paper/notebook.\nB. Wash the mirror.\nC. Take the bag.\nD. Open the closet/cabinet.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Take the paper/notebook.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "A" + }, + { + "sample_id": 189, + "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next with the blanket?\nChoice list: \nA. Throw.\nB. Hold.\nC. Tidy up.\nD. Put down.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Put down.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "D" + }, + { + "sample_id": 196, + "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the pillow.\nB. Lie on the floor.\nC. Put down the broom.\nD. Take the phone/camera.\nAnswer with the option's letter from the given choices directly.", + "gt_response": "Put down the broom.", + "gen_kwargs": { + "do_sample": false, + "num_beams": 1, + "max_new_tokens": 32, + "eos_token_id": 92542 + }, + "pred_response": "C" + } +] \ No newline at end of file