diff --git "a/eval_milebench/ActionPrediction/ActionPrediction_240803234615.json" "b/eval_milebench/ActionPrediction/ActionPrediction_240803234615.json" new file mode 100644--- /dev/null +++ "b/eval_milebench/ActionPrediction/ActionPrediction_240803234615.json" @@ -0,0 +1 @@ +[{"sample_id": 0, "question": "Infer the next action of the person from the presented images. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the pillow.\nB. Open the door.\nC. Take the book.\nD. Open the closet/cabinet.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Put down the pillow.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "A"}, {"sample_id": 56, "question": "Infer the next action of the person from the presented images. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Tidy up the clothes.\nB. Eat the sandwich.\nC. Put down the phone/camera.\nD. Throw the pillow.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Throw the pillow.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "D"}, {"sample_id": 1, "question": "Analyze the provided visuals and forecast the individual's subsequent move. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Sit on the floor.\nB. Put down the cup/glass/bottle.\nC. Take the book.\nD. Open the book.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Open the book.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "D"}, {"sample_id": 16, "question": "Evaluate the given images and infer the individual's next step. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the towel.\nB. Close the laptop.\nC. Close the door.\nD. Hold the book.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Close the laptop.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "C"}, {"sample_id": 33, "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the door.\nB. Take the laptop.\nC. Take the cup/glass/bottle.\nD. Throw the food.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Take the laptop.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "B"}, {"sample_id": 2, "question": "Analyze the provided visuals and forecast the individual's subsequent move. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the cup/glass/bottle.\nB. Take the book.\nC. Eat the sandwich.\nD. Put down the dish.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Take the book.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "B"}, {"sample_id": 23, "question": "Based on the given images, prediction the person's next action You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the laptop.\nB. Lie on the sofa/couch.\nC. Close the box.\nD. Take the phone/camera.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Open the laptop.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "A"}, {"sample_id": 25, "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Close the box.\nB. Put down the food.\nC. Take the paper/notebook.\nD. Open the bag.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Open the bag.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "D"}, {"sample_id": 28, "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next with the dish?\nChoice list: \nA. Wash.\nB. Put down.\nC. Hold.\nD. Take.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Put down.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "B"}, {"sample_id": 3, "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Tidy up the broom.\nB. Put down the clothes.\nC. Put down the food.\nD. Throw the blanket.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Throw the blanket.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "D"}, {"sample_id": 18, "question": "Based on the given images, prediction the person's next action You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the door.\nB. Sit at the table.\nC. Take the food.\nD. Take the dish.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Sit at the table.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "C"}, {"sample_id": 37, "question": "Infer the next action of the person from the presented images. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the food.\nB. Close the door.\nC. Close the window.\nD. Open the window.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Close the window.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "C"}, {"sample_id": 42, "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the dish.\nB. Take the food.\nC. Throw the pillow.\nD. Eat the medicine.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Throw the pillow.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "C"}, {"sample_id": 4, "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Tidy up the table.\nB. Open the box.\nC. Tidy up the closet/cabinet.\nD. Hold the dish.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Tidy up the closet/cabinet.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "C"}, {"sample_id": 14, "question": "With the given visuals as your guide, infer the individual's impending action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Eat the sandwich.\nB. Take the phone/camera.\nC. Take the blanket.\nD. Eat the medicine.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Take the blanket.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "C"}, {"sample_id": 21, "question": "Infer the next action of the person from the presented images. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Hold the laptop.\nB. Sit on the sofa/couch.\nC. Take the shoe.\nD. Take the phone/camera.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Take the shoe.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "C"}, {"sample_id": 38, "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Throw the bag.\nB. Put down the towel.\nC. Eat the sandwich.\nD. Sit at the table.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Throw the bag.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "A"}, {"sample_id": 50, "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the picture.\nB. Put down the phone/camera.\nC. Hold the box.\nD. Take the blanket.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Take the picture.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "A"}, {"sample_id": 57, "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Eat the medicine.\nB. Put down the towel.\nC. Put down the paper/notebook.\nD. Open the refrigerator.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Eat the medicine.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "A"}, {"sample_id": 75, "question": "Infer the next action of the person from the presented images. You must choose your answer from the Choice List.\nWhat will the person do next with the shoe?\nChoice list: \nA. Sit on.\nB. Take.\nC. Throw.\nD. Put down.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Put down.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "B"}, {"sample_id": 5, "question": "With the given visuals as your guide, infer the individual's impending action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the shoe.\nB. Sit on the table.\nC. Take the paper/notebook.\nD. Throw the clothes.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Take the paper/notebook.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "C"}, {"sample_id": 43, "question": "With the given visuals as your guide, infer the individual's impending action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the picture.\nB. Sit on the sofa/couch.\nC. Throw the clothes.\nD. Put down the cup/glass/bottle.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Put down the cup/glass/bottle.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "D"}, {"sample_id": 60, "question": "Infer the next action of the person from the presented images. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the box.\nB. Put down the broom.\nC. Put down the towel.\nD. Take the clothes.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Put down the towel.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "C"}, {"sample_id": 6, "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next with the sofa/couch?\nChoice list: \nA. Take.\nB. Sit on.\nC. Tidy up.\nD. Lie on.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Lie on.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "B"}, {"sample_id": 29, "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Close the door.\nB. Take the picture.\nC. Lie on the sofa/couch.\nD. Open the door.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Lie on the sofa/couch.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "C"}, {"sample_id": 7, "question": "Study the provided images and predict the individual's forthcoming behavior. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the clothes.\nB. Put down the bag.\nC. Sit on the table.\nD. Take the book.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Take the clothes.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "A"}, {"sample_id": 8, "question": "Using the given pictures as a reference, anticipate the person's upcoming action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Throw the shoe.\nB. Put down the laptop.\nC. Put down the dish.\nD. Open the bag.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Put down the laptop.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "B"}, {"sample_id": 47, "question": "Evaluate the given images and infer the individual's next step. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the picture.\nB. Take the book.\nC. Put down the blanket.\nD. Sit on the floor.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Put down the blanket.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "C"}, {"sample_id": 9, "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Close the closet/cabinet.\nB. Tidy up the broom.\nC. Throw the pillow.\nD. Take the bag.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Take the bag.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "D"}, {"sample_id": 10, "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the bag.\nB. Take the food.\nC. Take the phone/camera.\nD. Put down the shoe.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Put down the bag.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "A"}, {"sample_id": 11, "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the picture.\nB. Eat the medicine.\nC. Tidy up the table.\nD. Close the closet/cabinet.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Take the picture.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "A"}, {"sample_id": 12, "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the broom.\nB. Open the bag.\nC. Take the cup/glass/bottle.\nD. Put down the paper/notebook.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Put down the paper/notebook.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "D"}, {"sample_id": 13, "question": "Using the given pictures as a reference, anticipate the person's upcoming action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the bag.\nB. Wash the window.\nC. Tidy up the blanket.\nD. Sit on the sofa/couch.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Wash the window.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "A"}, {"sample_id": 15, "question": "Evaluate the given images and infer the individual's next step. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the shoe.\nB. Open the book.\nC. Take the shoe.\nD. Open the box.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Open the box.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "B"}, {"sample_id": 85, "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the book.\nB. Take the bag.\nC. Put down the paper/notebook.\nD. Open the laptop.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Open the laptop.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "B"}, {"sample_id": 17, "question": "Infer the next action of the person from the presented images. You must choose your answer from the Choice List.\nWhat will the person do next with the blanket?\nChoice list: \nA. Tidy up.\nB. Sit on.\nC. Put down.\nD. Take.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Put down.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "B"}, {"sample_id": 22, "question": "Based on the given images, prediction the person's next action You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Close the box.\nB. Put down the towel.\nC. Take the laptop.\nD. Close the closet/cabinet.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Put down the towel.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "B"}, {"sample_id": 24, "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the closet/cabinet.\nB. Put down the phone/camera.\nC. Open the book.\nD. Open the bag.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Put down the phone/camera.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "B"}, {"sample_id": 26, "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the closet/cabinet.\nB. Open the door.\nC. Close the closet/cabinet.\nD. Tidy up the clothes.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Close the closet/cabinet.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "B"}, {"sample_id": 31, "question": "Evaluate the given images and infer the individual's next step. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Close the window.\nB. Close the refrigerator.\nC. Sit on the sofa/couch.\nD. Open the closet/cabinet.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Sit on the sofa/couch.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "C"}, {"sample_id": 34, "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the cup/glass/bottle.\nB. Put down the broom.\nC. Open the bag.\nD. Lie on the sofa/couch.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Open the bag.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "C"}, {"sample_id": 35, "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Sit on the floor.\nB. Open the bag.\nC. Lie on the bed.\nD. Tidy up the table.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Sit on the floor.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "A"}, {"sample_id": 51, "question": "Evaluate the given images and infer the individual's next step. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Wash the window.\nB. Sit at the table.\nC. Throw the book.\nD. Throw the pillow.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Throw the book.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "D"}, {"sample_id": 58, "question": "With the given visuals as your guide, infer the individual's impending action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Throw the blanket.\nB. Take the phone/camera.\nC. Close the door.\nD. Open the closet/cabinet.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Take the phone/camera.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "B"}, {"sample_id": 65, "question": "Infer the next action of the person from the presented images. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the door.\nB. Take the shoe.\nC. Take the book.\nD. Eat the sandwich.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Eat the sandwich.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "D"}, {"sample_id": 67, "question": "Study the provided images and predict the individual's forthcoming behavior. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Wash the mirror.\nB. Close the box.\nC. Put down the towel.\nD. Open the door.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Put down the towel.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "C"}, {"sample_id": 68, "question": "Study the provided images and predict the individual's forthcoming behavior. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the closet/cabinet.\nB. Eat the medicine.\nC. Tidy up the table.\nD. Put down the shoe.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Put down the shoe.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "D"}, {"sample_id": 20, "question": "Study the provided images and predict the individual's forthcoming behavior. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Wash the table.\nB. Lie on the floor.\nC. Put down the towel.\nD. Take the box.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Wash the table.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "D"}, {"sample_id": 27, "question": "Evaluate the given images and infer the individual's next step. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Close the refrigerator.\nB. Open the refrigerator.\nC. Throw the clothes.\nD. Close the closet/cabinet.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Close the refrigerator.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "A"}, {"sample_id": 32, "question": "Evaluate the given images and infer the individual's next step. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Close the closet/cabinet.\nB. Put down the paper/notebook.\nC. Take the dish.\nD. Take the food.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Put down the paper/notebook.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "B"}, {"sample_id": 36, "question": "Based on the given images, prediction the person's next action You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Close the laptop.\nB. Open the book.\nC. Sit on the bed.\nD. Put down the paper/notebook.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Close the laptop.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "A"}, {"sample_id": 41, "question": "Using the given pictures as a reference, anticipate the person's upcoming action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Throw the blanket.\nB. Eat the medicine.\nC. Lie on the sofa/couch.\nD. Put down the box.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Throw the blanket.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "A"}, {"sample_id": 44, "question": "Using the given pictures as a reference, anticipate the person's upcoming action. You must choose your answer from the Choice List.\nWhat will the person do next with the blanket?\nChoice list: \nA. Put down.\nB. Take.\nC. Hold.\nD. Throw.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Put down.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "B"}, {"sample_id": 46, "question": "With the given visuals as your guide, infer the individual's impending action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the clothes.\nB. Tidy up the clothes.\nC. Take the bag.\nD. Lie on the sofa/couch.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Lie on the sofa/couch.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "D"}, {"sample_id": 49, "question": "Based on the given images, prediction the person's next action You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Lie on the sofa/couch.\nB. Close the box.\nC. Lie on the floor.\nD. Hold the book.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Lie on the sofa/couch.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "A"}, {"sample_id": 52, "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the pillow.\nB. Lie on the bed.\nC. Close the window.\nD. Wash the cup/glass/bottle.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Close the window.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "C"}, {"sample_id": 53, "question": "Study the provided images and predict the individual's forthcoming behavior. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Throw the towel.\nB. Eat the sandwich.\nC. Put down the broom.\nD. Open the book.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Throw the towel.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "A"}, {"sample_id": 59, "question": "With the given visuals as your guide, infer the individual's impending action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Wash the cup/glass/bottle.\nB. Take the bag.\nC. Throw the pillow.\nD. Take the food.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Take the bag.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "D"}, {"sample_id": 61, "question": "Study the provided images and predict the individual's forthcoming behavior. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Wash the table.\nB. Eat the medicine.\nC. Throw the shoe.\nD. Take the blanket.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Take the blanket.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "D"}, {"sample_id": 70, "question": "Infer the next action of the person from the presented images. You must choose your answer from the Choice List.\nWhat will the person do next with the cup/glass/bottle?\nChoice list: \nA. Put down.\nB. Wash.\nC. Close.\nD. Take.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Put down.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "A"}, {"sample_id": 141, "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the clothes.\nB. Wash the mirror.\nC. Take the bag.\nD. Put down the phone/camera.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Put down the phone/camera.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "D"}, {"sample_id": 82, "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Close the refrigerator.\nB. Take the book.\nC. Open the bag.\nD. Tidy up the blanket.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Close the refrigerator.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "A"}, {"sample_id": 89, "question": "Using the given pictures as a reference, anticipate the person's upcoming action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the bag.\nB. Throw the shoe.\nC. Put down the cup/glass/bottle.\nD. Put down the towel.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Put down the towel.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "D"}, {"sample_id": 98, "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Tidy up the towel.\nB. Hold the blanket.\nC. Eat the sandwich.\nD. Take the dish.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Eat the sandwich.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "C"}, {"sample_id": 111, "question": "Analyze the provided visuals and forecast the individual's subsequent move. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the clothes.\nB. Put down the picture.\nC. Tidy up the blanket.\nD. Open the bag.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Open the bag.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "D"}, {"sample_id": 133, "question": "Based on the given images, prediction the person's next action You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Close the refrigerator.\nB. Open the door.\nC. Tidy up the clothes.\nD. Take the book.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Close the refrigerator.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "A"}, {"sample_id": 134, "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Close the book.\nB. Take the pillow.\nC. Put down the picture.\nD. Close the box.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Take the pillow.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "B"}, {"sample_id": 138, "question": "Based on the given images, prediction the person's next action You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the laptop.\nB. Take the phone/camera.\nC. Take the clothes.\nD. Open the laptop.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Put down the laptop.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "B"}, {"sample_id": 150, "question": "Using the given pictures as a reference, anticipate the person's upcoming action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the closet/cabinet.\nB. Wash the clothes.\nC. Take the book.\nD. Open the book.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Take the book.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "C"}, {"sample_id": 158, "question": "Evaluate the given images and infer the individual's next step. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the box.\nB. Take the dish.\nC. Put down the sandwich.\nD. Sit on the sofa/couch.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Sit on the sofa/couch.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "D"}, {"sample_id": 164, "question": "Study the provided images and predict the individual's forthcoming behavior. You must choose your answer from the Choice List.\nWhat will the person do next with the bed?\nChoice list: \nA. Eat.\nB. Take.\nC. Lie on.\nD. Sit on.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Lie on.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "C"}, {"sample_id": 171, "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Eat the medicine.\nB. Put down the food.\nC. Close the book.\nD. Put down the book.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Close the book.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "D"}, {"sample_id": 174, "question": "With the given visuals as your guide, infer the individual's impending action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Lie on the floor.\nB. Close the refrigerator.\nC. Open the box.\nD. Take the book.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Close the refrigerator.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "B"}, {"sample_id": 194, "question": "Using the given pictures as a reference, anticipate the person's upcoming action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the dish.\nB. Eat the medicine.\nC. Put down the clothes.\nD. Take the paper/notebook.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Take the dish.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "C"}, {"sample_id": 62, "question": "With the given visuals as your guide, infer the individual's impending action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Eat the medicine.\nB. Take the box.\nC. Take the book.\nD. Take the dish.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Take the box.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "A"}, {"sample_id": 40, "question": "Study the provided images and predict the individual's forthcoming behavior. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Eat the medicine.\nB. Take the shoe.\nC. Take the clothes.\nD. Throw the food.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Take the shoe.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "B"}, {"sample_id": 64, "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the phone/camera.\nB. Close the book.\nC. Take the towel.\nD. Throw the food.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Take the towel.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "C"}, {"sample_id": 30, "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the bag.\nB. Put down the shoe.\nC. Wash the dish.\nD. Sit on the sofa/couch.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Put down the shoe.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "B"}, {"sample_id": 63, "question": "With the given visuals as your guide, infer the individual's impending action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the book.\nB. Take the sandwich.\nC. Open the closet/cabinet.\nD. Hold the food.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Put down the book.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "A"}, {"sample_id": 99, "question": "Infer the next action of the person from the presented images. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Close the laptop.\nB. Put down the book.\nC. Throw the clothes.\nD. Lie on the sofa/couch.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Close the laptop.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "A"}, {"sample_id": 45, "question": "Analyze the provided visuals and forecast the individual's subsequent move. You must choose your answer from the Choice List.\nWhat will the person do next with the blanket?\nChoice list: \nA. Put down.\nB. Tidy up.\nC. Hold.\nD. Take.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Tidy up.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "A"}, {"sample_id": 55, "question": "Based on the given images, prediction the person's next action You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the box.\nB. Throw the food.\nC. Tidy up the towel.\nD. Sit on the sofa/couch.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Take the box.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "A"}, {"sample_id": 81, "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the book.\nB. Sit on the table.\nC. Take the food.\nD. Put down the box.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Put down the box.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "A"}, {"sample_id": 94, "question": "Using the given pictures as a reference, anticipate the person's upcoming action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the sandwich.\nB. Open the bag.\nC. Take the towel.\nD. Take the food.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Open the bag.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "D"}, {"sample_id": 79, "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the towel.\nB. Open the laptop.\nC. Wash the clothes.\nD. Sit on the bed.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Sit on the bed.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "D"}, {"sample_id": 95, "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the pillow.\nB. Take the book.\nC. Open the book.\nD. Open the closet/cabinet.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Take the pillow.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "B"}, {"sample_id": 104, "question": "Evaluate the given images and infer the individual's next step. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Sit on the sofa/couch.\nB. Take the phone/camera.\nC. Put down the box.\nD. Tidy up the clothes.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Put down the box.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "C"}, {"sample_id": 106, "question": "Infer the next action of the person from the presented images. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the sandwich.\nB. Open the refrigerator.\nC. Put down the phone/camera.\nD. Wash the window.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Take the sandwich.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "C"}, {"sample_id": 108, "question": "Study the provided images and predict the individual's forthcoming behavior. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the shoe.\nB. Take the food.\nC. Close the door.\nD. Put down the cup/glass/bottle.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Take the food.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "B"}, {"sample_id": 116, "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the bag.\nB. Put down the phone/camera.\nC. Put down the food.\nD. Close the book.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Put down the phone/camera.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "B"}, {"sample_id": 122, "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Sit on the bed.\nB. Sit on the sofa/couch.\nC. Throw the blanket.\nD. Take the paper/notebook.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Take the paper/notebook.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "D"}, {"sample_id": 76, "question": "Study the provided images and predict the individual's forthcoming behavior. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the broom.\nB. Put down the blanket.\nC. Close the refrigerator.\nD. Put down the bag.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Close the refrigerator.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "C"}, {"sample_id": 84, "question": "Infer the next action of the person from the presented images. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the cup/glass/bottle.\nB. Open the closet/cabinet.\nC. Put down the paper/notebook.\nD. Put down the phone/camera.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Put down the paper/notebook.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "C"}, {"sample_id": 113, "question": "Using the given pictures as a reference, anticipate the person's upcoming action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Throw the book.\nB. Wash the table.\nC. Throw the pillow.\nD. Take the food.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Throw the pillow.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "C"}, {"sample_id": 127, "question": "Infer the next action of the person from the presented images. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the book.\nB. Take the clothes.\nC. Eat the medicine.\nD. Close the closet/cabinet.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Take the clothes.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "B"}, {"sample_id": 72, "question": "Analyze the provided visuals and forecast the individual's subsequent move. You must choose your answer from the Choice List.\nWhat will the person do next with the food?\nChoice list: \nA. Open.\nB. Put down.\nC. Throw.\nD. Take.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Put down.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "D"}, {"sample_id": 48, "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Close the window.\nB. Take the towel.\nC. Take the shoe.\nD. Take the food.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Close the window.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "C"}, {"sample_id": 73, "question": "Study the provided images and predict the individual's forthcoming behavior. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the pillow.\nB. Tidy up the clothes.\nC. Take the box.\nD. Put down the dish.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Take the box.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "B"}, {"sample_id": 120, "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next with the bed?\nChoice list: \nA. Put down.\nB. Throw.\nC. Sit on.\nD. Lie on.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Sit on.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "C"}, {"sample_id": 54, "question": "Using the given pictures as a reference, anticipate the person's upcoming action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the laptop.\nB. Put down the dish.\nC. Sit on the floor.\nD. Take the box.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Put down the laptop.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "A"}, {"sample_id": 135, "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the blanket.\nB. Take the blanket.\nC. Wash the clothes.\nD. Put down the sandwich.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Put down the sandwich.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "D"}, {"sample_id": 19, "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Wash the window.\nB. Throw the clothes.\nC. Open the box.\nD. Put down the book.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Open the box.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "C"}, {"sample_id": 121, "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the dish.\nB. Take the clothes.\nC. Lie on the sofa/couch.\nD. Put down the pillow.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Take the clothes.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "A"}, {"sample_id": 74, "question": "Analyze the provided visuals and forecast the individual's subsequent move. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Eat the sandwich.\nB. Take the box.\nC. Put down the blanket.\nD. Put down the bag.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Put down the blanket.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "C"}, {"sample_id": 77, "question": "With the given visuals as your guide, infer the individual's impending action. You must choose your answer from the Choice List.\nWhat will the person do next with the table?\nChoice list: \nA. Take.\nB. Tidy up.\nC. Sit at.\nD. Wash.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Sit at.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "C"}, {"sample_id": 80, "question": "Analyze the provided visuals and forecast the individual's subsequent move. You must choose your answer from the Choice List.\nWhat will the person do next with the sofa/couch?\nChoice list: \nA. Put down.\nB. Lie on.\nC. Throw.\nD. Sit on.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Sit on.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "D"}, {"sample_id": 83, "question": "Based on the given images, prediction the person's next action You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the book.\nB. Open the closet/cabinet.\nC. Take the sandwich.\nD. Take the food.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Open the book.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "A"}, {"sample_id": 88, "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the shoe.\nB. Lie on the floor.\nC. Close the box.\nD. Tidy up the blanket.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Tidy up the blanket.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "A"}, {"sample_id": 90, "question": "Analyze the provided visuals and forecast the individual's subsequent move. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Tidy up the clothes.\nB. Take the pillow.\nC. Take the laptop.\nD. Take the box.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Take the laptop.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "B"}, {"sample_id": 91, "question": "With the given visuals as your guide, infer the individual's impending action. You must choose your answer from the Choice List.\nWhat will the person do next with the cup/glass/bottle?\nChoice list: \nA. Take.\nB. Eat.\nC. Put down.\nD. Wash.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Put down.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "A"}, {"sample_id": 93, "question": "Analyze the provided visuals and forecast the individual's subsequent move. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the phone/camera.\nB. Open the bag.\nC. Put down the blanket.\nD. Throw the food.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Put down the blanket.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "B"}, {"sample_id": 97, "question": "Infer the next action of the person from the presented images. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the sandwich.\nB. Put down the blanket.\nC. Take the cup/glass/bottle.\nD. Eat the sandwich.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Take the sandwich.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "D"}, {"sample_id": 100, "question": "Based on the given images, prediction the person's next action You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the book.\nB. Close the closet/cabinet.\nC. Put down the bag.\nD. Put down the paper/notebook.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Open the book.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "A"}, {"sample_id": 103, "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the box.\nB. Tidy up the blanket.\nC. Close the laptop.\nD. Put down the paper/notebook.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Close the laptop.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "C"}, {"sample_id": 107, "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Tidy up the blanket.\nB. Open the refrigerator.\nC. Open the closet/cabinet.\nD. Throw the box.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Open the refrigerator.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "B"}, {"sample_id": 39, "question": "Using the given pictures as a reference, anticipate the person's upcoming action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the cup/glass/bottle.\nB. Tidy up the blanket.\nC. Take the pillow.\nD. Put down the dish.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Take the pillow.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "C"}, {"sample_id": 180, "question": "Evaluate the given images and infer the individual's next step. You must choose your answer from the Choice List.\nWhat will the person do next with the cup/glass/bottle?\nChoice list: \nA. Take.\nB. Put down.\nC. Wash.\nD. Lie on.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Put down.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "A"}, {"sample_id": 71, "question": "Infer the next action of the person from the presented images. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the clothes.\nB. Lie on the floor.\nC. Sit on the table.\nD. Put down the towel.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Put down the towel.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "D"}, {"sample_id": 145, "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Throw the clothes.\nB. Close the window.\nC. Put down the food.\nD. Wash the clothes.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Throw the clothes.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "A"}, {"sample_id": 117, "question": "Study the provided images and predict the individual's forthcoming behavior. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the cup/glass/bottle.\nB. Wash the mirror.\nC. Open the box.\nD. Open the door.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Open the door.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "D"}, {"sample_id": 195, "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Throw the book.\nB. Take the towel.\nC. Close the door.\nD. Put down the book.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Put down the book.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "D"}, {"sample_id": 149, "question": "Infer the next action of the person from the presented images. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the sandwich.\nB. Take the dish.\nC. Wash the dish.\nD. Close the laptop.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Put down the sandwich.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "B"}, {"sample_id": 163, "question": "Based on the given images, prediction the person's next action You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Throw the food.\nB. Take the box.\nC. Put down the broom.\nD. Close the closet/cabinet.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Put down the broom.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "C"}, {"sample_id": 137, "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next with the food?\nChoice list: \nA. Hold.\nB. Throw.\nC. Take.\nD. Put down.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Put down.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "C"}, {"sample_id": 185, "question": "With the given visuals as your guide, infer the individual's impending action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the clothes.\nB. Put down the clothes.\nC. Put down the broom.\nD. Put down the picture.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Put down the broom.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "C"}, {"sample_id": 129, "question": "Study the provided images and predict the individual's forthcoming behavior. You must choose your answer from the Choice List.\nWhat will the person do next with the food?\nChoice list: \nA. Put down.\nB. Hold.\nC. Take.\nD. Throw.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Put down.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "C"}, {"sample_id": 69, "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the clothes.\nB. Take the dish.\nC. Hold the picture.\nD. Take the bag.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Take the bag.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "D"}, {"sample_id": 87, "question": "Evaluate the given images and infer the individual's next step. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Sit at the table.\nB. Close the window.\nC. Take the cup/glass/bottle.\nD. Eat the sandwich.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Eat the sandwich.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "D"}, {"sample_id": 131, "question": "Based on the given images, prediction the person's next action You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the food.\nB. Take the blanket.\nC. Eat the medicine.\nD. Open the refrigerator.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Take the blanket.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "A"}, {"sample_id": 132, "question": "Based on the given images, prediction the person's next action You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Wash the cup/glass/bottle.\nB. Put down the laptop.\nC. Put down the cup/glass/bottle.\nD. Put down the shoe.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Put down the shoe.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "D"}, {"sample_id": 155, "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the shoe.\nB. Take the book.\nC. Sit on the table.\nD. Take the box.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Take the shoe.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "A"}, {"sample_id": 101, "question": "Using the given pictures as a reference, anticipate the person's upcoming action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the door.\nB. Open the refrigerator.\nC. Tidy up the towel.\nD. Lie on the bed.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Open the refrigerator.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "B"}, {"sample_id": 102, "question": "Study the provided images and predict the individual's forthcoming behavior. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the cup/glass/bottle.\nB. Close the box.\nC. Put down the cup/glass/bottle.\nD. Open the laptop.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Open the laptop.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "D"}, {"sample_id": 112, "question": "Evaluate the given images and infer the individual's next step. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Lie on the bed.\nB. Put down the dish.\nC. Throw the clothes.\nD. Sit on the table.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Throw the clothes.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "C"}, {"sample_id": 118, "question": "Study the provided images and predict the individual's forthcoming behavior. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the book.\nB. Eat the sandwich.\nC. Open the door.\nD. Throw the blanket.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Take the book.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "A"}, {"sample_id": 126, "question": "Analyze the provided visuals and forecast the individual's subsequent move. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Close the book.\nB. Put down the pillow.\nC. Open the bag.\nD. Tidy up the clothes.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Put down the pillow.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "D"}, {"sample_id": 128, "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next with the food?\nChoice list: \nA. Hold.\nB. Put down.\nC. Take.\nD. Throw.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Put down.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "C"}, {"sample_id": 130, "question": "Using the given pictures as a reference, anticipate the person's upcoming action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Tidy up the closet/cabinet.\nB. Take the food.\nC. Close the refrigerator.\nD. Close the laptop.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Close the refrigerator.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "C"}, {"sample_id": 148, "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the box.\nB. Tidy up the clothes.\nC. Take the phone/camera.\nD. Open the bag.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Tidy up the clothes.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "D"}, {"sample_id": 152, "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Lie on the floor.\nB. Put down the shoe.\nC. Take the paper/notebook.\nD. Take the book.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Put down the shoe.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "B"}, {"sample_id": 153, "question": "Study the provided images and predict the individual's forthcoming behavior. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the clothes.\nB. Take the food.\nC. Close the book.\nD. Throw the box.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Close the book.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "C"}, {"sample_id": 86, "question": "Study the provided images and predict the individual's forthcoming behavior. You must choose your answer from the Choice List.\nWhat will the person do next with the table?\nChoice list: \nA. Close.\nB. Sit at.\nC. Tidy up.\nD. Wash.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Sit at.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "B"}, {"sample_id": 96, "question": "Analyze the provided visuals and forecast the individual's subsequent move. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the book.\nB. Eat the sandwich.\nC. Lie on the bed.\nD. Take the box.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Eat the sandwich.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "B"}, {"sample_id": 146, "question": "Evaluate the given images and infer the individual's next step. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the laptop.\nB. Put down the paper/notebook.\nC. Put down the picture.\nD. Hold the blanket.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Put down the picture.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "C"}, {"sample_id": 78, "question": "Analyze the provided visuals and forecast the individual's subsequent move. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Close the box.\nB. Take the phone/camera.\nC. Put down the book.\nD. Throw the clothes.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Close the box.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "A"}, {"sample_id": 144, "question": "With the given visuals as your guide, infer the individual's impending action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Lie on the sofa/couch.\nB. Open the door.\nC. Sit on the bed.\nD. Close the laptop.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Sit on the bed.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "C"}, {"sample_id": 151, "question": "Based on the given images, prediction the person's next action You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Lie on the sofa/couch.\nB. Put down the bag.\nC. Take the shoe.\nD. Take the towel.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Take the shoe.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "C"}, {"sample_id": 161, "question": "Based on the given images, prediction the person's next action You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the phone/camera.\nB. Take the clothes.\nC. Sit on the sofa/couch.\nD. Take the box.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Take the clothes.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "B"}, {"sample_id": 66, "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the cup/glass/bottle.\nB. Eat the sandwich.\nC. Lie on the floor.\nD. Open the closet/cabinet.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Open the closet/cabinet.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "D"}, {"sample_id": 140, "question": "Analyze the provided visuals and forecast the individual's subsequent move. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Close the door.\nB. Close the closet/cabinet.\nC. Tidy up the table.\nD. Take the dish.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Take the dish.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "D"}, {"sample_id": 109, "question": "Evaluate the given images and infer the individual's next step. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the box.\nB. Sit at the table.\nC. Take the sandwich.\nD. Lie on the sofa/couch.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Open the box.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "A"}, {"sample_id": 110, "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Throw the book.\nB. Throw the clothes.\nC. Wash the table.\nD. Open the door.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Throw the clothes.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "A"}, {"sample_id": 114, "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the bag.\nB. Hold the box.\nC. Throw the blanket.\nD. Sit on the sofa/couch.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Throw the blanket.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "C"}, {"sample_id": 119, "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the shoe.\nB. Throw the clothes.\nC. Open the book.\nD. Throw the bag.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Put down the shoe.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "A"}, {"sample_id": 123, "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Wash the dish.\nB. Open the closet/cabinet.\nC. Take the food.\nD. Throw the towel.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Throw the towel.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "B"}, {"sample_id": 124, "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next with the pillow?\nChoice list: \nA. Tidy up.\nB. Throw.\nC. Put down.\nD. Take.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Put down.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "D"}, {"sample_id": 125, "question": "Analyze the provided visuals and forecast the individual's subsequent move. You must choose your answer from the Choice List.\nWhat will the person do next with the blanket?\nChoice list: \nA. Put down.\nB. Throw.\nC. Lie on.\nD. Tidy up.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Tidy up.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "A"}, {"sample_id": 136, "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the door.\nB. Sit at the table.\nC. Lie on the sofa/couch.\nD. Throw the food.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Sit at the table.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "D"}, {"sample_id": 142, "question": "Analyze the provided visuals and forecast the individual's subsequent move. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the window.\nB. Open the book.\nC. Wash the mirror.\nD. Close the door.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Wash the mirror.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "C"}, {"sample_id": 143, "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the box.\nB. Take the book.\nC. Tidy up the broom.\nD. Put down the bag.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Put down the bag.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "D"}, {"sample_id": 154, "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Throw the box.\nB. Take the bag.\nC. Lie on the bed.\nD. Sit on the floor.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Lie on the bed.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "A"}, {"sample_id": 182, "question": "Based on the given images, prediction the person's next action You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the paper/notebook.\nB. Hold the phone/camera.\nC. Throw the blanket.\nD. Close the window.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Close the window.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "D"}, {"sample_id": 139, "question": "Study the provided images and predict the individual's forthcoming behavior. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the bag.\nB. Throw the bag.\nC. Open the door.\nD. Put down the pillow.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Put down the pillow.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "D"}, {"sample_id": 179, "question": "Using the given pictures as a reference, anticipate the person's upcoming action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the bag.\nB. Take the shoe.\nC. Put down the phone/camera.\nD. Throw the towel.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Put down the phone/camera.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "C"}, {"sample_id": 186, "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the box.\nB. Sit on the table.\nC. Close the refrigerator.\nD. Wash the cup/glass/bottle.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Open the box.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "A"}, {"sample_id": 160, "question": "Study the provided images and predict the individual's forthcoming behavior. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the food.\nB. Throw the blanket.\nC. Open the door.\nD. Tidy up the closet/cabinet.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Put down the food.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "A"}, {"sample_id": 92, "question": "Based on the given images, prediction the person's next action You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the phone/camera.\nB. Put down the bag.\nC. Throw the clothes.\nD. Open the closet/cabinet.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Throw the clothes.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "C"}, {"sample_id": 199, "question": "Evaluate the given images and infer the individual's next step. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Tidy up the clothes.\nB. Take the blanket.\nC. Open the door.\nD. Sit on the bed.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Tidy up the clothes.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "C"}, {"sample_id": 157, "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Wash the clothes.\nB. Put down the cup/glass/bottle.\nC. Take the food.\nD. Take the book.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Take the book.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "D"}, {"sample_id": 183, "question": "Evaluate the given images and infer the individual's next step. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Wash the window.\nB. Take the laptop.\nC. Close the box.\nD. Eat the medicine.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Take the laptop.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "D"}, {"sample_id": 191, "question": "Study the provided images and predict the individual's forthcoming behavior. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Wash the cup/glass/bottle.\nB. Put down the sandwich.\nC. Put down the shoe.\nD. Throw the book.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Throw the book.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "D"}, {"sample_id": 147, "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the box.\nB. Open the bag.\nC. Close the door.\nD. Throw the towel.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Open the bag.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "B"}, {"sample_id": 167, "question": "Using the given pictures as a reference, anticipate the person's upcoming action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the phone/camera.\nB. Close the door.\nC. Close the refrigerator.\nD. Throw the bag.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Take the phone/camera.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "A"}, {"sample_id": 187, "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the towel.\nB. Open the door.\nC. Put down the dish.\nD. Throw the broom.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Put down the towel.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "A"}, {"sample_id": 168, "question": "Evaluate the given images and infer the individual's next step. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the door.\nB. Close the door.\nC. Sit on the table.\nD. Put down the sandwich.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Put down the sandwich.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "D"}, {"sample_id": 170, "question": "Study the provided images and predict the individual's forthcoming behavior. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the phone/camera.\nB. Throw the bag.\nC. Put down the food.\nD. Open the laptop.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Open the laptop.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "D"}, {"sample_id": 173, "question": "Based on the given images, prediction the person's next action You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Close the laptop.\nB. Sit on the table.\nC. Throw the clothes.\nD. Take the dish.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Throw the clothes.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "C"}, {"sample_id": 176, "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Lie on the sofa/couch.\nB. Throw the clothes.\nC. Take the clothes.\nD. Close the closet/cabinet.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Take the clothes.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "C"}, {"sample_id": 177, "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Wash the mirror.\nB. Close the box.\nC. Throw the clothes.\nD. Take the sandwich.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Take the sandwich.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "D"}, {"sample_id": 190, "question": "With the given visuals as your guide, infer the individual's impending action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the book.\nB. Put down the cup/glass/bottle.\nC. Open the door.\nD. Close the door.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Put down the book.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "A"}, {"sample_id": 115, "question": "Using the given pictures as a reference, anticipate the person's upcoming action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the sandwich.\nB. Put down the book.\nC. Lie on the floor.\nD. Take the dish.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Put down the sandwich.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "B"}, {"sample_id": 169, "question": "Infer the next action of the person from the presented images. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the window.\nB. Take the food.\nC. Put down the clothes.\nD. Open the book.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Put down the clothes.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "C"}, {"sample_id": 192, "question": "Analyze the provided visuals and forecast the individual's subsequent move. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the box.\nB. Take the bag.\nC. Wash the table.\nD. Put down the dish.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Take the bag.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "B"}, {"sample_id": 105, "question": "Using the given pictures as a reference, anticipate the person's upcoming action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the dish.\nB. Take the book.\nC. Eat the sandwich.\nD. Throw the box.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Take the book.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "B"}, {"sample_id": 165, "question": "Evaluate the given images and infer the individual's next step. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Throw the bag.\nB. Take the book.\nC. Put down the phone/camera.\nD. Open the refrigerator.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Open the refrigerator.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "D"}, {"sample_id": 198, "question": "Using the given pictures as a reference, anticipate the person's upcoming action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the clothes.\nB. Close the door.\nC. Tidy up the table.\nD. Wash the clothes.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Take the clothes.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "A"}, {"sample_id": 197, "question": "Evaluate the given images and infer the individual's next step. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the cup/glass/bottle.\nB. Close the box.\nC. Put down the blanket.\nD. Take the pillow.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Put down the blanket.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "C"}, {"sample_id": 156, "question": "Using the given pictures as a reference, anticipate the person's upcoming action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Eat the sandwich.\nB. Close the refrigerator.\nC. Take the bag.\nD. Sit on the sofa/couch.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Take the bag.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "C"}, {"sample_id": 159, "question": "Evaluate the given images and infer the individual's next step. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the cup/glass/bottle.\nB. Put down the bag.\nC. Put down the cup/glass/bottle.\nD. Take the clothes.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Put down the bag.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "B"}, {"sample_id": 162, "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next with the floor?\nChoice list: \nA. Take.\nB. Sit on.\nC. Lie on.\nD. Close.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Sit on.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "B"}, {"sample_id": 166, "question": "With the given visuals as your guide, infer the individual's impending action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Tidy up the table.\nB. Take the sandwich.\nC. Throw the blanket.\nD. Open the bag.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Throw the blanket.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "C"}, {"sample_id": 172, "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the food.\nB. Take the paper/notebook.\nC. Lie on the bed.\nD. Sit on the sofa/couch.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Take the paper/notebook.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "B"}, {"sample_id": 175, "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the paper/notebook.\nB. Take the cup/glass/bottle.\nC. Eat the sandwich.\nD. Open the window.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Take the paper/notebook.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "A"}, {"sample_id": 178, "question": "Analyze the provided visuals and forecast the individual's subsequent move. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the box.\nB. Open the window.\nC. Open the refrigerator.\nD. Sit at the table.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Sit at the table.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "A"}, {"sample_id": 181, "question": "Infer the next action of the person from the presented images. You must choose your answer from the Choice List.\nWhat will the person do next with the blanket?\nChoice list: \nA. Sit at.\nB. Throw.\nC. Tidy up.\nD. Put down.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Put down.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "D"}, {"sample_id": 184, "question": "Infer the next action of the person from the presented images. You must choose your answer from the Choice List.\nWhat will the person do next with the clothes?\nChoice list: \nA. Put down.\nB. Take.\nC. Throw.\nD. Wash.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Put down.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "A"}, {"sample_id": 188, "question": "Based on the given images, prediction the person's next action You must choose your answer from the Choice List.\nWhat will the person do next with the floor?\nChoice list: \nA. Put down.\nB. Lie on.\nC. Sit on.\nD. Eat.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Sit on.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "C"}, {"sample_id": 193, "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the paper/notebook.\nB. Wash the mirror.\nC. Take the bag.\nD. Open the closet/cabinet.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Take the paper/notebook.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "A"}, {"sample_id": 189, "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next with the blanket?\nChoice list: \nA. Throw.\nB. Hold.\nC. Tidy up.\nD. Put down.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Put down.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "D"}, {"sample_id": 196, "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the pillow.\nB. Lie on the floor.\nC. Put down the broom.\nD. Take the phone/camera.\nAnswer with the option's letter from the given choices directly.", "gt_response": "Put down the broom.", "gen_kwargs": {"do_sample": false, "num_beams": 1, "max_new_tokens": 32, "eos_token_id": 92542}, "pred_response": "C"}] \ No newline at end of file