diff --git "a/eval_milebench/ActionPrediction/pred.json" "b/eval_milebench/ActionPrediction/pred.json" deleted file mode 100644--- "a/eval_milebench/ActionPrediction/pred.json" +++ /dev/null @@ -1,2402 +0,0 @@ -[ - { - "sample_id": 0, - "question": "Infer the next action of the person from the presented images. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the pillow.\nB. Open the door.\nC. Take the book.\nD. Open the closet/cabinet.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Put down the pillow.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "A" - }, - { - "sample_id": 56, - "question": "Infer the next action of the person from the presented images. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Tidy up the clothes.\nB. Eat the sandwich.\nC. Put down the phone/camera.\nD. Throw the pillow.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Throw the pillow.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "D" - }, - { - "sample_id": 1, - "question": "Analyze the provided visuals and forecast the individual's subsequent move. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Sit on the floor.\nB. Put down the cup/glass/bottle.\nC. Take the book.\nD. Open the book.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Open the book.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "D" - }, - { - "sample_id": 16, - "question": "Evaluate the given images and infer the individual's next step. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the towel.\nB. Close the laptop.\nC. Close the door.\nD. Hold the book.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Close the laptop.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "C" - }, - { - "sample_id": 33, - "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the door.\nB. Take the laptop.\nC. Take the cup/glass/bottle.\nD. Throw the food.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Take the laptop.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "B" - }, - { - "sample_id": 2, - "question": "Analyze the provided visuals and forecast the individual's subsequent move. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the cup/glass/bottle.\nB. Take the book.\nC. Eat the sandwich.\nD. Put down the dish.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Take the book.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "B" - }, - { - "sample_id": 23, - "question": "Based on the given images, prediction the person's next action You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the laptop.\nB. Lie on the sofa/couch.\nC. Close the box.\nD. Take the phone/camera.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Open the laptop.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "A" - }, - { - "sample_id": 25, - "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Close the box.\nB. Put down the food.\nC. Take the paper/notebook.\nD. Open the bag.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Open the bag.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "D" - }, - { - "sample_id": 28, - "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next with the dish?\nChoice list: \nA. Wash.\nB. Put down.\nC. Hold.\nD. Take.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Put down.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "B" - }, - { - "sample_id": 3, - "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Tidy up the broom.\nB. Put down the clothes.\nC. Put down the food.\nD. Throw the blanket.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Throw the blanket.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "D" - }, - { - "sample_id": 18, - "question": "Based on the given images, prediction the person's next action You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the door.\nB. Sit at the table.\nC. Take the food.\nD. Take the dish.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Sit at the table.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "C" - }, - { - "sample_id": 37, - "question": "Infer the next action of the person from the presented images. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the food.\nB. Close the door.\nC. Close the window.\nD. Open the window.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Close the window.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "C" - }, - { - "sample_id": 42, - "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the dish.\nB. Take the food.\nC. Throw the pillow.\nD. Eat the medicine.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Throw the pillow.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "C" - }, - { - "sample_id": 4, - "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Tidy up the table.\nB. Open the box.\nC. Tidy up the closet/cabinet.\nD. Hold the dish.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Tidy up the closet/cabinet.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "C" - }, - { - "sample_id": 14, - "question": "With the given visuals as your guide, infer the individual's impending action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Eat the sandwich.\nB. Take the phone/camera.\nC. Take the blanket.\nD. Eat the medicine.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Take the blanket.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "C" - }, - { - "sample_id": 21, - "question": "Infer the next action of the person from the presented images. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Hold the laptop.\nB. Sit on the sofa/couch.\nC. Take the shoe.\nD. Take the phone/camera.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Take the shoe.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "C" - }, - { - "sample_id": 38, - "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Throw the bag.\nB. Put down the towel.\nC. Eat the sandwich.\nD. Sit at the table.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Throw the bag.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "A" - }, - { - "sample_id": 50, - "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the picture.\nB. Put down the phone/camera.\nC. Hold the box.\nD. Take the blanket.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Take the picture.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "A" - }, - { - "sample_id": 57, - "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Eat the medicine.\nB. Put down the towel.\nC. Put down the paper/notebook.\nD. Open the refrigerator.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Eat the medicine.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "A" - }, - { - "sample_id": 75, - "question": "Infer the next action of the person from the presented images. You must choose your answer from the Choice List.\nWhat will the person do next with the shoe?\nChoice list: \nA. Sit on.\nB. Take.\nC. Throw.\nD. Put down.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Put down.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "B" - }, - { - "sample_id": 5, - "question": "With the given visuals as your guide, infer the individual's impending action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the shoe.\nB. Sit on the table.\nC. Take the paper/notebook.\nD. Throw the clothes.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Take the paper/notebook.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "C" - }, - { - "sample_id": 43, - "question": "With the given visuals as your guide, infer the individual's impending action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the picture.\nB. Sit on the sofa/couch.\nC. Throw the clothes.\nD. Put down the cup/glass/bottle.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Put down the cup/glass/bottle.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "D" - }, - { - "sample_id": 60, - "question": "Infer the next action of the person from the presented images. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the box.\nB. Put down the broom.\nC. Put down the towel.\nD. Take the clothes.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Put down the towel.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "C" - }, - { - "sample_id": 6, - "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next with the sofa/couch?\nChoice list: \nA. Take.\nB. Sit on.\nC. Tidy up.\nD. Lie on.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Lie on.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "B" - }, - { - "sample_id": 29, - "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Close the door.\nB. Take the picture.\nC. Lie on the sofa/couch.\nD. Open the door.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Lie on the sofa/couch.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "C" - }, - { - "sample_id": 7, - "question": "Study the provided images and predict the individual's forthcoming behavior. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the clothes.\nB. Put down the bag.\nC. Sit on the table.\nD. Take the book.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Take the clothes.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "A" - }, - { - "sample_id": 8, - "question": "Using the given pictures as a reference, anticipate the person's upcoming action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Throw the shoe.\nB. Put down the laptop.\nC. Put down the dish.\nD. Open the bag.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Put down the laptop.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "B" - }, - { - "sample_id": 47, - "question": "Evaluate the given images and infer the individual's next step. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the picture.\nB. Take the book.\nC. Put down the blanket.\nD. Sit on the floor.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Put down the blanket.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "C" - }, - { - "sample_id": 9, - "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Close the closet/cabinet.\nB. Tidy up the broom.\nC. Throw the pillow.\nD. Take the bag.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Take the bag.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "D" - }, - { - "sample_id": 10, - "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the bag.\nB. Take the food.\nC. Take the phone/camera.\nD. Put down the shoe.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Put down the bag.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "A" - }, - { - "sample_id": 11, - "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the picture.\nB. Eat the medicine.\nC. Tidy up the table.\nD. Close the closet/cabinet.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Take the picture.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "A" - }, - { - "sample_id": 12, - "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the broom.\nB. Open the bag.\nC. Take the cup/glass/bottle.\nD. Put down the paper/notebook.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Put down the paper/notebook.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "D" - }, - { - "sample_id": 13, - "question": "Using the given pictures as a reference, anticipate the person's upcoming action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the bag.\nB. Wash the window.\nC. Tidy up the blanket.\nD. Sit on the sofa/couch.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Wash the window.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "A" - }, - { - "sample_id": 15, - "question": "Evaluate the given images and infer the individual's next step. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the shoe.\nB. Open the book.\nC. Take the shoe.\nD. Open the box.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Open the box.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "B" - }, - { - "sample_id": 85, - "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the book.\nB. Take the bag.\nC. Put down the paper/notebook.\nD. Open the laptop.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Open the laptop.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "B" - }, - { - "sample_id": 17, - "question": "Infer the next action of the person from the presented images. You must choose your answer from the Choice List.\nWhat will the person do next with the blanket?\nChoice list: \nA. Tidy up.\nB. Sit on.\nC. Put down.\nD. Take.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Put down.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "B" - }, - { - "sample_id": 22, - "question": "Based on the given images, prediction the person's next action You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Close the box.\nB. Put down the towel.\nC. Take the laptop.\nD. Close the closet/cabinet.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Put down the towel.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "B" - }, - { - "sample_id": 24, - "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the closet/cabinet.\nB. Put down the phone/camera.\nC. Open the book.\nD. Open the bag.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Put down the phone/camera.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "B" - }, - { - "sample_id": 26, - "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the closet/cabinet.\nB. Open the door.\nC. Close the closet/cabinet.\nD. Tidy up the clothes.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Close the closet/cabinet.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "B" - }, - { - "sample_id": 31, - "question": "Evaluate the given images and infer the individual's next step. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Close the window.\nB. Close the refrigerator.\nC. Sit on the sofa/couch.\nD. Open the closet/cabinet.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Sit on the sofa/couch.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "C" - }, - { - "sample_id": 34, - "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the cup/glass/bottle.\nB. Put down the broom.\nC. Open the bag.\nD. Lie on the sofa/couch.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Open the bag.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "C" - }, - { - "sample_id": 35, - "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Sit on the floor.\nB. Open the bag.\nC. Lie on the bed.\nD. Tidy up the table.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Sit on the floor.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "A" - }, - { - "sample_id": 51, - "question": "Evaluate the given images and infer the individual's next step. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Wash the window.\nB. Sit at the table.\nC. Throw the book.\nD. Throw the pillow.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Throw the book.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "D" - }, - { - "sample_id": 58, - "question": "With the given visuals as your guide, infer the individual's impending action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Throw the blanket.\nB. Take the phone/camera.\nC. Close the door.\nD. Open the closet/cabinet.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Take the phone/camera.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "B" - }, - { - "sample_id": 65, - "question": "Infer the next action of the person from the presented images. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the door.\nB. Take the shoe.\nC. Take the book.\nD. Eat the sandwich.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Eat the sandwich.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "D" - }, - { - "sample_id": 67, - "question": "Study the provided images and predict the individual's forthcoming behavior. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Wash the mirror.\nB. Close the box.\nC. Put down the towel.\nD. Open the door.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Put down the towel.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "C" - }, - { - "sample_id": 68, - "question": "Study the provided images and predict the individual's forthcoming behavior. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the closet/cabinet.\nB. Eat the medicine.\nC. Tidy up the table.\nD. Put down the shoe.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Put down the shoe.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "D" - }, - { - "sample_id": 20, - "question": "Study the provided images and predict the individual's forthcoming behavior. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Wash the table.\nB. Lie on the floor.\nC. Put down the towel.\nD. Take the box.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Wash the table.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "D" - }, - { - "sample_id": 27, - "question": "Evaluate the given images and infer the individual's next step. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Close the refrigerator.\nB. Open the refrigerator.\nC. Throw the clothes.\nD. Close the closet/cabinet.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Close the refrigerator.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "A" - }, - { - "sample_id": 32, - "question": "Evaluate the given images and infer the individual's next step. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Close the closet/cabinet.\nB. Put down the paper/notebook.\nC. Take the dish.\nD. Take the food.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Put down the paper/notebook.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "B" - }, - { - "sample_id": 36, - "question": "Based on the given images, prediction the person's next action You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Close the laptop.\nB. Open the book.\nC. Sit on the bed.\nD. Put down the paper/notebook.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Close the laptop.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "A" - }, - { - "sample_id": 41, - "question": "Using the given pictures as a reference, anticipate the person's upcoming action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Throw the blanket.\nB. Eat the medicine.\nC. Lie on the sofa/couch.\nD. Put down the box.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Throw the blanket.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "A" - }, - { - "sample_id": 44, - "question": "Using the given pictures as a reference, anticipate the person's upcoming action. You must choose your answer from the Choice List.\nWhat will the person do next with the blanket?\nChoice list: \nA. Put down.\nB. Take.\nC. Hold.\nD. Throw.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Put down.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "B" - }, - { - "sample_id": 46, - "question": "With the given visuals as your guide, infer the individual's impending action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the clothes.\nB. Tidy up the clothes.\nC. Take the bag.\nD. Lie on the sofa/couch.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Lie on the sofa/couch.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "D" - }, - { - "sample_id": 49, - "question": "Based on the given images, prediction the person's next action You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Lie on the sofa/couch.\nB. Close the box.\nC. Lie on the floor.\nD. Hold the book.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Lie on the sofa/couch.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "A" - }, - { - "sample_id": 52, - "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the pillow.\nB. Lie on the bed.\nC. Close the window.\nD. Wash the cup/glass/bottle.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Close the window.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "C" - }, - { - "sample_id": 53, - "question": "Study the provided images and predict the individual's forthcoming behavior. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Throw the towel.\nB. Eat the sandwich.\nC. Put down the broom.\nD. Open the book.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Throw the towel.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "A" - }, - { - "sample_id": 59, - "question": "With the given visuals as your guide, infer the individual's impending action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Wash the cup/glass/bottle.\nB. Take the bag.\nC. Throw the pillow.\nD. Take the food.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Take the bag.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "D" - }, - { - "sample_id": 61, - "question": "Study the provided images and predict the individual's forthcoming behavior. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Wash the table.\nB. Eat the medicine.\nC. Throw the shoe.\nD. Take the blanket.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Take the blanket.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "D" - }, - { - "sample_id": 70, - "question": "Infer the next action of the person from the presented images. You must choose your answer from the Choice List.\nWhat will the person do next with the cup/glass/bottle?\nChoice list: \nA. Put down.\nB. Wash.\nC. Close.\nD. Take.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Put down.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "A" - }, - { - "sample_id": 141, - "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the clothes.\nB. Wash the mirror.\nC. Take the bag.\nD. Put down the phone/camera.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Put down the phone/camera.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "D" - }, - { - "sample_id": 82, - "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Close the refrigerator.\nB. Take the book.\nC. Open the bag.\nD. Tidy up the blanket.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Close the refrigerator.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "A" - }, - { - "sample_id": 89, - "question": "Using the given pictures as a reference, anticipate the person's upcoming action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the bag.\nB. Throw the shoe.\nC. Put down the cup/glass/bottle.\nD. Put down the towel.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Put down the towel.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "D" - }, - { - "sample_id": 98, - "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Tidy up the towel.\nB. Hold the blanket.\nC. Eat the sandwich.\nD. Take the dish.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Eat the sandwich.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "C" - }, - { - "sample_id": 111, - "question": "Analyze the provided visuals and forecast the individual's subsequent move. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the clothes.\nB. Put down the picture.\nC. Tidy up the blanket.\nD. Open the bag.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Open the bag.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "D" - }, - { - "sample_id": 133, - "question": "Based on the given images, prediction the person's next action You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Close the refrigerator.\nB. Open the door.\nC. Tidy up the clothes.\nD. Take the book.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Close the refrigerator.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "A" - }, - { - "sample_id": 134, - "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Close the book.\nB. Take the pillow.\nC. Put down the picture.\nD. Close the box.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Take the pillow.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "B" - }, - { - "sample_id": 138, - "question": "Based on the given images, prediction the person's next action You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the laptop.\nB. Take the phone/camera.\nC. Take the clothes.\nD. Open the laptop.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Put down the laptop.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "B" - }, - { - "sample_id": 150, - "question": "Using the given pictures as a reference, anticipate the person's upcoming action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the closet/cabinet.\nB. Wash the clothes.\nC. Take the book.\nD. Open the book.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Take the book.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "C" - }, - { - "sample_id": 158, - "question": "Evaluate the given images and infer the individual's next step. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the box.\nB. Take the dish.\nC. Put down the sandwich.\nD. Sit on the sofa/couch.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Sit on the sofa/couch.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "D" - }, - { - "sample_id": 164, - "question": "Study the provided images and predict the individual's forthcoming behavior. You must choose your answer from the Choice List.\nWhat will the person do next with the bed?\nChoice list: \nA. Eat.\nB. Take.\nC. Lie on.\nD. Sit on.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Lie on.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "C" - }, - { - "sample_id": 171, - "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Eat the medicine.\nB. Put down the food.\nC. Close the book.\nD. Put down the book.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Close the book.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "D" - }, - { - "sample_id": 174, - "question": "With the given visuals as your guide, infer the individual's impending action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Lie on the floor.\nB. Close the refrigerator.\nC. Open the box.\nD. Take the book.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Close the refrigerator.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "B" - }, - { - "sample_id": 194, - "question": "Using the given pictures as a reference, anticipate the person's upcoming action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the dish.\nB. Eat the medicine.\nC. Put down the clothes.\nD. Take the paper/notebook.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Take the dish.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "C" - }, - { - "sample_id": 62, - "question": "With the given visuals as your guide, infer the individual's impending action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Eat the medicine.\nB. Take the box.\nC. Take the book.\nD. Take the dish.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Take the box.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "A" - }, - { - "sample_id": 40, - "question": "Study the provided images and predict the individual's forthcoming behavior. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Eat the medicine.\nB. Take the shoe.\nC. Take the clothes.\nD. Throw the food.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Take the shoe.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "B" - }, - { - "sample_id": 64, - "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the phone/camera.\nB. Close the book.\nC. Take the towel.\nD. Throw the food.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Take the towel.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "C" - }, - { - "sample_id": 30, - "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the bag.\nB. Put down the shoe.\nC. Wash the dish.\nD. Sit on the sofa/couch.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Put down the shoe.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "B" - }, - { - "sample_id": 63, - "question": "With the given visuals as your guide, infer the individual's impending action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the book.\nB. Take the sandwich.\nC. Open the closet/cabinet.\nD. Hold the food.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Put down the book.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "A" - }, - { - "sample_id": 99, - "question": "Infer the next action of the person from the presented images. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Close the laptop.\nB. Put down the book.\nC. Throw the clothes.\nD. Lie on the sofa/couch.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Close the laptop.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "A" - }, - { - "sample_id": 45, - "question": "Analyze the provided visuals and forecast the individual's subsequent move. You must choose your answer from the Choice List.\nWhat will the person do next with the blanket?\nChoice list: \nA. Put down.\nB. Tidy up.\nC. Hold.\nD. Take.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Tidy up.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "A" - }, - { - "sample_id": 55, - "question": "Based on the given images, prediction the person's next action You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the box.\nB. Throw the food.\nC. Tidy up the towel.\nD. Sit on the sofa/couch.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Take the box.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "A" - }, - { - "sample_id": 81, - "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the book.\nB. Sit on the table.\nC. Take the food.\nD. Put down the box.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Put down the box.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "A" - }, - { - "sample_id": 94, - "question": "Using the given pictures as a reference, anticipate the person's upcoming action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the sandwich.\nB. Open the bag.\nC. Take the towel.\nD. Take the food.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Open the bag.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "D" - }, - { - "sample_id": 79, - "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the towel.\nB. Open the laptop.\nC. Wash the clothes.\nD. Sit on the bed.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Sit on the bed.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "D" - }, - { - "sample_id": 95, - "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the pillow.\nB. Take the book.\nC. Open the book.\nD. Open the closet/cabinet.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Take the pillow.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "B" - }, - { - "sample_id": 104, - "question": "Evaluate the given images and infer the individual's next step. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Sit on the sofa/couch.\nB. Take the phone/camera.\nC. Put down the box.\nD. Tidy up the clothes.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Put down the box.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "C" - }, - { - "sample_id": 106, - "question": "Infer the next action of the person from the presented images. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the sandwich.\nB. Open the refrigerator.\nC. Put down the phone/camera.\nD. Wash the window.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Take the sandwich.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "C" - }, - { - "sample_id": 108, - "question": "Study the provided images and predict the individual's forthcoming behavior. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the shoe.\nB. Take the food.\nC. Close the door.\nD. Put down the cup/glass/bottle.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Take the food.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "B" - }, - { - "sample_id": 116, - "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the bag.\nB. Put down the phone/camera.\nC. Put down the food.\nD. Close the book.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Put down the phone/camera.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "B" - }, - { - "sample_id": 122, - "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Sit on the bed.\nB. Sit on the sofa/couch.\nC. Throw the blanket.\nD. Take the paper/notebook.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Take the paper/notebook.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "D" - }, - { - "sample_id": 76, - "question": "Study the provided images and predict the individual's forthcoming behavior. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the broom.\nB. Put down the blanket.\nC. Close the refrigerator.\nD. Put down the bag.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Close the refrigerator.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "C" - }, - { - "sample_id": 84, - "question": "Infer the next action of the person from the presented images. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the cup/glass/bottle.\nB. Open the closet/cabinet.\nC. Put down the paper/notebook.\nD. Put down the phone/camera.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Put down the paper/notebook.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "C" - }, - { - "sample_id": 113, - "question": "Using the given pictures as a reference, anticipate the person's upcoming action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Throw the book.\nB. Wash the table.\nC. Throw the pillow.\nD. Take the food.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Throw the pillow.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "C" - }, - { - "sample_id": 127, - "question": "Infer the next action of the person from the presented images. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the book.\nB. Take the clothes.\nC. Eat the medicine.\nD. Close the closet/cabinet.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Take the clothes.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "B" - }, - { - "sample_id": 72, - "question": "Analyze the provided visuals and forecast the individual's subsequent move. You must choose your answer from the Choice List.\nWhat will the person do next with the food?\nChoice list: \nA. Open.\nB. Put down.\nC. Throw.\nD. Take.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Put down.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "D" - }, - { - "sample_id": 48, - "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Close the window.\nB. Take the towel.\nC. Take the shoe.\nD. Take the food.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Close the window.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "C" - }, - { - "sample_id": 73, - "question": "Study the provided images and predict the individual's forthcoming behavior. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the pillow.\nB. Tidy up the clothes.\nC. Take the box.\nD. Put down the dish.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Take the box.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "B" - }, - { - "sample_id": 120, - "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next with the bed?\nChoice list: \nA. Put down.\nB. Throw.\nC. Sit on.\nD. Lie on.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Sit on.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "C" - }, - { - "sample_id": 54, - "question": "Using the given pictures as a reference, anticipate the person's upcoming action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the laptop.\nB. Put down the dish.\nC. Sit on the floor.\nD. Take the box.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Put down the laptop.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "A" - }, - { - "sample_id": 135, - "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the blanket.\nB. Take the blanket.\nC. Wash the clothes.\nD. Put down the sandwich.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Put down the sandwich.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "D" - }, - { - "sample_id": 19, - "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Wash the window.\nB. Throw the clothes.\nC. Open the box.\nD. Put down the book.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Open the box.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "C" - }, - { - "sample_id": 121, - "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the dish.\nB. Take the clothes.\nC. Lie on the sofa/couch.\nD. Put down the pillow.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Take the clothes.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "A" - }, - { - "sample_id": 74, - "question": "Analyze the provided visuals and forecast the individual's subsequent move. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Eat the sandwich.\nB. Take the box.\nC. Put down the blanket.\nD. Put down the bag.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Put down the blanket.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "C" - }, - { - "sample_id": 77, - "question": "With the given visuals as your guide, infer the individual's impending action. You must choose your answer from the Choice List.\nWhat will the person do next with the table?\nChoice list: \nA. Take.\nB. Tidy up.\nC. Sit at.\nD. Wash.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Sit at.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "C" - }, - { - "sample_id": 80, - "question": "Analyze the provided visuals and forecast the individual's subsequent move. You must choose your answer from the Choice List.\nWhat will the person do next with the sofa/couch?\nChoice list: \nA. Put down.\nB. Lie on.\nC. Throw.\nD. Sit on.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Sit on.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "D" - }, - { - "sample_id": 83, - "question": "Based on the given images, prediction the person's next action You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the book.\nB. Open the closet/cabinet.\nC. Take the sandwich.\nD. Take the food.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Open the book.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "A" - }, - { - "sample_id": 88, - "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the shoe.\nB. Lie on the floor.\nC. Close the box.\nD. Tidy up the blanket.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Tidy up the blanket.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "A" - }, - { - "sample_id": 90, - "question": "Analyze the provided visuals and forecast the individual's subsequent move. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Tidy up the clothes.\nB. Take the pillow.\nC. Take the laptop.\nD. Take the box.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Take the laptop.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "B" - }, - { - "sample_id": 91, - "question": "With the given visuals as your guide, infer the individual's impending action. You must choose your answer from the Choice List.\nWhat will the person do next with the cup/glass/bottle?\nChoice list: \nA. Take.\nB. Eat.\nC. Put down.\nD. Wash.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Put down.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "A" - }, - { - "sample_id": 93, - "question": "Analyze the provided visuals and forecast the individual's subsequent move. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the phone/camera.\nB. Open the bag.\nC. Put down the blanket.\nD. Throw the food.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Put down the blanket.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "B" - }, - { - "sample_id": 97, - "question": "Infer the next action of the person from the presented images. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the sandwich.\nB. Put down the blanket.\nC. Take the cup/glass/bottle.\nD. Eat the sandwich.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Take the sandwich.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "D" - }, - { - "sample_id": 100, - "question": "Based on the given images, prediction the person's next action You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the book.\nB. Close the closet/cabinet.\nC. Put down the bag.\nD. Put down the paper/notebook.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Open the book.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "A" - }, - { - "sample_id": 103, - "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the box.\nB. Tidy up the blanket.\nC. Close the laptop.\nD. Put down the paper/notebook.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Close the laptop.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "C" - }, - { - "sample_id": 107, - "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Tidy up the blanket.\nB. Open the refrigerator.\nC. Open the closet/cabinet.\nD. Throw the box.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Open the refrigerator.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "B" - }, - { - "sample_id": 39, - "question": "Using the given pictures as a reference, anticipate the person's upcoming action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the cup/glass/bottle.\nB. Tidy up the blanket.\nC. Take the pillow.\nD. Put down the dish.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Take the pillow.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "C" - }, - { - "sample_id": 180, - "question": "Evaluate the given images and infer the individual's next step. You must choose your answer from the Choice List.\nWhat will the person do next with the cup/glass/bottle?\nChoice list: \nA. Take.\nB. Put down.\nC. Wash.\nD. Lie on.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Put down.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "A" - }, - { - "sample_id": 71, - "question": "Infer the next action of the person from the presented images. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the clothes.\nB. Lie on the floor.\nC. Sit on the table.\nD. Put down the towel.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Put down the towel.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "D" - }, - { - "sample_id": 145, - "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Throw the clothes.\nB. Close the window.\nC. Put down the food.\nD. Wash the clothes.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Throw the clothes.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "A" - }, - { - "sample_id": 117, - "question": "Study the provided images and predict the individual's forthcoming behavior. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the cup/glass/bottle.\nB. Wash the mirror.\nC. Open the box.\nD. Open the door.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Open the door.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "D" - }, - { - "sample_id": 195, - "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Throw the book.\nB. Take the towel.\nC. Close the door.\nD. Put down the book.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Put down the book.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "D" - }, - { - "sample_id": 149, - "question": "Infer the next action of the person from the presented images. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the sandwich.\nB. Take the dish.\nC. Wash the dish.\nD. Close the laptop.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Put down the sandwich.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "B" - }, - { - "sample_id": 163, - "question": "Based on the given images, prediction the person's next action You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Throw the food.\nB. Take the box.\nC. Put down the broom.\nD. Close the closet/cabinet.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Put down the broom.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "C" - }, - { - "sample_id": 137, - "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next with the food?\nChoice list: \nA. Hold.\nB. Throw.\nC. Take.\nD. Put down.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Put down.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "C" - }, - { - "sample_id": 185, - "question": "With the given visuals as your guide, infer the individual's impending action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the clothes.\nB. Put down the clothes.\nC. Put down the broom.\nD. Put down the picture.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Put down the broom.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "C" - }, - { - "sample_id": 129, - "question": "Study the provided images and predict the individual's forthcoming behavior. You must choose your answer from the Choice List.\nWhat will the person do next with the food?\nChoice list: \nA. Put down.\nB. Hold.\nC. Take.\nD. Throw.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Put down.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "C" - }, - { - "sample_id": 69, - "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the clothes.\nB. Take the dish.\nC. Hold the picture.\nD. Take the bag.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Take the bag.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "D" - }, - { - "sample_id": 87, - "question": "Evaluate the given images and infer the individual's next step. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Sit at the table.\nB. Close the window.\nC. Take the cup/glass/bottle.\nD. Eat the sandwich.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Eat the sandwich.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "D" - }, - { - "sample_id": 131, - "question": "Based on the given images, prediction the person's next action You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the food.\nB. Take the blanket.\nC. Eat the medicine.\nD. Open the refrigerator.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Take the blanket.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "A" - }, - { - "sample_id": 132, - "question": "Based on the given images, prediction the person's next action You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Wash the cup/glass/bottle.\nB. Put down the laptop.\nC. Put down the cup/glass/bottle.\nD. Put down the shoe.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Put down the shoe.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "D" - }, - { - "sample_id": 155, - "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the shoe.\nB. Take the book.\nC. Sit on the table.\nD. Take the box.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Take the shoe.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "A" - }, - { - "sample_id": 101, - "question": "Using the given pictures as a reference, anticipate the person's upcoming action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the door.\nB. Open the refrigerator.\nC. Tidy up the towel.\nD. Lie on the bed.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Open the refrigerator.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "B" - }, - { - "sample_id": 102, - "question": "Study the provided images and predict the individual's forthcoming behavior. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the cup/glass/bottle.\nB. Close the box.\nC. Put down the cup/glass/bottle.\nD. Open the laptop.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Open the laptop.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "D" - }, - { - "sample_id": 112, - "question": "Evaluate the given images and infer the individual's next step. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Lie on the bed.\nB. Put down the dish.\nC. Throw the clothes.\nD. Sit on the table.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Throw the clothes.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "C" - }, - { - "sample_id": 118, - "question": "Study the provided images and predict the individual's forthcoming behavior. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the book.\nB. Eat the sandwich.\nC. Open the door.\nD. Throw the blanket.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Take the book.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "A" - }, - { - "sample_id": 126, - "question": "Analyze the provided visuals and forecast the individual's subsequent move. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Close the book.\nB. Put down the pillow.\nC. Open the bag.\nD. Tidy up the clothes.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Put down the pillow.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "D" - }, - { - "sample_id": 128, - "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next with the food?\nChoice list: \nA. Hold.\nB. Put down.\nC. Take.\nD. Throw.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Put down.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "C" - }, - { - "sample_id": 130, - "question": "Using the given pictures as a reference, anticipate the person's upcoming action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Tidy up the closet/cabinet.\nB. Take the food.\nC. Close the refrigerator.\nD. Close the laptop.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Close the refrigerator.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "C" - }, - { - "sample_id": 148, - "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the box.\nB. Tidy up the clothes.\nC. Take the phone/camera.\nD. Open the bag.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Tidy up the clothes.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "D" - }, - { - "sample_id": 152, - "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Lie on the floor.\nB. Put down the shoe.\nC. Take the paper/notebook.\nD. Take the book.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Put down the shoe.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "B" - }, - { - "sample_id": 153, - "question": "Study the provided images and predict the individual's forthcoming behavior. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the clothes.\nB. Take the food.\nC. Close the book.\nD. Throw the box.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Close the book.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "C" - }, - { - "sample_id": 86, - "question": "Study the provided images and predict the individual's forthcoming behavior. You must choose your answer from the Choice List.\nWhat will the person do next with the table?\nChoice list: \nA. Close.\nB. Sit at.\nC. Tidy up.\nD. Wash.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Sit at.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "B" - }, - { - "sample_id": 96, - "question": "Analyze the provided visuals and forecast the individual's subsequent move. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the book.\nB. Eat the sandwich.\nC. Lie on the bed.\nD. Take the box.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Eat the sandwich.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "B" - }, - { - "sample_id": 146, - "question": "Evaluate the given images and infer the individual's next step. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the laptop.\nB. Put down the paper/notebook.\nC. Put down the picture.\nD. Hold the blanket.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Put down the picture.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "C" - }, - { - "sample_id": 78, - "question": "Analyze the provided visuals and forecast the individual's subsequent move. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Close the box.\nB. Take the phone/camera.\nC. Put down the book.\nD. Throw the clothes.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Close the box.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "A" - }, - { - "sample_id": 144, - "question": "With the given visuals as your guide, infer the individual's impending action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Lie on the sofa/couch.\nB. Open the door.\nC. Sit on the bed.\nD. Close the laptop.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Sit on the bed.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "C" - }, - { - "sample_id": 151, - "question": "Based on the given images, prediction the person's next action You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Lie on the sofa/couch.\nB. Put down the bag.\nC. Take the shoe.\nD. Take the towel.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Take the shoe.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "C" - }, - { - "sample_id": 161, - "question": "Based on the given images, prediction the person's next action You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the phone/camera.\nB. Take the clothes.\nC. Sit on the sofa/couch.\nD. Take the box.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Take the clothes.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "B" - }, - { - "sample_id": 66, - "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the cup/glass/bottle.\nB. Eat the sandwich.\nC. Lie on the floor.\nD. Open the closet/cabinet.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Open the closet/cabinet.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "D" - }, - { - "sample_id": 140, - "question": "Analyze the provided visuals and forecast the individual's subsequent move. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Close the door.\nB. Close the closet/cabinet.\nC. Tidy up the table.\nD. Take the dish.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Take the dish.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "D" - }, - { - "sample_id": 109, - "question": "Evaluate the given images and infer the individual's next step. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the box.\nB. Sit at the table.\nC. Take the sandwich.\nD. Lie on the sofa/couch.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Open the box.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "A" - }, - { - "sample_id": 110, - "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Throw the book.\nB. Throw the clothes.\nC. Wash the table.\nD. Open the door.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Throw the clothes.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "A" - }, - { - "sample_id": 114, - "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the bag.\nB. Hold the box.\nC. Throw the blanket.\nD. Sit on the sofa/couch.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Throw the blanket.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "C" - }, - { - "sample_id": 119, - "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the shoe.\nB. Throw the clothes.\nC. Open the book.\nD. Throw the bag.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Put down the shoe.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "A" - }, - { - "sample_id": 123, - "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Wash the dish.\nB. Open the closet/cabinet.\nC. Take the food.\nD. Throw the towel.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Throw the towel.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "B" - }, - { - "sample_id": 124, - "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next with the pillow?\nChoice list: \nA. Tidy up.\nB. Throw.\nC. Put down.\nD. Take.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Put down.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "D" - }, - { - "sample_id": 125, - "question": "Analyze the provided visuals and forecast the individual's subsequent move. You must choose your answer from the Choice List.\nWhat will the person do next with the blanket?\nChoice list: \nA. Put down.\nB. Throw.\nC. Lie on.\nD. Tidy up.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Tidy up.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "A" - }, - { - "sample_id": 136, - "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the door.\nB. Sit at the table.\nC. Lie on the sofa/couch.\nD. Throw the food.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Sit at the table.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "D" - }, - { - "sample_id": 142, - "question": "Analyze the provided visuals and forecast the individual's subsequent move. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the window.\nB. Open the book.\nC. Wash the mirror.\nD. Close the door.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Wash the mirror.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "C" - }, - { - "sample_id": 143, - "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the box.\nB. Take the book.\nC. Tidy up the broom.\nD. Put down the bag.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Put down the bag.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "D" - }, - { - "sample_id": 154, - "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Throw the box.\nB. Take the bag.\nC. Lie on the bed.\nD. Sit on the floor.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Lie on the bed.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "A" - }, - { - "sample_id": 182, - "question": "Based on the given images, prediction the person's next action You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the paper/notebook.\nB. Hold the phone/camera.\nC. Throw the blanket.\nD. Close the window.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Close the window.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "D" - }, - { - "sample_id": 139, - "question": "Study the provided images and predict the individual's forthcoming behavior. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the bag.\nB. Throw the bag.\nC. Open the door.\nD. Put down the pillow.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Put down the pillow.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "D" - }, - { - "sample_id": 179, - "question": "Using the given pictures as a reference, anticipate the person's upcoming action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the bag.\nB. Take the shoe.\nC. Put down the phone/camera.\nD. Throw the towel.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Put down the phone/camera.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "C" - }, - { - "sample_id": 186, - "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the box.\nB. Sit on the table.\nC. Close the refrigerator.\nD. Wash the cup/glass/bottle.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Open the box.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "A" - }, - { - "sample_id": 160, - "question": "Study the provided images and predict the individual's forthcoming behavior. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the food.\nB. Throw the blanket.\nC. Open the door.\nD. Tidy up the closet/cabinet.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Put down the food.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "A" - }, - { - "sample_id": 92, - "question": "Based on the given images, prediction the person's next action You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the phone/camera.\nB. Put down the bag.\nC. Throw the clothes.\nD. Open the closet/cabinet.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Throw the clothes.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "C" - }, - { - "sample_id": 199, - "question": "Evaluate the given images and infer the individual's next step. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Tidy up the clothes.\nB. Take the blanket.\nC. Open the door.\nD. Sit on the bed.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Tidy up the clothes.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "C" - }, - { - "sample_id": 157, - "question": "With the images at your disposal, foresee the person's impending maneuver. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Wash the clothes.\nB. Put down the cup/glass/bottle.\nC. Take the food.\nD. Take the book.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Take the book.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "D" - }, - { - "sample_id": 183, - "question": "Evaluate the given images and infer the individual's next step. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Wash the window.\nB. Take the laptop.\nC. Close the box.\nD. Eat the medicine.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Take the laptop.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "D" - }, - { - "sample_id": 191, - "question": "Study the provided images and predict the individual's forthcoming behavior. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Wash the cup/glass/bottle.\nB. Put down the sandwich.\nC. Put down the shoe.\nD. Throw the book.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Throw the book.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "D" - }, - { - "sample_id": 147, - "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the box.\nB. Open the bag.\nC. Close the door.\nD. Throw the towel.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Open the bag.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "B" - }, - { - "sample_id": 167, - "question": "Using the given pictures as a reference, anticipate the person's upcoming action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the phone/camera.\nB. Close the door.\nC. Close the refrigerator.\nD. Throw the bag.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Take the phone/camera.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "A" - }, - { - "sample_id": 187, - "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the towel.\nB. Open the door.\nC. Put down the dish.\nD. Throw the broom.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Put down the towel.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "A" - }, - { - "sample_id": 168, - "question": "Evaluate the given images and infer the individual's next step. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the door.\nB. Close the door.\nC. Sit on the table.\nD. Put down the sandwich.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Put down the sandwich.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "D" - }, - { - "sample_id": 170, - "question": "Study the provided images and predict the individual's forthcoming behavior. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the phone/camera.\nB. Throw the bag.\nC. Put down the food.\nD. Open the laptop.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Open the laptop.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "D" - }, - { - "sample_id": 173, - "question": "Based on the given images, prediction the person's next action You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Close the laptop.\nB. Sit on the table.\nC. Throw the clothes.\nD. Take the dish.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Throw the clothes.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "C" - }, - { - "sample_id": 176, - "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Lie on the sofa/couch.\nB. Throw the clothes.\nC. Take the clothes.\nD. Close the closet/cabinet.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Take the clothes.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "C" - }, - { - "sample_id": 177, - "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Wash the mirror.\nB. Close the box.\nC. Throw the clothes.\nD. Take the sandwich.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Take the sandwich.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "D" - }, - { - "sample_id": 190, - "question": "With the given visuals as your guide, infer the individual's impending action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the book.\nB. Put down the cup/glass/bottle.\nC. Open the door.\nD. Close the door.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Put down the book.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "A" - }, - { - "sample_id": 115, - "question": "Using the given pictures as a reference, anticipate the person's upcoming action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the sandwich.\nB. Put down the book.\nC. Lie on the floor.\nD. Take the dish.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Put down the sandwich.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "B" - }, - { - "sample_id": 169, - "question": "Infer the next action of the person from the presented images. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the window.\nB. Take the food.\nC. Put down the clothes.\nD. Open the book.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Put down the clothes.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "C" - }, - { - "sample_id": 192, - "question": "Analyze the provided visuals and forecast the individual's subsequent move. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Open the box.\nB. Take the bag.\nC. Wash the table.\nD. Put down the dish.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Take the bag.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "B" - }, - { - "sample_id": 105, - "question": "Using the given pictures as a reference, anticipate the person's upcoming action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the dish.\nB. Take the book.\nC. Eat the sandwich.\nD. Throw the box.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Take the book.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "B" - }, - { - "sample_id": 165, - "question": "Evaluate the given images and infer the individual's next step. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Throw the bag.\nB. Take the book.\nC. Put down the phone/camera.\nD. Open the refrigerator.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Open the refrigerator.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "D" - }, - { - "sample_id": 198, - "question": "Using the given pictures as a reference, anticipate the person's upcoming action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the clothes.\nB. Close the door.\nC. Tidy up the table.\nD. Wash the clothes.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Take the clothes.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "A" - }, - { - "sample_id": 197, - "question": "Evaluate the given images and infer the individual's next step. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the cup/glass/bottle.\nB. Close the box.\nC. Put down the blanket.\nD. Take the pillow.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Put down the blanket.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "C" - }, - { - "sample_id": 156, - "question": "Using the given pictures as a reference, anticipate the person's upcoming action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Eat the sandwich.\nB. Close the refrigerator.\nC. Take the bag.\nD. Sit on the sofa/couch.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Take the bag.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "C" - }, - { - "sample_id": 159, - "question": "Evaluate the given images and infer the individual's next step. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the cup/glass/bottle.\nB. Put down the bag.\nC. Put down the cup/glass/bottle.\nD. Take the clothes.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Put down the bag.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "B" - }, - { - "sample_id": 162, - "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next with the floor?\nChoice list: \nA. Take.\nB. Sit on.\nC. Lie on.\nD. Close.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Sit on.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "B" - }, - { - "sample_id": 166, - "question": "With the given visuals as your guide, infer the individual's impending action. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Tidy up the table.\nB. Take the sandwich.\nC. Throw the blanket.\nD. Open the bag.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Throw the blanket.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "C" - }, - { - "sample_id": 172, - "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the food.\nB. Take the paper/notebook.\nC. Lie on the bed.\nD. Sit on the sofa/couch.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Take the paper/notebook.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "B" - }, - { - "sample_id": 175, - "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the paper/notebook.\nB. Take the cup/glass/bottle.\nC. Eat the sandwich.\nD. Open the window.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Take the paper/notebook.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "A" - }, - { - "sample_id": 178, - "question": "Analyze the provided visuals and forecast the individual's subsequent move. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the box.\nB. Open the window.\nC. Open the refrigerator.\nD. Sit at the table.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Sit at the table.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "A" - }, - { - "sample_id": 181, - "question": "Infer the next action of the person from the presented images. You must choose your answer from the Choice List.\nWhat will the person do next with the blanket?\nChoice list: \nA. Sit at.\nB. Throw.\nC. Tidy up.\nD. Put down.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Put down.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "D" - }, - { - "sample_id": 184, - "question": "Infer the next action of the person from the presented images. You must choose your answer from the Choice List.\nWhat will the person do next with the clothes?\nChoice list: \nA. Put down.\nB. Take.\nC. Throw.\nD. Wash.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Put down.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "A" - }, - { - "sample_id": 188, - "question": "Based on the given images, prediction the person's next action You must choose your answer from the Choice List.\nWhat will the person do next with the floor?\nChoice list: \nA. Put down.\nB. Lie on.\nC. Sit on.\nD. Eat.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Sit on.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "C" - }, - { - "sample_id": 193, - "question": "Examine the images at hand and forecast the person's imminent activity. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Take the paper/notebook.\nB. Wash the mirror.\nC. Take the bag.\nD. Open the closet/cabinet.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Take the paper/notebook.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "A" - }, - { - "sample_id": 189, - "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next with the blanket?\nChoice list: \nA. Throw.\nB. Hold.\nC. Tidy up.\nD. Put down.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Put down.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "D" - }, - { - "sample_id": 196, - "question": "From the images supplied, deduce the likely next step of the person. You must choose your answer from the Choice List.\nWhat will the person do next?\nChoice list: \nA. Put down the pillow.\nB. Lie on the floor.\nC. Put down the broom.\nD. Take the phone/camera.\nAnswer with the option's letter from the given choices directly.", - "gt_response": "Put down the broom.", - "gen_kwargs": { - "do_sample": false, - "num_beams": 1, - "max_new_tokens": 32, - "eos_token_id": 92542 - }, - "pred_response": "C" - } -] \ No newline at end of file