diff --git "a/weights/model-idf/prediction.json" "b/weights/model-idf/prediction.json"
new file mode 100644--- /dev/null
+++ "b/weights/model-idf/prediction.json"
@@ -0,0 +1,2132 @@
+[
+ {
+ "id": 1,
+ "question": "Ben Milo is image_1\n In the image: image_2\n Identify Ben Milo with grounding.",
+ "prediction": "[Ben Milo](646,219),(958,985)"
+ },
+ {
+ "id": 2,
+ "question": "Caption Mitch is image_1\n In the image: image_2\n What is Caption Mitch doing?",
+ "prediction": "Caption Mitch is standing with his arms crossed."
+ },
+ {
+ "id": 3,
+ "question": "Caption Mitch is image_1\n Vern is image_2\n In the image: image_3\n Give a description.",
+ "prediction": "Mitch is standing on the left, facing Vern, who is on the right holding a horse's reins. Both are in military attire, in a rugged outdoor setting with rocky terrain and vegetation in the background. There are other soldiers and horses under the sky."
+ },
+ {
+ "id": 4,
+ "question": "Caption Mitch is image_1\n Gen. Dostum is image_2\n In the image: image_3\n Who is holding an interphone?",
+ "prediction": "Gen. Dostum is holding an interphone."
+ },
+ {
+ "id": 5,
+ "question": "Hal Spencer is image_1\n In the image: image_2\n How is his state?",
+ "prediction": "Hal Spencer is lying on the ground, seemingly injured."
+ },
+ {
+ "id": 6,
+ "question": "Vern is image_1\n In the image: image_2\n What is Vern doing?",
+ "prediction": "Vern is aiming a rifle."
+ },
+ {
+ "id": 7,
+ "question": "Kyle is image_1\n Adam is image_2\n In the image: image_3\n What is Kyle's state?",
+ "prediction": "Kyle is in a conversation with another person."
+ },
+ {
+ "id": 8,
+ "question": "Diane is image_1\n In the image: image_2\n Identify Diane with grounding.",
+ "prediction": "[Diane](10,11),(417,992)"
+ },
+ {
+ "id": 9,
+ "question": "Adam is image_1\n Diane is image_2\n Richard is image_3\n In the image: image_4\n Identify Richard with grounding.",
+ "prediction": "[Richard](0,205),(341,976)"
+ },
+ {
+ "id": 10,
+ "question": "Alan is image_1\n Mitch is image_2\n Please describe the image: image_3\n",
+ "prediction": "Alan is seated on the left, holding a bowl of chips, while Mitch is on the right with his arm resting on a chair. They appear to be in a medical setting."
+ },
+ {
+ "id": 11,
+ "question": "Mitch is image_1\n In the image: image_2\n What color is Mitch's clothes?",
+ "prediction": "Mitch is wearing a beige coat and blue jeans."
+ },
+ {
+ "id": 12,
+ "question": "Diane is image_1\n Richard is image_2\n In the image: image_3\n What is the spatial relation between Diane and Richard?",
+ "prediction": "Diane is in front of Richard."
+ },
+ {
+ "id": 13,
+ "question": "Jackson is image_1\n Lilly is image_2\n Noah is image_3\n Please describe the photo: image_4\n",
+ "prediction": "Yes\n\nJackson is walking holding hands with a young girl, Lilly. Noah seems to be following them, standing to the side with his hand in his pocket. There are soldiers in uniform nearby, one of them holding a gun."
+ },
+ {
+ "id": 14,
+ "question": "Kate is image_1\n Lilly is image_2\n In the image: image_3\n What is Kate doing?",
+ "prediction": "Kate is embracing Lilly."
+ },
+ {
+ "id": 15,
+ "question": "Jackson is image_1\n Gordon is image_2\n In the image: image_3\n Identify Gordon with grounding.",
+ "prediction": "[Gordon](535,128),(916,996)"
+ },
+ {
+ "id": 16,
+ "question": "Kate is image_1\n Noah is image_2\n In the image: image_3\n From our view, which side of Kate is Noah at?",
+ "prediction": "Noah is on the right side of Kate."
+ },
+ {
+ "id": 17,
+ "question": "Jackson is image_1\n In the image: image_2\n Identify Jackson with grounding.",
+ "prediction": "[Jackson](421,104),(733,945)"
+ },
+ {
+ "id": 18,
+ "question": "Dukchoon is image_1\n Kim is image_2\n In the image: image_3\n Please give a description.",
+ "prediction": "Dukchoon is kneeling beside Kim, who appears to be in a firefighter's uniform crouching on the ground."
+ },
+ {
+ "id": 19,
+ "question": "Kim is image_1\n In the image: image_2\n Identify Kim with grounding",
+ "prediction": "[Kim](199,226),(505,996)"
+ },
+ {
+ "id": 20,
+ "question": "Kim is image_1\n Kangrim is image_2\n In the image: image_3\n Who is pushing the bamboo raft nearby?",
+ "prediction": "Kim is pushing the bamboo raft."
+ },
+ {
+ "id": 21,
+ "question": "Dukchoon is image_1\n In the image: image_2\n What is Dukchoon's expression?",
+ "prediction": "Dukchoon looks concerned or thoughtful."
+ },
+ {
+ "id": 22,
+ "question": "Ron is image_1\n Brian is image_2\n Champ is image_3\n In the image: image_4\n Who is driving the car?",
+ "prediction": "Ron is driving the car."
+ },
+ {
+ "id": 23,
+ "question": "Brian is image_1\n In the image: image_2\n Identify Brian with grounding.",
+ "prediction": "[Brian](625,300),(975,988)"
+ },
+ {
+ "id": 24,
+ "question": "Ron is image_1\n Brick is image_2\n Explain the content of this image: image_3\n",
+ "prediction": "Ron, on the left, is gesturing with his right hand while holding a can, and Brick, on the right, is sitting with his hands on his lap. They appear to be in a room with blinds partially closed in the background."
+ },
+ {
+ "id": 25,
+ "question": "Veronica is image_1\n In the image: image_2\n Identify Veronica with grounding.",
+ "prediction": "[Veronica](1,176),(317,979)"
+ },
+ {
+ "id": 26,
+ "question": "Ron is image_1\n In the image: image_2\n What is Ron doing?",
+ "prediction": "Ron is sitting on a chair."
+ },
+ {
+ "id": 27,
+ "question": "Ron is image_1\n Veronica is image_2\n In the image: image_3\n Describe the image.",
+ "prediction": "Veronica, wearing a yellow coat and pink hat, stands to the left with her hand on a child's shoulder. Ron, to the right, stands in a brown coat and scarf, looking straight ahead. They are all outdoors by the water."
+ },
+ {
+ "id": 28,
+ "question": "Bill is image_1\n Barbara is image_2\n Violet is image_3\n In the image: image_4\n Who is sitting at the middle of the table?",
+ "prediction": "Bill is sitting at the middle of the table."
+ },
+ {
+ "id": 29,
+ "question": "Barbara is image_1\n Violet is image_2\n Mattie is image_3\n Explain the content of the image: image_4\n",
+ "prediction": "Barbara stands to the left holding a book, facing towards Mattie, who sits in the center reading a document. Violet sits to the right, also looking at the document. They seem to be in a discussion."
+ },
+ {
+ "id": 30,
+ "question": "Barbara is image_1\n In the image: image_2\n Identify Barbara with grounding.",
+ "prediction": "[Barbara](665,90),(941,972)"
+ },
+ {
+ "id": 31,
+ "question": "Barbara is image_1\n Mattie is image_2\n In the image: image_3\n What is Mattie doing?",
+ "prediction": "Mattie is sitting at a table with a glass in her hand."
+ },
+ {
+ "id": 32,
+ "question": "Bill is image_1\n Charlie is image_2\n Barbara is image_3\n In the image: image_4\n Identify Bill with grounding.",
+ "prediction": "[Bill](0,25),(353,990)"
+ },
+ {
+ "id": 33,
+ "question": "Lynn is image_1\n Lynn's father is image_2\n In the image: image_3\n Identify Lynn's father with grounding.",
+ "prediction": "[Lynn's father](477,75),(723,733)"
+ },
+ {
+ "id": 34,
+ "question": "Grace is image_1\n In the image: image_2\n Describe Grace's state.",
+ "prediction": "Grace is a student wearing a school uniform."
+ },
+ {
+ "id": 35,
+ "question": "Bank is image_1\n Lynn is image_2\n In the image: image_3\n Give a description.",
+ "prediction": "Bank stands on the left with his arm resting on a desk, wearing a white shirt and carrying a bag. Lynn is to the right, also in a white shirt and carrying a smaller bag. They appear to be in a room with glass walls."
+ },
+ {
+ "id": 36,
+ "question": "Lynn is image_1\n Grace is image_2\n In the image: image_3\n Identify Lynn with grounding.",
+ "prediction": "[Lynn](432,45),(853,988)"
+ },
+ {
+ "id": 37,
+ "question": "Tong is image_1\n In the image: image_2\n What color is Tong's clothes?",
+ "prediction": "Tong is wearing a blue shirt."
+ },
+ {
+ "id": 38,
+ "question": "Grace is image_1\n Pat is image_2\n Please describe the image: image_3\n",
+ "prediction": "Grace is sitting on a table looking away, while Pat is lounging with his arm extended, both seem to be in a workshop."
+ },
+ {
+ "id": 39,
+ "question": "Scott is image_1\n Elizabeth is image_2\n In the image: image_3\n What does Scott wear?",
+ "prediction": "Scott wears a beige blazer with a checked tie."
+ },
+ {
+ "id": 40,
+ "question": "Amy is image_1\n Lynn is image_2\n In the image: image_3\n Identify Amy with grounding.",
+ "prediction": "[Amy](110,43),(522,947)"
+ },
+ {
+ "id": 41,
+ "question": "Wally is image_1\n In the image: image_2\n Identify Wally with grounding.",
+ "prediction": "[Wally](140,294),(586,973)"
+ },
+ {
+ "id": 42,
+ "question": "Bei Zhai is image_1\n Shen Lian is image_2\n In the image: image_3\n Describe the visual content.",
+ "prediction": "Bei Zhai stands on the left, wearing a light blue outfit, partially shaded by a bamboo structure. Shen Lian is on the right, facing her, dressed in black with a traditional hat. They appear to be in a bamboo forest."
+ },
+ {
+ "id": 43,
+ "question": "Shen lian is image_1\n Lu Wenzhao is image_2\n In the image: image_3\n What is Lu Wenzhao doing?",
+ "prediction": "Lu Wenzhao is extending his hand towards Shen Lian."
+ },
+ {
+ "id": 44,
+ "question": "Bei Zhai is image_1\n Shen Lian is image_2\n In the image: image_3\n Describe the state of Bei Zhai.",
+ "prediction": "Bei Zhai is seated and looking downward."
+ },
+ {
+ "id": 45,
+ "question": "Bei Zhai is image_1\n Shen Lian is image_2\n In the image: image_3\n Identify Shen Lian with grounding.",
+ "prediction": "[Shen Lian](735,29),(917,990)"
+ },
+ {
+ "id": 46,
+ "question": "Bei Zhai is image_1\n In the image: image_2\n Identify Bei Zhai with grounding.",
+ "prediction": "[Bei Zhai](453,268),(755,992)"
+ },
+ {
+ "id": 47,
+ "question": "Lu Wenzhao is image_1\n Ding Baiying is image_2\n Describe the image: image_3\n",
+ "prediction": "Lu Wenzhao is seen holding a sword, standing closely behind Ding Baiying. They appear to be in a tense moment, surrounded by fallen soldiers in a battle scene."
+ },
+ {
+ "id": 48,
+ "question": "Haskell is image_1\n In the image: image_2\n What is he doing?",
+ "prediction": "He is sitting at a dining table."
+ },
+ {
+ "id": 49,
+ "question": "Molyneux is image_1\n In the image: image_2\n Describe the content.",
+ "prediction": "Molyneux is sitting in the driver's seat of a car, looking straight ahead. There's an elderly couple in the back seat, appearing to be in a conversation."
+ },
+ {
+ "id": 50,
+ "question": "Henry Goose is image_1\n Native Woman is image_2\n In the image: image_3\n Identify Henry Goose with grounding.",
+ "prediction": "[Henry Goose](110,13),(531,987)"
+ },
+ {
+ "id": 51,
+ "question": "Molyneux is image_1\n In the image: image_2\n Describe the state of Molyneux.",
+ "prediction": "Molyneux is seated and appears to be embracing someone."
+ },
+ {
+ "id": 52,
+ "question": "Mr. Griffith is image_1\n Mrs. Griffith is image_2\n In the image: image_3\n What is Mr. Griffith doing?",
+ "prediction": "Mr. Griffith is sitting and leaning forward with his hand on his cheek."
+ },
+ {
+ "id": 53,
+ "question": "Gibbons is image_1\n Describe the image: image_2\n",
+ "prediction": "Gibbons, an elderly man in a suit and tie, is dancing with a young woman in a cheerleading outfit on a basketball court, surrounded by a crowd of onlookers."
+ },
+ {
+ "id": 54,
+ "question": "Micah is image_1\n In the image: image_2\n Describe the image.",
+ "prediction": "Two young men are sitting together; one, dressed in a plaid shirt, is strumming a guitar, while the other, in a black shirt, is playing the acoustic guitar. They seem to be enjoying a casual outdoor gathering."
+ },
+ {
+ "id": 55,
+ "question": "Rhiannon is image_1\n In the image: image_2\n Identify Rhiannon with grounding.",
+ "prediction": "[Rhiannon](10,125),(414,997)"
+ },
+ {
+ "id": 56,
+ "question": "Olive is image_1\n Rhiannon is image_2\n In the image: image_3\n Who is carrying a handbag?",
+ "prediction": "Olive is carrying a handbag."
+ },
+ {
+ "id": 57,
+ "question": "Brandon is image_1\n In the image: image_2\n Identify Brandon with grounding.",
+ "prediction": "[Brandon](111,34),(625,991)"
+ },
+ {
+ "id": 58,
+ "question": "Walt is image_1\n Sue is image_2\n In the image: image_3\n Explain the content.",
+ "prediction": "Walt, an older man, stands on a porch with a woman, Sue, to his left, touching his shoulder. Both are facing the camera."
+ },
+ {
+ "id": 59,
+ "question": "Karen is image_1\n Mitch is image_2\n In the image: image_3\n Identify Karen with grounding.",
+ "prediction": "[Karen](571,125),(966,988)"
+ },
+ {
+ "id": 60,
+ "question": "Walt is image_1\n Thao is image_2\n In the image: image_3\n Please reason out what role of Thao is in this scene.",
+ "prediction": "Thao is standing on the right, facing and seemingly conversing with Walt on the left."
+ },
+ {
+ "id": 61,
+ "question": "Mitch is image_1\n Walt is image_2\n In the image: image_3\n What color is Walt's clothes?",
+ "prediction": "Walt's clothes are white."
+ },
+ {
+ "id": 62,
+ "question": "Thao is image_1\n Sue is image_2\n In the image: image_3\n Identify Sue with grounding.",
+ "prediction": "[Sue](714,108),(998,985)"
+ },
+ {
+ "id": 63,
+ "question": "Harry is image_1\n Hermione is image_2\n In the image: image_3\n Give a description.",
+ "prediction": "Hermione is standing to the left, slightly behind Harry, who is in the center. Both are in a dimly lit room, looking towards the right."
+ },
+ {
+ "id": 64,
+ "question": "Hermione is image_1\n Ron is image_2\n In the image: image_3\n What is the spatial relation between Hermione and Ron?",
+ "prediction": "Hermione is standing to the right of Ron."
+ },
+ {
+ "id": 65,
+ "question": "Harry is image_1\n Albus is image_2\n In the image: image_3\n Identify Albus with grounding.",
+ "prediction": "[Albus](587,43),(828,986)"
+ },
+ {
+ "id": 66,
+ "question": "Hermione is image_1\n Harry is image_2\n In the image: image_3\n Identify Hermione with grounding.",
+ "prediction": "[Hermione](285,15),(757,986)"
+ },
+ {
+ "id": 67,
+ "question": "Ron is image_1\n In the image: image_2\n Identify Ron with grounding.",
+ "prediction": "[Ron](6,159),(273,995)"
+ },
+ {
+ "id": 68,
+ "question": "Ariadne is image_1\n Mal is image_2\n In the image: image_3\n Identify Mal with grounding.",
+ "prediction": "[Mal](713,29),(896,985)"
+ },
+ {
+ "id": 69,
+ "question": "Eames is image_1\n Cobb is image_2\n In the image: image_3\n Identify Cobb with grounding.",
+ "prediction": "[Cobb](63,230),(408,995)"
+ },
+ {
+ "id": 70,
+ "question": "Ariadne is image_1\n Yusuf is image_2\n In the image: image_3\n Please describe the content.",
+ "prediction": "Ariadne is lying on a chair with her arm resting on a table, looking off to the side. Yusuf is reclining on another chair with his arm extended, appearing to be in a relaxed state. They are in a room with a dark, moody atmosphere."
+ },
+ {
+ "id": 71,
+ "question": "Ariadne is image_1\n In the image: image_2\n What is she doing?",
+ "prediction": "Ariadne appears to be walking alongside a man."
+ },
+ {
+ "id": 72,
+ "question": "Cobb is image_1\n Ariadne is image_2\n In the image: image_3\n Who is walking in front?",
+ "prediction": "Cobb is walking in front."
+ },
+ {
+ "id": 73,
+ "question": "Cobb is image_1\n Saito is image_2\n In the image: image_3\n Give a description.",
+ "prediction": "Cobb is seated on a train, looking intently at Saito, who is reclined in a seat facing away from the camera. Saito has his hand on Cobb's shoulder."
+ },
+ {
+ "id": 74,
+ "question": "Tony is image_1\n Pepper is image_2\n Natalie is image_3\n In the image: image_4\n Who is the person standing?",
+ "prediction": "Pepper Potts is the person standing."
+ },
+ {
+ "id": 75,
+ "question": "Agent is image_1\n Justin is image_2\n Please provide an overview of the visual information in this image: image_3\n",
+ "prediction": "Agent is standing on the left, wearing a black suit and tie, carrying a suitcase. Justin is on the right, also in a black suit, standing beside the Agent. They are in a factory setting with machinery in the background."
+ },
+ {
+ "id": 76,
+ "question": "Nick is image_1\n Tony is image_2\n In the image: image_3\n Identify Nick with grounding.",
+ "prediction": "[Nick](268,18),(569,797)"
+ },
+ {
+ "id": 77,
+ "question": "Tony is image_1\n Justin is image_2\n In the image: image_3\n Identify Justin with grounding.",
+ "prediction": "[Justin](460,106),(698,995)"
+ },
+ {
+ "id": 78,
+ "question": "Pepper is image_1\n Natalie is image_2\n In the image: image_3\n Whose clothes color is gray?",
+ "prediction": "Pepper is wearing a gray outfit."
+ },
+ {
+ "id": 79,
+ "question": "Tony is image_1\n In the image: image_2\n Give a description.",
+ "prediction": "Tony, wearing a suit and tie, is sitting at a table with his hands clasped in front of him. There are other individuals seated around the table, appearing to be engaged in a meeting or a public hearing."
+ },
+ {
+ "id": 80,
+ "question": "Mrs. Fairfax is image_1\n Jane is image_2\n In the image: image_3\n What color is Jane's dress?",
+ "prediction": "Jane's dress is blue."
+ },
+ {
+ "id": 81,
+ "question": "Rochester is image_1\n Jane is image_2\n In the image: image_3\n Describe Rochester's clothes.",
+ "prediction": "Rochester is wearing a dark coat with a waistcoat."
+ },
+ {
+ "id": 82,
+ "question": "Jane is image_1\n Varens is image_2\n In the image: image_3\n Identify Varens with grounding.",
+ "prediction": "[Varens](578,175),(928,997)"
+ },
+ {
+ "id": 83,
+ "question": "Jane is image_1\n Mrs. Fairfax is image_2\n In the image: image_3\n Identify Mrs. Fairfax with grounding.",
+ "prediction": "[Mrs. Fairfax](575,119),(998,995)"
+ },
+ {
+ "id": 84,
+ "question": "Bai Letian is image_1\n Kukai is image_2\n In the image: image_3\n Give a description.",
+ "prediction": "Bai Letian is seated to the left, looking towards Kukai, who is seated to the right holding a paper. Both are against a brick wall backdrop, sitting on what appears to be a bench."
+ },
+ {
+ "id": 85,
+ "question": "Bai Letian is image_1\n Kukai is image_2\n In the image: image_3\n Identify Bai Letian with grounding.",
+ "prediction": "[Bai Letian](510,230),(719,997)"
+ },
+ {
+ "id": 86,
+ "question": "Bai Letian is image_1\n Kukai is image_2\n In the image: image_3\n Please provide an overview of the visual information.",
+ "prediction": "Bai Letian is seated on the left, gesturing with his right hand, while Kukai is seated on the right with his hands on the table. There's a standing individual in the middle, between Bai and Kukai."
+ },
+ {
+ "id": 87,
+ "question": "Gennady is image_1\n Eddie is image_2\n In the image: image_3\n Please provide an image caption.",
+ "prediction": "Gennady is seated to the right on a bench, looking down at an object in his hands, while Eddie sits to the left facing him. They are in a park setting with trees and a bench behind them."
+ },
+ {
+ "id": 88,
+ "question": "Eddie is image_1\n In the image: image_2\n Identify Eddie with grounding.",
+ "prediction": "[Eddie](586,168),(935,996)"
+ },
+ {
+ "id": 89,
+ "question": "Lindy is image_1\n Eddie is image_2\n In the image: image_3\n Give a description.",
+ "prediction": "Lindy is holding a newspaper with the headline \" Poll Vault, \" facing to her right, while Eddie, wearing a black leather jacket, is turned towards his right with his hands in his pockets. They appear to be on a city street with shops in the background."
+ },
+ {
+ "id": 90,
+ "question": "Gennady is image_1\n In the image: image_2\n What is Gennady doing?",
+ "prediction": "Gennady is walking towards the camera with his back turned."
+ },
+ {
+ "id": 91,
+ "question": "Eddie is image_1\n Carl is image_2\n In the image: image_3\n Identify Carl with grounding.",
+ "prediction": "[Carl](63,211),(309,995)"
+ },
+ {
+ "id": 92,
+ "question": "Old Joe is image_1\n Joe is image_2\n In the image: image_3\n Who is on the left side of the table?",
+ "prediction": "Old Joe is on the left side of the table."
+ },
+ {
+ "id": 93,
+ "question": "Sara is image_1\n Cid is image_2\n In the image: image_3\n Identify Cid with grounding.",
+ "prediction": "[Cid](254,409),(522,992)"
+ },
+ {
+ "id": 94,
+ "question": "Ye Jin is image_1\n Vivian is image_2\n In the image: image_3\n Who just got out of the car?",
+ "prediction": "Ye Jin just got out of the car."
+ },
+ {
+ "id": 95,
+ "question": "Vivian is image_1\n Ye Jin is image_2\n In the image: image_3\n What does Vivian wear?",
+ "prediction": "Vivian wears a black and white striped blazer with a black top and skirt."
+ },
+ {
+ "id": 96,
+ "question": "Vivian is image_1\n Ye Jin is image_2\n In the image: image_3\n Identify Vivian with grounding.",
+ "prediction": "[Vivian](417,197),(696,996)"
+ },
+ {
+ "id": 97,
+ "question": "Vivian is image_1\n In the image: image_2\n What is Vivian doing?",
+ "prediction": "Vivian is holding up a phone."
+ },
+ {
+ "id": 98,
+ "question": "Ye Jin is image_1\n Please describe the image: image_2\n",
+ "prediction": "Ye Jin in a white suit walks away from the camera, carrying a bouquet of flowers. A man in a grey suit follows behind her. They are in a bright, modern living room with white furniture and a red chair."
+ },
+ {
+ "id": 99,
+ "question": "Boris' Girlfriend is image_1\n Boris is image_2\n In the image: image_3\n Who is carrying the cake?",
+ "prediction": "Boris' girlfriend is carrying the cake."
+ },
+ {
+ "id": 100,
+ "question": "Agent K is image_1\n Agent J is image_2\n In the image: image_3\n Identify Agent K with grounding.",
+ "prediction": "[Agent K](586,126),(950,732)"
+ },
+ {
+ "id": 101,
+ "question": "Agent J is image_1\n Agent O is image_2\n In the image: image_3\n What is Agent O doing?",
+ "prediction": "Agent O is standing and facing Agent J."
+ },
+ {
+ "id": 102,
+ "question": "Young Agent K is image_1\n Young Agent O is image_2\n In the image: image_3\n Give a description.",
+ "prediction": "Young Agent K is seated to the left, wearing a black suit, while Young Agent O stands to the right, dressed in a black dress with a white collar. They are in a modern office setting with other agents and office elements in the background."
+ },
+ {
+ "id": 103,
+ "question": "Young Agent K is image_1\n Agent J is image_2\n In the image: image_3\n Identify Agent J with grounding.",
+ "prediction": "[Agent J](646,52),(905,981)"
+ },
+ {
+ "id": 104,
+ "question": "Agent J is image_1\n Young Agent K is image_2\n Griffin is image_3\n In the image: image_4\n Please provide a description.",
+ "prediction": "Agent J is standing on the left in a formal suit, facing Young Agent K who is on the right in a similar suit. Griffin, wearing a green jacket and a red knit hat, is serving food in the center. They are in a room with other guests at a party."
+ },
+ {
+ "id": 105,
+ "question": "Boris is image_1\n Griffin is image_2\n In the image: image_3\n Identify Griffin with grounding.",
+ "prediction": "[Griffin](509,231),(983,986)"
+ },
+ {
+ "id": 106,
+ "question": "Billy Beane is image_1\n In the image: image_2\n Identify Billy Beane with grounding.",
+ "prediction": "[Billy Beane](480,44),(848,913)"
+ },
+ {
+ "id": 107,
+ "question": "Peter Brand is image_1\n In the image: image_2\n Identify Peter Brand with grounding.",
+ "prediction": "[Peter Brand](10,37),(592,991)"
+ },
+ {
+ "id": 108,
+ "question": "Billy is image_1\n Peter is image_2\n In the image: image_3\n Please give a description.",
+ "prediction": "Peter is seated to the left, resting his chin on his hand, facing slightly right. Billy is sitting to the right, with one hand on a desk and the other near his face, in a thoughtful pose. A poster on the wall reads \"CLASH\". There's a desk with various items, including a computer, books, and a coffee cup."
+ },
+ {
+ "id": 109,
+ "question": "Sharp is image_1\n Scout is image_2\n In the image: image_3\n Identify Scout with grounding.",
+ "prediction": "[Scout](542,191),(832,843)"
+ },
+ {
+ "id": 110,
+ "question": "Sam is image_1\n Suzy is image_2\n Please describe the image: image_3\n",
+ "prediction": "Sam is sitting outside in a scout uniform, holding a frying pan, while Suzy sits beside her, partially visible, with a camera in her lap. There's a campsite setup with a tent and decorations in the background."
+ },
+ {
+ "id": 111,
+ "question": "Suzy is image_1\n Sam is image_2\n In the image: image_3\n Describe Suzy's state.",
+ "prediction": "Suzy is sitting on the ground, looking at something in her hands."
+ },
+ {
+ "id": 112,
+ "question": "Sharp is image_1\n Scout is image_2\n In the image: image_3\n Identify Sharp with grounding.",
+ "prediction": "[Sharp](665,79),(932,992)"
+ },
+ {
+ "id": 113,
+ "question": "Sam is image_1\n Suzy is image_2\n In the image: image_3\n Identify Suzy with grounding.",
+ "prediction": "[Suzy](137,248),(400,993)"
+ },
+ {
+ "id": 114,
+ "question": "Sam is image_1\n Suzy is image_2\n In the image: image_3\n Describe the visual content.",
+ "prediction": "Sam is sitting on the left, wearing a yellow scout uniform with badges, looking towards the right. Suzy, also in a yellow scout uniform, is seated on the right, with her hands clasped in front of her. They appear to be in a room with other scouts and a leader gesturing with one hand."
+ },
+ {
+ "id": 115,
+ "question": "Sharp is image_1\n Scout is image_2\n In the image: image_3\n What is Sharp doing?",
+ "prediction": "Sharp is wiping his face with a handkerchief."
+ },
+ {
+ "id": 116,
+ "question": "Social Services is image_1\n Scout is image_2\n Sharp is image_3\n In the image: image_4\n Give a description.",
+ "prediction": "Social Services, holding a book, is gesturing while talking to Scout, who is standing with his hands by his sides. Sharp is looking towards their direction, partially visible on the right side. There are other people in the background."
+ },
+ {
+ "id": 117,
+ "question": "Chigusa is image_1\n Shimada is image_2\n Kawai is image_3\n In the image: image_4\n Please give a description.",
+ "prediction": "Chigusa is sitting on the left, wearing a school uniform with a bow tie. Shimada is seated in the center, also in a school uniform, slightly turned towards Chigusa. Kawai is on the right, leaning forward while holding a piece of paper."
+ },
+ {
+ "id": 118,
+ "question": "Shimada is image_1\n Chigusa is image_2\n In the image: image_3\n Identify Chigusa with grounding.",
+ "prediction": "[Chigusa](391,202),(602,998)"
+ },
+ {
+ "id": 119,
+ "question": "Chigusa is image_1\n In the image: image_2\n What is her emotion?",
+ "prediction": "Chigusa is surprised."
+ },
+ {
+ "id": 120,
+ "question": "Kosaku is image_1\n Shimada is image_2\n For the image: image_3\n Give a description.",
+ "prediction": "Kosaku stands to the right, extending a drink to Shimada who is seated to the left, both are in a dimly lit waiting area with red seating."
+ },
+ {
+ "id": 121,
+ "question": "Kosuke is image_1\n Sachiko is image_2\n In the image: image_3\n Identify Sachiko with grounding.",
+ "prediction": "[Sachiko](546,562),(757,997)"
+ },
+ {
+ "id": 122,
+ "question": "Chigusa is image_1\n Kosuke is image_2\n Shimada is image_3\n In the image: image_4\n Who is raising hand?",
+ "prediction": "Shimada is raising hand."
+ },
+ {
+ "id": 123,
+ "question": "Sachiko is image_1\n In the image: image_2\n Identify Sachiko with grounding.",
+ "prediction": "[Sachiko](578,150),(842,996)"
+ },
+ {
+ "id": 124,
+ "question": "Chigusa is image_1\n Shimada is image_2\n In the image: image_3\n What is Shimada doing?",
+ "prediction": "Shimada is writing in a notebook."
+ },
+ {
+ "id": 125,
+ "question": "Kosaku is image_1\n Shimada is image_2\n In the image: image_3\n Give a description.",
+ "prediction": "Kosaku, a man in a suit, stands in a crowded train car, holding onto a pole. Next to him, Shimada, wearing a school uniform, looks downward. Other passengers are visible in the background."
+ },
+ {
+ "id": 126,
+ "question": "Kosaku is image_1\n Shimada is image_2\n In the image: image_3\n What is Kosaku doing?",
+ "prediction": "Kosaku is sitting and reading a book on a bench."
+ },
+ {
+ "id": 127,
+ "question": "Kosaku is image_1\n Shimada is image_2\n Please describe the image: image_3\n",
+ "prediction": "Kosaku is seated on a bench, looking down, while Shimada stands behind him, appearing to adjust his hair or clothing."
+ },
+ {
+ "id": 128,
+ "question": "Shimada is image_1\n Kosaku is image_2\n In the image: image_3\n Give an image caption.",
+ "prediction": "Shimada, wearing a school uniform with a camera, stands under an umbrella next to Kosaku, dressed in a suit. It's raining outside."
+ },
+ {
+ "id": 129,
+ "question": "Shimada is image_1\n Yusuke is image_2\n In the image: image_3\n Identify Shimada with grounding.",
+ "prediction": "[Shimada](106,12),(520,981)"
+ },
+ {
+ "id": 130,
+ "question": "Kosaku Ito is image_1\n In the image: image_2\n Identify Kosaku Ito with grounding.",
+ "prediction": "[Kosaku Ito](34,179),(450,996)"
+ },
+ {
+ "id": 131,
+ "question": "Hibiki Shimada is image_1\n Megumi Chigusa is image_2\n In the image: image_3\n Who is holding a cylinder object?",
+ "prediction": "Megumi Chigusa."
+ },
+ {
+ "id": 132,
+ "question": "Kosuke is image_1\n Shimada is image_2\n Describe the image: image_3\n",
+ "prediction": "Kosuke, in a black school uniform with a red flower on his lapel, is walking alongside Shimada, who is wearing a similar uniform with a red bow tie, under cherry blossom trees in full bloom."
+ },
+ {
+ "id": 133,
+ "question": "Kosaku Ito is image_1\n Hibiki Shimada is image_2\n In the image: image_3\n Give a description.",
+ "prediction": "Kosaku Ito, dressed in a suit, stands facing Hibiki Shimada, who is in a school uniform with a bouquet of flowers in hand, on a sunny street with a car and houses in the background."
+ },
+ {
+ "id": 134,
+ "question": "Emma is image_1\n In the image: image_2\n Identify Emma with grounding.",
+ "prediction": "[Emma](383,41),(785,988)"
+ },
+ {
+ "id": 135,
+ "question": "Adam is image_1\n Alvin is image_2\n In the image: image_3\n Is Adam standing?",
+ "prediction": "No, Adam is sitting."
+ },
+ {
+ "id": 136,
+ "question": "Emma is image_1\n In the image: image_2\n Identify Emma with grounding.",
+ "prediction": "[Emma](279,226),(497,996)"
+ },
+ {
+ "id": 137,
+ "question": "Adam is image_1\n In the image: image_2\n What is Adam doing?",
+ "prediction": "Adam is standing and appears to be in motion."
+ },
+ {
+ "id": 138,
+ "question": "Emma is image_1\n Adam is image_2\n Please describe the image: image_3\n",
+ "prediction": "Emma, wearing a doctor's coat, is standing to the left, while Adam is lying in a hospital bed to the right, with his arm resting on a pillow. There's medical equipment in the background."
+ },
+ {
+ "id": 139,
+ "question": "Alvin is image_1\n Lucy is image_2\n In the image: image_3\n Give a description.",
+ "prediction": "Alvin, wearing a suit, sits at a table with a drink in his hand. Lucy, in a dress, is seated across from him, also with a drink. They appear to be engaged in a conversation at a bustling restaurant or bar setting."
+ },
+ {
+ "id": 140,
+ "question": "Gao Jian Xiang is image_1\n Liu Hao is image_2\n In the image: image_3\n Identify Gao Jian Xiang with grounding.",
+ "prediction": "[Gao Jian Xiang](220,87),(562,863)"
+ },
+ {
+ "id": 141,
+ "question": "Chen is image_1\n Gao is image_2\n In the image: image_3\n Describe the scene.",
+ "prediction": "Chen is being shoved by Gao in a tense confrontation outside, with another person watching."
+ },
+ {
+ "id": 142,
+ "question": "Gao is image_1\n Lin is image_2\n In the image: image_3\n Identify Lin with grounding.",
+ "prediction": "[Lin](26,99),(317,998)"
+ },
+ {
+ "id": 143,
+ "question": "Chen is image_1\n Gao is image_2\n In the image: image_3\n What is the expression of Chen?",
+ "prediction": "Chen looks surprised or in distress."
+ },
+ {
+ "id": 144,
+ "question": "Jack is image_1\n Gibbs is image_2\n In the image: image_3\n Identify Jack with grounding.",
+ "prediction": "[Jack](175,72),(533,985)"
+ },
+ {
+ "id": 145,
+ "question": "Jack Sparrow is image_1\n In the image: image_2\n Identify Jack with grounding.",
+ "prediction": "[Jack](347,19),(723,987)"
+ },
+ {
+ "id": 146,
+ "question": "Barbossa is image_1\n In the image: image_2\n Identify Barbossa with grounding.",
+ "prediction": "[Barbossa](612,137),(810,995)"
+ },
+ {
+ "id": 147,
+ "question": "Barbossa is image_1\n In the image: image_2\n Please give a description.",
+ "prediction": "Barbossa, dressed in elaborate pirate attire, stands on a ship with a sword in hand, while two other pirates stand beside him."
+ },
+ {
+ "id": 148,
+ "question": "Angelica is image_1\n Jack is image_2\n Describe the image: image_3\n",
+ "prediction": "Angelica, wearing a dark hat, is extending her hand towards Jack, who is shirtless and appears to be in the jungle. There are other indistinct figures in the background."
+ },
+ {
+ "id": 149,
+ "question": "Syrena is image_1\n Philip is image_2\n In the image: image_3\n Give a description.",
+ "prediction": "Syrena is sitting on the lap of Philip, who is shirtless among dense foliage. There is another person visible in the background."
+ },
+ {
+ "id": 150,
+ "question": "Angelica is image_1\n In the image: image_2\n Identify Angelica with grounding.",
+ "prediction": "[Angelica](78,52),(514,988)"
+ },
+ {
+ "id": 151,
+ "question": "Elizabeth is image_1\n William is image_2\n In the image: image_3\n Give a description.",
+ "prediction": "Elizabeth is sitting on the steps, looking down at a book. William is sitting beside her, gazing towards the left side of the image. They appear to be in a contemplative mood."
+ },
+ {
+ "id": 152,
+ "question": "William is image_1\n Elizabeth is image_2\n In the image: image_3\n Identify Elizabeth with grounding.",
+ "prediction": "[Elizabeth](37,69),(331,988)"
+ },
+ {
+ "id": 153,
+ "question": "Brant is image_1\n Olive is image_2\n In the image: image_3\n What color is Olive's hat?",
+ "prediction": "Olive's hat is brown."
+ },
+ {
+ "id": 154,
+ "question": "Elizabeth is image_1\n Olive is image_2\n In the image: image_3\n Identify Elizabeth with grounding.",
+ "prediction": "[Elizabeth](607,67),(886,983)"
+ },
+ {
+ "id": 155,
+ "question": "Elizabeth is image_1\n William is image_2\n In the image: image_3\n Describe William's state.",
+ "prediction": "William is standing with his hands on his hips."
+ },
+ {
+ "id": 156,
+ "question": "William is image_1\n Elizabeth is image_2\n In the image: image_3\n Is William sitting or lying down?",
+ "prediction": "William is lying down."
+ },
+ {
+ "id": 157,
+ "question": "Robert is image_1\n In the image: image_2\n Identify Robert with grounding.",
+ "prediction": "[Robert](578,65),(895,976)"
+ },
+ {
+ "id": 158,
+ "question": "Charles Rodman is image_1\n Will Rodman is image_2\n In the image: image_3\n Explain the visual content.",
+ "prediction": "Charles Rodman is standing and feeding a chimpanzee with a bottle, while Will Rodman is sitting at a table, looking at a book and having a drink."
+ },
+ {
+ "id": 159,
+ "question": "Will Rodman is image_1\n Caesar is image_2\n In the image: image_3\n Who is sitting in the back seat of the car?",
+ "prediction": "Caesar is sitting in the back seat of the car."
+ },
+ {
+ "id": 160,
+ "question": "Will Rodman is image_1\n In the image: image_2\n Identify Will Rodman with grounding.",
+ "prediction": "[Will Rodman](381,16),(635,987)"
+ },
+ {
+ "id": 161,
+ "question": "David Norris is image_1\n Elise Sellas is image_2\n In the image: image_3\n Who is sitting by the window?",
+ "prediction": "Elise Sellas is sitting by the window."
+ },
+ {
+ "id": 162,
+ "question": "Charlie Traynor is image_1\n David Norris is image_2\n In the image: image_3\n Identify Charlie Traynor with grounding.",
+ "prediction": "[Charlie Traynor](97,85),(476,988)"
+ },
+ {
+ "id": 163,
+ "question": "Charlie is image_1\n David is image_2\n Elise is image_3\n In the image: image_4\n Give a description.",
+ "prediction": "David is seated at a table with food and drinks, facing Charlie who stands in a suit with a red tie. Elise is seated across from David, engaged in conversation with him. They are in an outdoor dining setting with other patrons in the background."
+ },
+ {
+ "id": 164,
+ "question": "David Norris is image_1\n Jon Stewart is image_2\n In the image: image_3\n Identify Jon Stewart with grounding.",
+ "prediction": "[Jon Stewart](171,61),(446,987)"
+ },
+ {
+ "id": 165,
+ "question": "Bloom is image_1\n In the image: image_2\n Identify Bloom with grounding.",
+ "prediction": "[Bloom](625,69),(998,989)"
+ },
+ {
+ "id": 166,
+ "question": "Romeo is image_1\n Murphy is image_2\n Please describe the image: image_3\n",
+ "prediction": "Murphy, on the left, is holding a gun with both hands in a defensive stance, while Romeo stands on the right, dressed in a white chef's uniform, looking towards Murphy. They appear to be in a dimly lit kitchen or bar area."
+ },
+ {
+ "id": 167,
+ "question": "Romeo is image_1\n In the image: image_2\n What is Romeo doing?",
+ "prediction": "Romeo is drinking at the bar."
+ },
+ {
+ "id": 168,
+ "question": "Connor is image_1\n In the image: image_2\n What is Connor doing?",
+ "prediction": "Connor is sitting and holding a card."
+ },
+ {
+ "id": 169,
+ "question": "Romeo is image_1\n In the image: image_2\n Give a description.",
+ "prediction": "Romeo, holding a gun, stands in a room next to a bed. Another person is partially visible on the right side, facing Romeo."
+ },
+ {
+ "id": 170,
+ "question": "Poppa is image_1\n In the image: image_2\n Identify Poppa with grounding.",
+ "prediction": "[Poppa](285,59),(546,981)"
+ },
+ {
+ "id": 171,
+ "question": "Katsuro Matsuoka is image_1\n In the image: image_2\n Identify Katsuro Matsuoka with grounding.",
+ "prediction": "[Katsuro Matsuoka](300,170),(532,998)"
+ },
+ {
+ "id": 172,
+ "question": "Zhu Bajie is image_1\n Tangseng is image_2\n Shaseng is image_3\n In the image: image_4\n Identify Tangseng with grounding.",
+ "prediction": "[Tangseng](25,247),(386,986)"
+ },
+ {
+ "id": 173,
+ "question": "Shaseng is image_1\n Tangseng is image_2\n Sun Wukong is image_3\n In the image: image_4\n Give a description.",
+ "prediction": "Sun Wukong, wearing a red robe, stands on the left with a sword. Shaseng is in the center, draped in white, with a sword and shield. Tangseng is on the right, armored blue, holding a spear. They are in a forest setting."
+ },
+ {
+ "id": 174,
+ "question": "Shaseng is image_1\n Tangseng is image_2\n Sun Wukong is image_3\n In the image: image_4\n Identify Sun Wukong with grounding.",
+ "prediction": "[Sun Wukong](409,280),(767,987)"
+ },
+ {
+ "id": 175,
+ "question": "Shary is image_1\n In the image: image_2\n Identify Shary with grounding.",
+ "prediction": "[Shary](7,481),(276,998)"
+ },
+ {
+ "id": 176,
+ "question": "Shaseng is image_1\n In the image: image_2\n What is Shaseng doing?",
+ "prediction": "Shaseng is standing and seems to be in a conversation."
+ },
+ {
+ "id": 177,
+ "question": "Shaseng is image_1\n Zhu Bajie is image_2\n In the image: image_3\n Who is lying down?",
+ "prediction": "Zhu Bajie is lying down."
+ },
+ {
+ "id": 178,
+ "question": "Benjam is image_1\n Irene is image_2\n In the image: image_3\n Identify Benjam with grounding.",
+ "prediction": "[Benjam](167,50),(535,972)"
+ },
+ {
+ "id": 179,
+ "question": "Irene is image_1\n In the image: image_2\n What is Irene doing?",
+ "prediction": "Irene is standing and holding some papers."
+ },
+ {
+ "id": 180,
+ "question": "Isidoro is image_1\n Benjam is image_2\n Irene is image_3\n In the image: image_4\n Identify Isidoro with grounding.",
+ "prediction": "[Isidoro](12,65),(468,981)"
+ },
+ {
+ "id": 181,
+ "question": "Sam Witwicky is image_1\n Bruce Brazos is image_2\n In the image: image_3\n What is Bruce Brazos going to do?",
+ "prediction": "Bruce Brazos is going to shake Sam Witwicky's hand."
+ },
+ {
+ "id": 182,
+ "question": "Sam Witwicky is image_1\n In the image: image_2\n Identify Sam Witwicky with grounding.",
+ "prediction": "[Sam Witwicky](1,0),(392,983)"
+ },
+ {
+ "id": 183,
+ "question": "Lennox is image_1\n In the image: image_2\n Is Lennox the person on the left or the one on the right?",
+ "prediction": "Lennox is the one on the right."
+ },
+ {
+ "id": 184,
+ "question": "Sam is image_1\n Carly is image_2\n In the image: image_3\n What color is Sam's clothes?",
+ "prediction": "Sam's clothes are light blue."
+ },
+ {
+ "id": 185,
+ "question": "Dylan is image_1\n Carly is image_2\n In the image: image_3\n Identify Carly with grounding.",
+ "prediction": "[Carly](119,52),(381,887)"
+ },
+ {
+ "id": 186,
+ "question": "Dylan is image_1\n Carly is image_2\n In the image: image_3\n Identify Dylan with grounding.",
+ "prediction": "[Dylan](467,137),(723,983)"
+ },
+ {
+ "id": 187,
+ "question": "Rooster is image_1\n LaBoeuf is image_2\n In the image: image_3\n What is Rooster doing?",
+ "prediction": "Rooster is lighting a cigarette."
+ },
+ {
+ "id": 188,
+ "question": "Mattie Ross is image_1\n In the image: image_2\n Identify Mattie Ross with grounding.",
+ "prediction": "[Mattie Ross](179,125),(414,988)"
+ },
+ {
+ "id": 189,
+ "question": "Mattie Ross is image_1\n LaBoeuf is image_2\n In the image: image_3\n Give a description.",
+ "prediction": "Mattie Ross, wearing a dark coat and hat, is standing in a forest, holding a metal cup. LaBoeuf is sitting beside her, also dressed in dark attire, with a hat on. They both seem to be in a tense conversation at night."
+ },
+ {
+ "id": 190,
+ "question": "Mattie Ross is image_1\n LaBoeuf is image_2\n In the image: image_3\n Who is hiding beside a rock?",
+ "prediction": "LaBoeuf is hiding beside a rock."
+ },
+ {
+ "id": 191,
+ "question": "Qin is image_1\n Lord Ximen is image_2\n In the image: image_3\n Identify Qin with grounding.",
+ "prediction": "[Qin](481,16),(906,988)"
+ },
+ {
+ "id": 192,
+ "question": "Qin is image_1\n In the image: image_2\n Describe Qin's state.",
+ "prediction": "Qin is standing in a relaxed pose with an arm extended out."
+ },
+ {
+ "id": 193,
+ "question": "Lord is image_1\n In the image: image_2\n What color is Lord's clothes?",
+ "prediction": "Lord's clothes are red."
+ },
+ {
+ "id": 194,
+ "question": "Lord Ximen is image_1\n Ho Sum-on is image_2\n In the image: image_3\n What color is Ho Sum-on's clothes?",
+ "prediction": "Ho Sum-on's clothes are yellow."
+ },
+ {
+ "id": 195,
+ "question": "Qin is image_1\n Big Brother is image_2\n Please describe the image: image_3\n",
+ "prediction": "Big Brother, wearing a pink shirt and gray vest, is sitting on the left side, gesturing while speaking. Qin, dressed in a black suit, is seated on the right, listening attentively. They are surrounded by a variety of books and are in a room with a view of trees outside."
+ },
+ {
+ "id": 196,
+ "question": "Qin is image_1\n SoSo is image_2\n In the image: image_3\n What does SoSo wear?",
+ "prediction": "SoSo wears a yellow coat."
+ },
+ {
+ "id": 197,
+ "question": "Qin Kwai is image_1\n Qin is image_2\n In the image: image_3\n Who is waving hand?",
+ "prediction": "Qin Kwai is waving hand."
+ },
+ {
+ "id": 198,
+ "question": "Qin is image_1\n Qin Kwai is image_2\n In the image: image_3\n Identify Qin Kwai with grounding.",
+ "prediction": "[Qin Kwai](602,219),(991,996)"
+ },
+ {
+ "id": 199,
+ "question": "Big Brother is image_1\n In the image: image_2\n Give a description.",
+ "prediction": "Big Brother, wearing a light blue shirt, is embracing a young boy in a blue shirt with checkered pants. They are in a room with traditional Chinese decor. In the background, two other individuals can be seen."
+ },
+ {
+ "id": 200,
+ "question": "Qin is image_1\n SoSo is image_2\n Provide a description for the image: image_3\n",
+ "prediction": "Qin is on the right, wearing a white shirt and pointing to the left. SoSo is on the left, dressed in a white tank top, looking towards Qin's direction. They are surrounded by blue and green balloons."
+ },
+ {
+ "id": 201,
+ "question": "Dr. Martin Harris is image_1\n Herr Strauss is image_2\n In the image: image_3\n Identify Herr Strauss with grounding.",
+ "prediction": "[Herr Strauss](602,84),(889,994)"
+ },
+ {
+ "id": 202,
+ "question": "Herr Strauss is image_1\n Dr. Martin Harris is image_2\n In the image: image_3\n Who is leaning against the table?",
+ "prediction": "Dr. Martin Harris is leaning against the table."
+ },
+ {
+ "id": 203,
+ "question": "Martin is image_1\n Gina is image_2\n In the image: image_3\n Does Martin wear a hat?",
+ "prediction": "No, Martin does not wear a hat."
+ },
+ {
+ "id": 204,
+ "question": "Martin is image_1\n Ernst is image_2\n Gina is image_3\n In the image: image_4\n Give a description.",
+ "prediction": "Martin is standing on the left, facing Ernst who is on the right. In front of them is Gina, standing slightly angled towards Ernst. They appear to be having a conversation on a bridge with a historic building in the background."
+ },
+ {
+ "id": 205,
+ "question": "Martin is image_1\n Elizabeth is image_2\n In the image: image_3\n What is on Elizabeth's neck?",
+ "prediction": "Elizabeth is wearing a pearl necklace."
+ },
+ {
+ "id": 206,
+ "question": "Professor Bressler is image_1\n Provide a description for the image: image_2\n",
+ "prediction": "Professor Bressler is embracing a girl in a corridor. There are blurred people in the background."
+ },
+ {
+ "id": 207,
+ "question": "Natalie is image_1\n Craig is image_2\n In the image: image_3\n Is Natalie the person standing closer to Craig or farther away?",
+ "prediction": "Natalie is standing closer to Craig."
+ },
+ {
+ "id": 208,
+ "question": "Craig is image_1\n In the image: image_2\n Identify Craig with grounding.",
+ "prediction": "[Craig](497,43),(885,908)"
+ },
+ {
+ "id": 209,
+ "question": "Ryan is image_1\n Natalie is image_2\n In the image: image_3\n Give a description.",
+ "prediction": "Ryan, in a dark suit, stands holding a jacket in an airport terminal next to Natalie, who is also in a suit with a coat in her hand. They appear to be waiting or lining up."
+ },
+ {
+ "id": 210,
+ "question": "Julie Bingham is image_1\n Kara Bingham is image_2\n In the image: image_3\n Identify Julie Bingham with grounding.",
+ "prediction": "[Julie Bingham](5,126),(407,991)"
+ },
+ {
+ "id": 211,
+ "question": "Jim is image_1\n Julie is image_2\n In the image: image_3\n Give a description.",
+ "prediction": "Jim is on the right, wearing a black suit with a red vest and tie, standing next to Julie who is in a white bridal dress holding a bouquet. There are other people in the background."
+ },
+ {
+ "id": 212,
+ "question": "Ryan Bingham is image_1\n Alex Goran is image_2\n In the image: image_3\n What is Alex Goran doing?",
+ "prediction": "Alex Goran is holding a champagne glass."
+ },
+ {
+ "id": 213,
+ "question": "Brendan Conlon is image_1\n Frank Campana is image_2\n In the image: image_3\n What is Frank Campana doing?",
+ "prediction": "Frank Campana is pointing towards Brendan Conlon."
+ },
+ {
+ "id": 214,
+ "question": "Paddy Conlon is image_1\n In the image: image_2\n Identify Paddy Conlon with grounding.",
+ "prediction": "[Paddy Conlon](189,40),(617,990)"
+ },
+ {
+ "id": 215,
+ "question": "Principal Zito is image_1\n In the image: image_2\n What does Principal Zito wear?",
+ "prediction": "Principal Zito is wearing a striped shirt."
+ },
+ {
+ "id": 216,
+ "question": "Fenroy is image_1\n In the image: image_2\n Identify Fenroy with grounding.",
+ "prediction": "[Fenroy](546,198),(906,1016)"
+ },
+ {
+ "id": 217,
+ "question": "Juan Lian is image_1\n Zi Xia is image_2\n Please describe the image: image_3\n",
+ "prediction": "Juan Lian is on the left, wearing a white robe with a black chest emblem, his right hand covering his mouth. Zi Xia is on the right, dressed in white with a side braid, looking towards the left. They appear to be in a traditional setting with a lantern and shelves in the background."
+ },
+ {
+ "id": 218,
+ "question": "Sun Wukong is image_1\n In the image: image_2\n Give a description.",
+ "prediction": "Sun Wukong is in the center of the image, engaged in a fierce battle with two opponents on each side, wielding a weapon with both hands."
+ },
+ {
+ "id": 219,
+ "question": "Juan Lian is image_1\n Zi Xia is image_2\n In the image: image_3\n What is Zi Xia doing?",
+ "prediction": "Zi Xia is standing with her hands clasped together."
+ },
+ {
+ "id": 220,
+ "question": "Sun Wukong is image_1\n Zi Xia is image_2\n In the image: image_3\n Who is sitting on top?",
+ "prediction": "Sun Wukong is sitting on top."
+ },
+ {
+ "id": 221,
+ "question": "Erlang Shen is image_1\n Juan Lian is image_2\n In the image: image_3\n Identify Erlang Shen with grounding.",
+ "prediction": "[Erlang Shen](29,5),(662,989)"
+ },
+ {
+ "id": 222,
+ "question": "Sun Wukong is image_1\n Zi Xia is image_2\n In the image: image_3\n Identify Zi Xia with grounding.",
+ "prediction": "[Zi Xia](142,223),(453,985)"
+ },
+ {
+ "id": 223,
+ "question": "Royce is image_1\n In the image: image_2\n Identify Royce with grounding.",
+ "prediction": "[Royce](606,0),(967,969)"
+ },
+ {
+ "id": 224,
+ "question": "Edwin is image_1\n Isabelle is image_2\n In the image: image_3\n Identify Isabelle with grounding.",
+ "prediction": "[Isabelle](385,195),(570,995)"
+ },
+ {
+ "id": 225,
+ "question": "Elizabeth Shaw is image_1\n In the image: image_2\n Identify Elizabeth Shaw with grounding.",
+ "prediction": "[Elizabeth Shaw](92,131),(307,996)"
+ },
+ {
+ "id": 226,
+ "question": "David is image_1\n Elizabeth Shaw is image_2\n In the image: image_3\n What is David doing?",
+ "prediction": "David is standing and looking at a wall screen."
+ },
+ {
+ "id": 227,
+ "question": "David is image_1\n Elizabeth Shaw is image_2\n In the image: image_3\n Give a description.",
+ "prediction": "David is lying on a table, and Elizabeth Shaw is leaning over him, appearing to be in a conversation or interaction."
+ },
+ {
+ "id": 228,
+ "question": "Hilly Holbrook is image_1\n Jolene French is image_2\n Elizabeth Leefolt is image_3\n In the image: image_4\n Identify Elizabeth Leefolt with grounding.",
+ "prediction": "[Elizabeth Leefolt](546,112),(821,987)"
+ },
+ {
+ "id": 229,
+ "question": "Hilly Holbrook is image_1\n Skeeter Phelan is image_2\n In the image: image_3\n Who is holding the other person's arms?",
+ "prediction": "Hilly Holbrook is holding Skeeter Phelan's arms."
+ },
+ {
+ "id": 230,
+ "question": "Skeeter Phelan is image_1\n Elizabeth Leefolt is image_2\n In the image: image_3\n who has a drink in front of herself?",
+ "prediction": "Skeeter Phelan has a drink in front of herself."
+ },
+ {
+ "id": 231,
+ "question": "Skeeter Phelan is image_1\n Aibileen Clark is image_2\n In the image: image_3\n Give a description.",
+ "prediction": "Skeeter Phelan is seated at a kitchen table, looking at Aibileen Clark who stands with her hand on the table, in a domestic kitchen setting."
+ },
+ {
+ "id": 232,
+ "question": "Hilly Holbrook is image_1\n Elizabeth Leefolt is image_2\n Jolene French is image_3\n In the image: image_4\n What does Jolene French wear?",
+ "prediction": "Jolene French is wearing a black dress with lace details."
+ },
+ {
+ "id": 233,
+ "question": "Aibileen Clark is image_1\n Minny Jackson is image_2\n In the image: image_3\n Identify Minny Jackson with grounding.",
+ "prediction": "[Minny Jackson](645,0),(837,983)"
+ },
+ {
+ "id": 234,
+ "question": "Aibileen is image_1\n In the image: image_2\n What is Aibileen doing?",
+ "prediction": "Aibileen is standing and holding a picture."
+ },
+ {
+ "id": 235,
+ "question": "Hilly Holbrook is image_1\n Elizabeth Leefolt is image_2\n Describe the content of the image: image_3\n",
+ "prediction": "Hilly Holbrook stands with her hands on her hips facing forward, while Elizabeth Leefolt holds a baby, looking away to the side."
+ },
+ {
+ "id": 236,
+ "question": "Meiqin is image_1\n Heizi is image_2\n Leizi is image_3\n Chuchun is image_4\n In the image: image_5\n Identify Leizi with grounding.",
+ "prediction": "[Leizi](10,260),(346,995)"
+ },
+ {
+ "id": 237,
+ "question": "Heizi is image_1\n Chuchun is image_2\n Leizi is image_3\n In the image: image_4\n Who is standing behind?",
+ "prediction": "Heizi is standing behind."
+ },
+ {
+ "id": 238,
+ "question": "Meiqin is image_1\n Shifeng is image_2\n In the image: image_3\n Give a description.",
+ "prediction": "Meiqin is seated at a library table reading a book, while Shifeng stands behind her, leaning over as if to get a closer look at the book or discuss it with Meiqin. They are surrounded by other students in a spacious library."
+ },
+ {
+ "id": 239,
+ "question": "Meiqin is image_1\n Heizi is image_2\n Leizi is image_3\n Chuchun is image_4\n In the image: image_5\n Who is squatting?",
+ "prediction": "Meiqin is squatting."
+ },
+ {
+ "id": 240,
+ "question": "Pei is image_1\n Heizi is image_2\n Leizi is image_3\n Chuchun is image_4\n In the image: image_5\n What is Chuchun doing?",
+ "prediction": "Chuchun is standing and looking towards Heizi."
+ },
+ {
+ "id": 241,
+ "question": "Meiqin is image_1\n Heizi is image_2\n Pei is image_3\n Describe the image: image_4\n",
+ "prediction": "Heizi stands confidently with her hands on her hips facing Meiqin, who is kneeling on the ground looking up at Heizi. Pei observes from behind, standing slightly apart from Heizi. They are on a rooftop with a clear sky above."
+ },
+ {
+ "id": 242,
+ "question": "Meiqin is image_1\n Pei is image_2\n Leizi is image_3\n Chuchun is image_4\n In the image: image_5\n Who is carrying Pei on her back?",
+ "prediction": "Leizi is carrying Pei on her back."
+ },
+ {
+ "id": 243,
+ "question": "Leizi is image_1\n Chuchun is image_2\n In the image: image_3\n What is Chuchun's experssion?",
+ "prediction": "Chuchun appears to be smiling."
+ },
+ {
+ "id": 244,
+ "question": "Meiqin is image_1\n Pei is image_2\n In the image: image_3\n Give a description.",
+ "prediction": "Pei, in a blue dress, is leaping over a railing, while Meiqin, in a brown shirt and skirt, appears to be dodging or falling."
+ },
+ {
+ "id": 245,
+ "question": "Meiqin is image_1\n Dangma is image_2\n In the image: image_3\n Identify Dangma with grounding.",
+ "prediction": "[Dangma](477,108),(734,994)"
+ },
+ {
+ "id": 246,
+ "question": "Meiqin is image_1\n Heizi is image_2\n Leizi is image_3\n Chuchun is image_4\n In the image: image_5\n Identify Heizi with grounding.",
+ "prediction": "[Heizi](57,509),(276,997)"
+ },
+ {
+ "id": 247,
+ "question": "Meiqin is image_1\n Heizi is image_2\n In the image: image_3\n Give a description.",
+ "prediction": "Meiqin is sitting at a table, holding a spoon near Heizi, who is leaning forward slightly towards the table. They are outdoors with greenery and flowers in the background."
+ },
+ {
+ "id": 248,
+ "question": "Meiqin is image_1\n Shifeng is image_2\n In the image: image_3\n What does Meiqin wear?",
+ "prediction": "Meiqin wears a black tank top."
+ },
+ {
+ "id": 249,
+ "question": "Dangma is image_1\n Leizi is image_2\n Describe the content of the image: image_3\n",
+ "prediction": "Dangma is on the left, facing a girl named Leizi on the right, who is holding a necklace towards Dangma in an outdoor setting with buildings in the background."
+ },
+ {
+ "id": 250,
+ "question": "Heizi is image_1\n Leizi is image_2\n Chuchun is image_3\n In the image: image_4\n What is Chuchun doing?",
+ "prediction": "Chuchun is pushing Heizi in a wheelchair."
+ },
+ {
+ "id": 251,
+ "question": "Runzi is image_1\n In the image: image_2\n Identify Runzi with grounding.",
+ "prediction": "[Runzi](108,172),(354,995)"
+ },
+ {
+ "id": 252,
+ "question": "Meiqin is image_1\n Heizi is image_2\n In the image: image_3\n Give a description.",
+ "prediction": "Heizi is on the left, touching her right eye, while Meiqin is on the right, facing Heizi. Both are in a corridor with railings on the sides."
+ },
+ {
+ "id": 253,
+ "question": "Meiqin is image_1\n Heizi is image_2\n In the image: image_3\n Who is holding the umbrella?",
+ "prediction": "Meiqin is holding the umbrella."
+ },
+ {
+ "id": 254,
+ "question": "Leizi is image_1\n In the image: image_2\n What color is Leizi's clothes?",
+ "prediction": "Leizi's clothes are grey with a red belt."
+ },
+ {
+ "id": 255,
+ "question": "Meiqin is image_1\n Heizi is image_2\n Leizi is image_3\n Chuchun is image_4\n In the image: image_5\n Identify Heizi with grounding.",
+ "prediction": "[Heizi](557,145),(867,994)"
+ },
+ {
+ "id": 256,
+ "question": "Tangsan is image_1\n Xiaowu is image_2\n Rongrong is image_3\n Zhuqing is image_4\n In the image: image_5\n Identify Rongrong with grounding.",
+ "prediction": "[Rongrong](664,187),(857,975)"
+ },
+ {
+ "id": 257,
+ "question": "Daimubai is image_1\n In the image: image_2\n What is Daimubai doing?",
+ "prediction": "Daimubai is standing with his arms crossed."
+ },
+ {
+ "id": 258,
+ "question": "Tangsan is image_1\n Xiaowu is image_2\n In the image: image_3\n Give a description.",
+ "prediction": "Tangsan, dressed in a blue outfit with a gold trim, stands on the left, and Xiaowu, wearing a pink dress with bunny ears, is on the right. They appear to be in a forest at night with glowing plants."
+ },
+ {
+ "id": 259,
+ "question": "Tangsan is image_1\n Xiaowu is image_2\n Rongrong is image_3\n Aosika is image_4\n In the image: image_5\n Give a description.",
+ "prediction": "Tangsan, dressed in a blue suit, is standing on the left. Xiaowu, in a pink outfit, is adjusting Tangsan's clothes from behind on the left. Rongrong, wearing green, is holding Tangsan from behind on the right. Aosika, in a brown leather outfit, is on the far right side. They are all against a backdrop with glowing lights."
+ },
+ {
+ "id": 260,
+ "question": "Xiaose is image_1\n Wuxin is image_2\n In the image: image_3\n What is Wuxin doing?",
+ "prediction": "Wuxin is engaged in a close combat with Xiaose."
+ },
+ {
+ "id": 261,
+ "question": "Xiaose is image_1\n Wuxin is image_2\n Leiwujie is image_3\n In the image: image_4\n Provide description of visual content.",
+ "prediction": "Wuxin is sitting on the ground to the left, working on something by the fire. Leiwujie is standing on the right, in a relaxed pose with an arm behind his back. Xiaose is not visible in the image."
+ },
+ {
+ "id": 262,
+ "question": "Xiaose is image_1\n Wuxin is image_2\n Baifa is image_3\n Leiwujie is image_4\n In the image: image_5\n Identify Baifa with grounding.",
+ "prediction": "[Baifa](16,125),(229,988)"
+ },
+ {
+ "id": 263,
+ "question": "Tanglian is image_1\n In the image: image_2\n Identify Tanglian with grounding.",
+ "prediction": "[Tanglian](229,302),(528,988)"
+ },
+ {
+ "id": 264,
+ "question": "Qianluo is image_1\n Tanglian is image_2\n Rui is image_3\n In the image: image_4\n Give a description.",
+ "prediction": "Qianluo is seated on the left, wearing a blue outfit with a white frontlet. Tanglian is seated on the right, dressed in black with a red frontlet. Rui is seated beside Tanglian, adorned in a golden outfit. They appear to be engaged in a conversation in a room with pink curtains."
+ },
+ {
+ "id": 265,
+ "question": "Xiaose is image_1\n Leiwujie is image_2\n In the image: image_3\n What is Xiaose doing?",
+ "prediction": "Xiaose is sitting with their hand on their chin."
+ },
+ {
+ "id": 266,
+ "question": "Xiaose is image_1\n Qianluo is image_2\n Tanglian is image_3\n Leiwujie is image_4\n In the image: image_5\n Identify Qianluo with grounding.",
+ "prediction": "[Qianluo](203,239),(371,861)"
+ },
+ {
+ "id": 267,
+ "question": "Yuechu is image_1\n Susu is image_2\n In the image: image_3\n Identify Susu with grounding.",
+ "prediction": "[Susu](510,525),(903,995)"
+ },
+ {
+ "id": 268,
+ "question": "Yuechu is image_1\n Susu is image_2\n In the image: image_3\n What is Yuechu doing?",
+ "prediction": "Yuechu is holding a speech bubble with Chinese characters."
+ },
+ {
+ "id": 269,
+ "question": "Yuechu is image_1\n Susu is image_2\n In the image: image_3\n Give a description.",
+ "prediction": "Yuechu is on the left, holding a red popsicle, and Susu is on the right, wearing a multicolored kimono with a pointed tail. They appear to be standing against a clear sky with greenery in the background."
+ },
+ {
+ "id": 270,
+ "question": "Rongrong is image_1\n Yaya is image_2\n In the image: image_3\n Identify Rongrong with grounding.",
+ "prediction": "[Rongrong](28,242),(478,981)"
+ },
+ {
+ "id": 271,
+ "question": "Fugui is image_1\n Qingtong is image_2\n In the image: image_3\n What is Fugui doing?",
+ "prediction": "Fugui is embracing Qingtong."
+ },
+ {
+ "id": 272,
+ "question": "Yuechu is image_1\n Susu is image_2\n Describe the image: image_3\n",
+ "prediction": "Yuechu is standing on the left, drawing on a sketchbook. Susu is on the right, watching Yuechu with a pole in her hand. They are indoors with a wooden background."
+ },
+ {
+ "id": 273,
+ "question": "Yuechu is image_1\n Susu is image_2\n In the image: image_3\n Give a description.",
+ "prediction": "Susu is sitting on the ground next to Yuechu, who is lying down with their eyes closed. They appear to be in a destroyed village setting under a reddish sky."
+ },
+ {
+ "id": 274,
+ "question": "Aniya is image_1\n Fujie is image_2\n Yueer is image_3\n In the image: image_4\n Who is sitting on the chair?",
+ "prediction": "Fujie is sitting on the chair."
+ },
+ {
+ "id": 275,
+ "question": "Aniya is image_1\n Fujie is image_2\n In the image: image_3\n What is Aniya doing?",
+ "prediction": "Aniya is hiding behind the door."
+ },
+ {
+ "id": 276,
+ "question": "Aniya is image_1\n In the image: image_2\n Identify Aniya with grounding.",
+ "prediction": "[Aniya](97,373),(659,983)"
+ },
+ {
+ "id": 277,
+ "question": "Fujie is image_1\n Yueer is image_2\n In the image: image_3\n What is Yueer doing?",
+ "prediction": "Yueer is leaning towards Fujie's face with her hand raised."
+ },
+ {
+ "id": 278,
+ "question": "Aniya is image_1\n Fujie is image_2\n Yueer is image_3\n In the image: image_4\n What does Yueer hold?",
+ "prediction": "Yueer holds a picnic basket."
+ },
+ {
+ "id": 279,
+ "question": "Aniya is image_1\n Fujie is image_2\n Yueer is image_3\n Descirbe the image: image_4\n",
+ "prediction": "Aniya is a young girl in a red jacket, standing between Fujie, who is dressed in a suit holding a gift, and Yueer, wearing a pink dress with shopping bags. They appear to be after a successful shopping trip."
+ },
+ {
+ "id": 280,
+ "question": "Aniya is image_1\n Fujie is image_2\n Yueer is image_3\n In the image: image_4\n Who is near the window?",
+ "prediction": "Fujie is near the window."
+ },
+ {
+ "id": 281,
+ "question": "Fujie is image_1\n Yueer is image_2\n In the image: image_3\n Describe Yueer's outfit.",
+ "prediction": "Yueer is wearing a blue dress with a yellow flower on the side."
+ },
+ {
+ "id": 282,
+ "question": "Aniya is image_1\n Fujie is image_2\n Yueer is image_3\n In the image: image_4\n Give a description.",
+ "prediction": "Aniya is sitting on the floor, looking at Fujie, who is sitting on a sofa reading a paper. Yueer is kneeling on the right, also looking at Fujie. They are in a living room with a fireplace and a chandelier."
+ },
+ {
+ "id": 283,
+ "question": "Aniya is image_1\n Fujie is image_2\n Yueer is image_3\n What do you see in the image: image_4\n",
+ "prediction": "Aniya is sitting on Fujie's lap, leaning against a cloudy sky backdrop. Fujie is holding onto Yueer, who appears to be standing slightly behind with a focused expression."
+ },
+ {
+ "id": 284,
+ "question": "Fujie is image_1\n Yueer is image_2\n Beiji is image_3\n In the image: image_4\n Give a description.",
+ "prediction": "Fujie is sitting on a sofa with a surprised expression, while Yueer is standing beside her holding a cat. Beiji is sitting on the floor, looking towards Fujie and Yueer. The room has a cozy Japanese style interior."
+ },
+ {
+ "id": 285,
+ "question": "Aniya is image_1\n Fujie is image_2\n Provide a description of the image: image_3\n",
+ "prediction": "Aniya is riding a surfboard with a girl in the front, while Fujie is lying on a surfboard in the back, both are in the middle of the ocean with small waves."
+ },
+ {
+ "id": 286,
+ "question": "Aniya is image_1\n Fujie is image_2\n Yueer is image_3\n In the image: image_4\n What expression is on Yueer's face?",
+ "prediction": "Yueer is smiling with her eyes closed."
+ },
+ {
+ "id": 287,
+ "question": "Aniya is image_1\n Cizi is image_2\n In the image: image_3\n What is Cizi's emotion?",
+ "prediction": "Cizi appears to be angry."
+ },
+ {
+ "id": 288,
+ "question": "Aniya is image_1\n Fujie is image_2\n In the image: image_3\n Give a description.",
+ "prediction": "Aniya is lying in bed, while Fujie is leaning over, looking at a clock."
+ },
+ {
+ "id": 289,
+ "question": "Aniya is image_1\n Fujie is image_2\n Yueer is image_3\n In the image: image_4\n What is Fujie doing?",
+ "prediction": "Fujie is sitting and holding a drink."
+ },
+ {
+ "id": 290,
+ "question": "Aniya is image_1\n Fujie is image_2\n In the image: image_3\n Describe the content.",
+ "prediction": "Aniya is seated at a table, focused on writing on pieces of paper, while Fujie stands behind her, gesturing as if he's explaining something."
+ },
+ {
+ "id": 291,
+ "question": "Aniya is image_1\n Beiji is image_2\n Cizi is image_3\n In the image: image_4\n Identify Cizi with grounding.",
+ "prediction": "[Cizi](579,230),(748,1020)"
+ },
+ {
+ "id": 292,
+ "question": "Aniya is image_1\n Fujie is image_2\n Yueer is image_3\n In the image: image_4\n Whose arms is Aniya in?",
+ "prediction": "Aniya is in Fujie's arms."
+ },
+ {
+ "id": 293,
+ "question": "Aniya is image_1\n Fujie is image_2\n Yueer is image_3\n In the image: image_4\n Give a description.",
+ "prediction": "Aniya is standing on one leg with a stretched arm, seemingly in a dance pose. Fujie is sitting on the couch, partially visible on the right side. Yueer is standing behind Aniya, with her body angled towards the left side of the image."
+ },
+ {
+ "id": 294,
+ "question": "Ranbing is image_1\n In the image: image_2\n Identify Ranbing with grounding.",
+ "prediction": "[Ranbing](150,274),(331,966)"
+ },
+ {
+ "id": 295,
+ "question": "Make is image_1\n Ranbing is image_2\n In the image: image_3\n Give a description.",
+ "prediction": "Make stands on the right in a suit, facing Ranbing, who is on the left in a bridal gown with a veil. They are surrounded by guests in a wedding setting."
+ },
+ {
+ "id": 296,
+ "question": "Ailika is image_1\n In the image: image_2\n What is Ailika doing?",
+ "prediction": "Ailika is sitting in a vehicle with her arm raised."
+ },
+ {
+ "id": 297,
+ "question": "Baiyuekui is image_1\n Xiadou is image_2\n In the image: image_3\n Identify Xiadou with grounding.",
+ "prediction": "[Xiadou](450,209),(757,838)"
+ },
+ {
+ "id": 298,
+ "question": "Hongkou is image_1\n In the image: image_2\n What is Hongkou doing?",
+ "prediction": "Hongkou is holding a gun and seems to be in a conversation or negotiation."
+ },
+ {
+ "id": 299,
+ "question": "Chengxiaoshi is image_1\n Luguang is image_2\n Qiaoling is image_3\n In the image: image_4\n Identify Chengxiaoshi with grounding.",
+ "prediction": "[Chengxiaoshi](267,198),(493,891)"
+ },
+ {
+ "id": 300,
+ "question": "Chengxiaoshi is image_1\n Qiaoling is image_2\n In the image: image_3\n Give a description.",
+ "prediction": "Qiaoling stands to the left with her body facing slightly right, wearing a school uniform. Chengxiaoshi is on the right, raising his hands with a smile, wearing a jacket with leaves on it. They appear to be outside near a window and a brick wall."
+ },
+ {
+ "id": 301,
+ "question": "Chengxiaoshi is image_1\n Luguang is image_2\n Qiaoling is image_3\n In the image: image_4\n Who is opening the door?",
+ "prediction": "Qiaoling is opening the door."
+ },
+ {
+ "id": 302,
+ "question": "Chengxiaoshi is image_1\n Luguang is image_2\n In the image: image_3\n What is Chengxiaoshi doing?",
+ "prediction": "Chengxiaoshi is standing next to Luguang."
+ },
+ {
+ "id": 303,
+ "question": "Luguang is image_1\n Qiaoling is image_2\n In the image: image_3\n Identify Luguang with grounding.",
+ "prediction": "[Luguang](43,103),(403,983)"
+ },
+ {
+ "id": 304,
+ "question": "Cody is image_1\n May is image_2\n In the image: image_3\n Identify May with grounding.",
+ "prediction": "[May](150,184),(407,937)"
+ },
+ {
+ "id": 305,
+ "question": "Cody is image_1\n May is image_2\n In the image: image_3\n What is Cody doing?",
+ "prediction": "Cody is holding a large rock."
+ },
+ {
+ "id": 306,
+ "question": "Cody is image_1\n May is image_2\n In the image: image_3\n Who is carrying the red magnet?",
+ "prediction": "Cody is carrying the red magnet."
+ },
+ {
+ "id": 307,
+ "question": "Bob parr is image_1\n Elastigirl is image_2\n Dashiell is image_3\n Violet parr is image_4\n In the image: image_5\n Identify Elastigirl with grounding.",
+ "prediction": "[Elastigirl](645,129),(950,972)"
+ },
+ {
+ "id": 308,
+ "question": "Elastigirl is image_1\n Dashiell is image_2\n Violet parr is image_3\n Jack-jack parr is image_4\n In the image: image_5\n Who is holding Jack-jack in arms?",
+ "prediction": "Violet parr."
+ },
+ {
+ "id": 309,
+ "question": "Bob parr is image_1\n Dashiell is image_2\n Violet parr is image_3\n In the image: image_4\n Identify Violet parr with grounding.",
+ "prediction": "[Violet parr](735,338),(978,986)"
+ },
+ {
+ "id": 310,
+ "question": "Elastigirl is image_1\n Jack-jack parr is image_2\n In the image: image_3\n Give a description.",
+ "prediction": "Elastigirl is standing in a kitchen, holding JackJack Parr's head above a sink filled with water and soap."
+ },
+ {
+ "id": 311,
+ "question": "Elastigirl is image_1\n Dashiell is image_2\n Jack-jack parr is image_3\n In the image: image_4\n What is Dashiell doing?",
+ "prediction": "Dashiell is sitting at the dinner table."
+ },
+ {
+ "id": 312,
+ "question": "Bob parr is image_1\n Elastigirl is image_2\n Dashiell is image_3\n Violet parr is image_4\n Jack-jack parr is image_5\n In the image: image_6\n Identify Bob parr with grounding.",
+ "prediction": "[Bob parr](114,38),(367,951)"
+ },
+ {
+ "id": 313,
+ "question": "Bob parr is image_1\n/img>\n In the image: image_2\n What is Bob parr doing?",
+ "prediction": "Bob parr is pouring a drink from a pitcher."
+ },
+ {
+ "id": 314,
+ "question": "Bob parr is image_1\n Elastigirl is image_2\n Jack-jack parr is image_3\n In the image: image_4\n Give a description.",
+ "prediction": "Elastigirl is sitting on a red motorcycle, looking to her right. Bob Parr is standing to her left, holding a small creature. JackJack Parr is standing between them, slightly behind. They are in a dimly lit room."
+ },
+ {
+ "id": 315,
+ "question": "Woody is image_1\n Jessie is image_2\n In the image: image_3\n Identify Jessie with grounding.",
+ "prediction": "[Jessie](7,35),(525,983)"
+ },
+ {
+ "id": 316,
+ "question": "Buzz is image_1\n Jessie is image_2\n In the image: image_3\n Give a description.",
+ "prediction": "Buzz Lightyear is playfully tussling with Jessie on a wooden floor."
+ },
+ {
+ "id": 317,
+ "question": "Woody is image_1\n Jessie is image_2\n Describe the content of the image: image_3\n",
+ "prediction": "Woody and Jessie are standing close to each other, surrounded by various characters from the Toy Story series."
+ },
+ {
+ "id": 318,
+ "question": "Woody is image_1\n Buzz is image_2\n Lotso is image_3\n In the image: image_4\n Identify Woody with grounding.",
+ "prediction": "[Woody](785,62),(951,820)"
+ },
+ {
+ "id": 319,
+ "question": "Woody is image_1\n Buzz is image_2\n Jessie is image_3\n In the image: image_4\n Who is Buzz looking at?",
+ "prediction": "Buzz is looking at Woody."
+ },
+ {
+ "id": 320,
+ "question": "Betty is image_1\n In the image: image_2\n Identify Betty with grounding.",
+ "prediction": "[Betty](489,105),(905,887)"
+ },
+ {
+ "id": 321,
+ "question": "Woody is image_1\n Buzz is image_2\n In the image: image_3\n Which hand of the boy is Buzz in?",
+ "prediction": "Buzz is on the left hand of the boy."
+ },
+ {
+ "id": 322,
+ "question": "Woody is image_1\n Buzz is image_2\n In the image: image_3\n What is Woody doing?",
+ "prediction": "Woody is standing with his back slightly turned."
+ },
+ {
+ "id": 323,
+ "question": "Buzz is image_1\n Jessie is image_2\n Rex is image_3\n In the image: image_4\n Who is being pressed at the bottom?",
+ "prediction": "Rex is being pressed at the bottom."
+ },
+ {
+ "id": 324,
+ "question": "Woody is image_1\n Buzz is image_2\n Jessie is image_3\n In the image: image_4\n Give a description.",
+ "prediction": "Woody stands on the left, Buzz in the center, and Jessie on the right, surrounded by various toy characters in a colorful toy room."
+ },
+ {
+ "id": 325,
+ "question": "Woody is image_1\n Buzz is image_2\n Describe the image: image_3\n",
+ "prediction": "Woody on the left is holding up his right hand while Buzz on the right is holding up a purple object in a room filled with various toys."
+ },
+ {
+ "id": 326,
+ "question": "Woody is image_1\n Buzz is image_2\n Bo peep is image_3\n In the image: image_4\n What is Bo peep doing?",
+ "prediction": "Bo peep is walking with a sheep."
+ },
+ {
+ "id": 327,
+ "question": "Woody is image_1\n Bo peep is image_2\n In the image: image_3\n Give a description.",
+ "prediction": "Woody is lying on his back on the grass, and Bo Peep is sitting on top of him, leaning closely towards him."
+ },
+ {
+ "id": 328,
+ "question": "Woody is image_1\n Buzz is image_2\n Please give a summary of the image: image_3\n",
+ "prediction": "Woody is sitting on a red couch with his hands up in the air, while Buzz is standing with his arms spread out wide, both against a backdrop of a vibrant, colorful scene."
+ },
+ {
+ "id": 329,
+ "question": "Woody is image_1\n Buzz is image_2\n Jessie is image_3\n Rex is image_4\n In the image: image_5\n Identify Rex with grounding.",
+ "prediction": "[Rex](767,357),(983,826)"
+ },
+ {
+ "id": 330,
+ "question": "Woody is image_1\n Buzz is image_2\n Jessie is image_3\n Bo peep is image_4\n In the image: image_5\n Who is on the right of Bo peep?",
+ "prediction": "Woody is on the right of Bo peep."
+ },
+ {
+ "id": 331,
+ "question": "Fuheihui is image_1\n Qiangwei is image_2\n Wutiaowu is image_3\n Qihai is image_4\n In the image: image_5\n Identify Fuheihui with grounding.",
+ "prediction": "[Fuheihui](389,116),(935,978)"
+ },
+ {
+ "id": 332,
+ "question": "Lizi is image_1\n In the image: image_2\n What is Lizi doing?",
+ "prediction": "Lizi is standing with her hands on her hips."
+ },
+ {
+ "id": 333,
+ "question": "Wutiaowu is image_1\n Xiayoujie is image_2\n In the image: image_3\n Give a description.",
+ "prediction": "Wutiaowu is seated facing away, looking out a cityscape, while Xiayoujie stands beside him facing towards the viewer."
+ },
+ {
+ "id": 334,
+ "question": "Wutiaowu is image_1\n Lizi is image_2\n In the image: image_3\n What is Wutiaowu doing?",
+ "prediction": "Wutiaowu is sitting and embracing Lizi."
+ },
+ {
+ "id": 335,
+ "question": "Wutiaowu is image_1\n Xiayoujie is image_2\n In the image: image_3\n What is Xiayoujie's expression?",
+ "prediction": "Xiayoujie looks surprised or in a state of excitement."
+ },
+ {
+ "id": 336,
+ "question": "Huzhang is image_1\n Fuheihui is image_2\n Qiangwei is image_3\n Wutiaowu is image_4\n In the image: image_5\n Who is sitting on the sofa?",
+ "prediction": "Huzhang is sitting on the sofa."
+ },
+ {
+ "id": 337,
+ "question": "Dongtang is image_1\n Zhenren is image_2\n In the image: image_3\n What is Zhenren doing?",
+ "prediction": "Zhenren is forcefully pushing Dongtang away."
+ },
+ {
+ "id": 338,
+ "question": "Huzhang is image_1\n Fuheihui is image_2\n Goujuan is image_3\n In the image: image_4\n Give a description.",
+ "prediction": "Huzhang is on the right, making a peace sign with his fingers. Fuheihui is in the middle, slightly turned to his left, with one hand covering his face. Goujuan is on the left, gesturing with both hands towards his chest. They all appear to accompany their gestures with smiles."
+ },
+ {
+ "id": 339,
+ "question": "Xiayoujie is image_1\n In the image: image_2\n What is Xiayoujie doing?",
+ "prediction": "Xiayoujie is sitting and reading a book."
+ },
+ {
+ "id": 340,
+ "question": "Qihai is image_1\n In the image: image_2\n Identify Qihai with grounding.",
+ "prediction": "[Qihai](153,239),(606,977)"
+ },
+ {
+ "id": 341,
+ "question": "Huzhang is image_1\n Mingming is image_2\n In the image: image_3\n Identify Mingming with grounding.",
+ "prediction": "[Mingming](589,433),(767,988)"
+ },
+ {
+ "id": 342,
+ "question": "Louhu is image_1\n In the image: image_2\n Identify Louhu with grounding.",
+ "prediction": "[Louhu](221,250),(560,968)"
+ },
+ {
+ "id": 343,
+ "question": "Fuheihui is image_1\n Qiangwei is image_2\n In the image: image_3\n Identify Qiangwei with grounding.",
+ "prediction": "[Qiangwei](96,131),(443,988)"
+ },
+ {
+ "id": 344,
+ "question": "Huzhang is image_1\n Louhu is image_2\n Give a content description of the image: image_3\n",
+ "prediction": "Louhu, wearing a spotted outfit, is holding Huzhang, who appears to be in a relaxed position on the ground."
+ },
+ {
+ "id": 345,
+ "question": "Wutiaowu is image_1\n Xiayoujie is image_2\n In the image: image_3\n What does Wutiaowu wear?",
+ "prediction": "Wutiaowu is wearing a red jacket over a white shirt."
+ },
+ {
+ "id": 346,
+ "question": "Wutiaowu is image_1\n Shener is image_2\n In the image: image_3\n Give a description.",
+ "prediction": "Wutiaowu is in a combat stance with a sword in hand, positioned as if ready to strike. Shener is in a defensive pose with a sword, facing Wutiaowu. They seem to be in a tense altercation under a red torii gate in a wooded area."
+ },
+ {
+ "id": 347,
+ "question": "Wutiaowu is image_1\n Xiayoujie is image_2\n Lizi is image_3\n In the image: image_4\n Identify Xiayoujie with grounding.",
+ "prediction": "[Xiayoujie](753,101),(998,978)"
+ },
+ {
+ "id": 348,
+ "question": "Huzhang is image_1\n Qiangwei is image_2\n In the image: image_3\n Give a description.",
+ "prediction": "Qiangwei, wearing a blue outfit, is gesturing with her right hand towards Huzhang, who is dressed in a red outfit with spiky hair. They appear to be in a conversation."
+ },
+ {
+ "id": 349,
+ "question": "Huzhang is image_1\n Fuheihui is image_2\n Qiangwei is image_3\n Please explain what's happening in the photo: image_4\n",
+ "prediction": "Huzhang is standing on the left, wearing a red scarf and a dark uniform with his fist clenched. Fuheihui is on the right, in a brown uniform, also with a fists clasped. Qiangwei is in the center, partially obscured, facing right, wearing a blue uniform."
+ },
+ {
+ "id": 350,
+ "question": "Huzhang is image_1\n Fuheihui is image_2\n Qiangwei is image_3\n In the image: image_4\n Identify Huzhang with grounding.",
+ "prediction": "[Huzhang](155,108),(596,972)"
+ },
+ {
+ "id": 351,
+ "question": "Ningguang is image_1\n Beidou is image_2\n In the image: image_3\n Give a description.",
+ "prediction": "Ningguang, on the left, is standing behind a table looking towards Beidou, who is leaning on the table with a relaxed posture, both surrounded by a lush forest setting."
+ },
+ {
+ "id": 352,
+ "question": "Zhongli is image_1\n Leishen is image_2\n Funingna is image_3\n In the image: image_4\n Identify Leishen with grounding.",
+ "prediction": "[Leishen](546,217),(839,987)"
+ },
+ {
+ "id": 353,
+ "question": "Hutao is image_1\n Yelan is image_2\n Xiao is image_3\n In the image: image_4\n What is Xiao doing?",
+ "prediction": "Xiao is walking to the right."
+ },
+ {
+ "id": 354,
+ "question": "Linghua is image_1\n Lingren is image_2\n In the image: image_3\n What is in Lingren's hand?",
+ "prediction": "Lingren is holding a teapot."
+ },
+ {
+ "id": 355,
+ "question": "Wulang is image_1\n In the image: image_2\n Identify Wulang with grounding.",
+ "prediction": "[Wulang](256,190),(456,933)"
+ },
+ {
+ "id": 356,
+ "question": "Abeiduo is image_1\n Kong is image_2\n In the image: image_3\n Who is holding a sword?",
+ "prediction": "Kong is holding a sword."
+ },
+ {
+ "id": 357,
+ "question": "Diluke is image_1\n Qin is image_2\n In the image: image_3\n Identify Qin with grounding.",
+ "prediction": "[Qin](135,210),(359,995)"
+ },
+ {
+ "id": 358,
+ "question": "Ningguang is image_1\n Kong is image_2\n Describe the image: image_3\n",
+ "prediction": "Ningguang is seated to the left, roasting marshmallows on a campfire, while Kong is seated to the right, looking on. They are surrounded by a forest and clear sky."
+ },
+ {
+ "id": 359,
+ "question": "Keqing is image_1\n Ying is image_2\n Give a content description of the image: image_3\n",
+ "prediction": "Keqing is on the left, wearing a purple dress with white cat ears, standing next to Ying, who is on the right wearing a blue gladiator-style outfit with a cape. They are in front of a mountainous backdrop."
+ },
+ {
+ "id": 360,
+ "question": "Regina Lampert is image_0\n In the following four images, Which is Regina Lampert? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 1"
+ },
+ {
+ "id": 361,
+ "question": "Peter Joshua is image_0\n In the following four images, Which is Peter Joshua? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 3"
+ },
+ {
+ "id": 362,
+ "question": "Peter Joshua is image_0\n In the following four images, Which is Peter Joshua? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 1"
+ },
+ {
+ "id": 363,
+ "question": "Hamilton Bartholomew is image_0\n In the following four images, Which is Hamilton Bartholomew? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 1"
+ },
+ {
+ "id": 364,
+ "question": "Kazan is image_0\n In the following four images, Which is Kazan? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 3"
+ },
+ {
+ "id": 365,
+ "question": "Worth is image_0\n In the following four images, Which is Worth? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 4"
+ },
+ {
+ "id": 366,
+ "question": "Worth is image_0\n In the following four images, Which is Worth? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 2"
+ },
+ {
+ "id": 367,
+ "question": "Worth is image_0\n In the following four images, Which is Worth? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 3"
+ },
+ {
+ "id": 368,
+ "question": "Quentin is image_0\n In the following four images, Which is Quentin? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 1"
+ },
+ {
+ "id": 369,
+ "question": "Holloway is image_0\n In the following four images, Which is Holloway? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 1"
+ },
+ {
+ "id": 370,
+ "question": "Leaven is image_0\n In the following four images, Which is Leaven? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 4"
+ },
+ {
+ "id": 371,
+ "question": "Leaven is image_0\n In the following four images, Which is Leaven? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 4"
+ },
+ {
+ "id": 372,
+ "question": "Agent Fox Mulder is image_0\n In the following four images, Which is Agent Fox Mulder? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 2"
+ },
+ {
+ "id": 373,
+ "question": "Agent Dana Scully is image_0\n In the following four images, Which is Agent Dana Scully? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 3"
+ },
+ {
+ "id": 374,
+ "question": "Reed Richards is image_0\n In the following four images, Which is Reed Richards? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 2"
+ },
+ {
+ "id": 375,
+ "question": "Johnny Storm is image_0\n In the following four images, Which is Johnny Storm? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 1"
+ },
+ {
+ "id": 376,
+ "question": "Sue Storm is image_0\n In the following four images, Which is Sue Storm? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 2"
+ },
+ {
+ "id": 377,
+ "question": "Victor Von Doom is image_0\n In the following four images, Which is Victor Von Doom? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 1"
+ },
+ {
+ "id": 378,
+ "question": "Sharon is image_0\n In the following four images, Which is Sharon? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 4"
+ },
+ {
+ "id": 379,
+ "question": "Burke Dennings is image_0\n In the following four images, Which is Burke Dennings? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 1"
+ },
+ {
+ "id": 380,
+ "question": "Jen Yu (Mandarin version) is image_0\n In the following four images, Which is Jen Yu (Mandarin version)? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 4"
+ },
+ {
+ "id": 381,
+ "question": "Master Li Mu Bai is image_0\n In the following four images, Which is Master Li Mu Bai? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 1"
+ },
+ {
+ "id": 382,
+ "question": "Yu Shu Lien is image_0\n In the following four images, Which is Yu Shu Lien? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 1"
+ },
+ {
+ "id": 383,
+ "question": "Lo 'Dark Cloud' is image_0\n In the following four images, Which is Lo 'Dark Cloud'? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 1"
+ },
+ {
+ "id": 384,
+ "question": "Evan is image_0\n In the following four images, Which is Evan? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 2"
+ },
+ {
+ "id": 385,
+ "question": "Andrea is image_0\n In the following four images, Which is Andrea? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 3"
+ },
+ {
+ "id": 386,
+ "question": "Lenny is image_0\n In the following four images, Which is Lenny? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 3"
+ },
+ {
+ "id": 387,
+ "question": "Kayleigh is image_0\n In the following four images, Which is Kayleigh? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 1"
+ },
+ {
+ "id": 388,
+ "question": "antelope is image_0\n In the following four images, Which is antelope? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 1"
+ },
+ {
+ "id": 389,
+ "question": "appaloosa is image_0\n In the following four images, Which is appaloosa? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 1"
+ },
+ {
+ "id": 390,
+ "question": "arabiancamel is image_0\n In the following four images, Which is arabiancamel? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 3"
+ },
+ {
+ "id": 391,
+ "question": "asiancrocodile is image_0\n In the following four images, Which is asiancrocodile? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 4"
+ },
+ {
+ "id": 392,
+ "question": "belgianhare is image_0\n In the following four images, Which is belgianhare? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 3"
+ },
+ {
+ "id": 393,
+ "question": "bighorn is image_0\n In the following four images, Which is bighorn? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 3"
+ },
+ {
+ "id": 394,
+ "question": "bovine is image_0\n In the following four images, Which is bovine? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 4"
+ },
+ {
+ "id": 395,
+ "question": "cheetah is image_0\n In the following four images, Which is cheetah? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 2"
+ },
+ {
+ "id": 396,
+ "question": "cheviot is image_0\n In the following four images, Which is cheviot? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 1"
+ },
+ {
+ "id": 397,
+ "question": "dallsheep is image_0\n In the following four images, Which is dallsheep? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 1"
+ },
+ {
+ "id": 398,
+ "question": "elk is image_0\n In the following four images, Which is elk? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 2"
+ },
+ {
+ "id": 399,
+ "question": "forestgoat is image_0\n In the following four images, Which is forestgoat? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 4"
+ },
+ {
+ "id": 400,
+ "question": "The reference vehicle is image_0\n In the following four images, Which is the reference vehicle? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 3"
+ },
+ {
+ "id": 401,
+ "question": "The reference vehicle is image_0\n In the following four images, Which is the reference vehicle? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 3"
+ },
+ {
+ "id": 402,
+ "question": "The reference vehicle is image_0\n In the following four images, Which is the reference vehicle? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 1"
+ },
+ {
+ "id": 403,
+ "question": "The reference vehicle is image_0\n In the following four images, Which is the reference vehicle? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 2"
+ },
+ {
+ "id": 404,
+ "question": "The reference vehicle is image_0\n In the following four images, Which is the reference vehicle? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 1"
+ },
+ {
+ "id": 405,
+ "question": "The reference vehicle is image_0\n In the following four images, Which is the reference vehicle? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 1"
+ },
+ {
+ "id": 406,
+ "question": "The reference vehicle is image_0\n In the following four images, Which is the reference vehicle? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 1"
+ },
+ {
+ "id": 407,
+ "question": "The reference vehicle is image_0\n In the following four images, Which is the reference vehicle? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 1"
+ },
+ {
+ "id": 408,
+ "question": "The reference vehicle is image_0\n In the following four images, Which is the reference vehicle? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 1"
+ },
+ {
+ "id": 409,
+ "question": "The reference vehicle is image_0\n In the following four images, Which is the reference vehicle? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 1"
+ },
+ {
+ "id": 410,
+ "question": "Willem_Merkxtuin is image_0\n In the following four images, Which is Willem_Merkxtuin? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 4"
+ },
+ {
+ "id": 411,
+ "question": "Ch%C3%A2teau_de_Chenonceau is image_0\n In the following four images, Which is Ch%C3%A2teau_de_Chenonceau? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 4"
+ },
+ {
+ "id": 412,
+ "question": "Munshi_Ghat is image_0\n In the following four images, Which is Munshi_Ghat? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 3"
+ },
+ {
+ "id": 413,
+ "question": "Burg_Heidenreichstein is image_0\n In the following four images, Which is Burg_Heidenreichstein? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 3"
+ },
+ {
+ "id": 414,
+ "question": "Santa_Maria_in_Cappella_(Rome) is image_0\n In the following four images, Which is Santa_Maria_in_Cappella_(Rome)? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 1"
+ },
+ {
+ "id": 415,
+ "question": "%C3%89glise_Saint-Martin_(Laon) is image_0\n In the following four images, Which is %C3%89glise_Saint-Martin_(Laon)? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 4"
+ },
+ {
+ "id": 416,
+ "question": "Bizzell_Memorial_Library is image_0\n In the following four images, Which is Bizzell_Memorial_Library? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 4"
+ },
+ {
+ "id": 417,
+ "question": "Hiyoshi_Taisha is image_0\n In the following four images, Which is Hiyoshi_Taisha? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 3"
+ },
+ {
+ "id": 418,
+ "question": "Michelangelo's_Moses is image_0\n In the following four images, Which is Michelangelo's_Moses? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 2"
+ },
+ {
+ "id": 419,
+ "question": "%C4%BDubov%C5%88a_Castle is image_0\n In the following four images, Which is %C4%BDubov%C5%88a_Castle? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 3"
+ },
+ {
+ "id": 420,
+ "question": "Coll%C3%A9giale_Notre-Dame_de_Vernon is image_0\n In the following four images, Which is Coll%C3%A9giale_Notre-Dame_de_Vernon? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 2"
+ },
+ {
+ "id": 421,
+ "question": "Cathedral_of_Guadalajara,_Mexico is image_0\n In the following four images, Which is Cathedral_of_Guadalajara,_Mexico? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 3"
+ },
+ {
+ "id": 422,
+ "question": "Kankalini_Temple,_Saptari is image_0\n In the following four images, Which is Kankalini_Temple,_Saptari? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 3"
+ },
+ {
+ "id": 423,
+ "question": "Wat_Thewarat_Kunchon is image_0\n In the following four images, Which is Wat_Thewarat_Kunchon? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 3"
+ },
+ {
+ "id": 424,
+ "question": "Moszna_Castle is image_0\n In the following four images, Which is Moszna_Castle? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 3"
+ },
+ {
+ "id": 425,
+ "question": "Cathedral-Basilica_of_Mary,_Queen_of_the_World is image_0\n In the following four images, Which is Cathedral-Basilica_of_Mary,_Queen_of_the_World? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 3"
+ },
+ {
+ "id": 426,
+ "question": "Helsinki_Lutheran_Cathedral is image_0\n In the following four images, Which is Helsinki_Lutheran_Cathedral? Image 1: image_1\n Image 2: image_2\n Image 3: image_3\n Image 4: image_4\n",
+ "prediction": "Image 2"
+ }
+]
\ No newline at end of file