|
[ |
|
{ |
|
"id": 1, |
|
"question": "Ben Milo is <img>image_1</img>\n In the image: <img>image_2</img>\n Identify Ben Milo with grounding.", |
|
"prediction": "<ref>Ben Milo</ref><box>(642,219),(964,995)</box>" |
|
}, |
|
{ |
|
"id": 2, |
|
"question": "Caption Mitch is <img>image_1</img>\n In the image: <img>image_2</img>\n What is Caption Mitch doing?", |
|
"prediction": "Caption Mitch is standing with his arms crossed." |
|
}, |
|
{ |
|
"id": 3, |
|
"question": "Caption Mitch is <img>image_1</img>\n Vern is <img>image_2</img>\n In the image: <img>image_3</img>\n Give a description.", |
|
"prediction": "Vern, on the left, is holding the reins of a horse and facing Mitch, who is partially obscured behind a horse's head. Both appear to be in a military camp, surrounded by rocky terrain and other soldiers." |
|
}, |
|
{ |
|
"id": 4, |
|
"question": "Caption Mitch is <img>image_1</img>\n Gen. Dostum is <img>image_2</img>\n In the image: <img>image_3</img>\n Who is holding an interphone?", |
|
"prediction": "Gen. Dostum is holding an interphone." |
|
}, |
|
{ |
|
"id": 5, |
|
"question": "Hal Spencer is <img>image_1</img>\n In the image: <img>image_2</img>\n How is his state?", |
|
"prediction": "Hal Spencer is lying on the ground, seemingly injured or resting." |
|
}, |
|
{ |
|
"id": 6, |
|
"question": "Vern is <img>image_1</img>\n In the image: <img>image_2</img>\n What is Vern doing?", |
|
"prediction": "Vern is aiming a rifle while crouched down on rocky terrain." |
|
}, |
|
{ |
|
"id": 7, |
|
"question": "Kyle is <img>image_1</img>\n Adam is <img>image_2</img>\n In the image: <img>image_3</img>\n What is Kyle's state?", |
|
"prediction": "Kyle is in a conversation with Adam." |
|
}, |
|
{ |
|
"id": 8, |
|
"question": "Diane is <img>image_1</img>\n In the image: <img>image_2</img>\n Identify Diane with grounding.", |
|
"prediction": "<ref>Diane</ref><box>(10,0),(429,984)</box>" |
|
}, |
|
{ |
|
"id": 9, |
|
"question": "Adam is <img>image_1</img>\n Diane is <img>image_2</img>\n Richard is <img>image_3</img>\n In the image: <img>image_4</img>\n Identify Richard with grounding.", |
|
"prediction": "<ref>Richard</ref><box>(0,205),(341,979)</box>" |
|
}, |
|
{ |
|
"id": 10, |
|
"question": "Alan is <img>image_1</img>\n Mitch is <img>image_2</img>\n Please describe the image: <img>image_3</img>\n", |
|
"prediction": "Alan is seated on the left, holding a bowl of chips, while Mitch is seated on the right, both in a medical setting with an IV and monitoring equipment in the background." |
|
}, |
|
{ |
|
"id": 11, |
|
"question": "Mitch is <img>image_1</img>\n In the image: <img>image_2</img>\n What color is Mitch's clothes?", |
|
"prediction": "Mitch is wearing a beige jacket and blue jeans." |
|
}, |
|
{ |
|
"id": 12, |
|
"question": "Diane is <img>image_1</img>\n Richard is <img>image_2</img>\n In the image: <img>image_3</img>\n What is the spatial relation between Diane and Richard?", |
|
"prediction": "Diane is in front of Richard." |
|
}, |
|
{ |
|
"id": 13, |
|
"question": "Jackson is <img>image_1</img>\n Lilly is <img>image_2</img>\n Noah is <img>image_3</img>\n Please describe the photo: <img>image_4</img>\n", |
|
"prediction": "Lilly stands between a man and a boy, both facing a soldier in a camouflaged uniform. The man, Jackson, holds her hand, and Noah stands by his side looking at the soldier. They appear to be in a military operation or an area with smoke in the background." |
|
}, |
|
{ |
|
"id": 14, |
|
"question": "Kate is <img>image_1</img>\n Lilly is <img>image_2</img>\n In the image: <img>image_3</img>\n What is Kate doing?", |
|
"prediction": "Kate is sitting in a car with her arm around Lilly." |
|
}, |
|
{ |
|
"id": 15, |
|
"question": "Jackson is <img>image_1</img>\n Gordon is <img>image_2</img>\n In the image: <img>image_3</img>\n Identify Gordon with grounding.", |
|
"prediction": "<ref>Gordon</ref><box>(503,125),(910,996)</box>" |
|
}, |
|
{ |
|
"id": 16, |
|
"question": "Kate is <img>image_1</img>\n Noah is <img>image_2</img>\n In the image: <img>image_3</img>\n From our view, which side of Kate is Noah at?", |
|
"prediction": "Noah is on the right side of Kate." |
|
}, |
|
{ |
|
"id": 17, |
|
"question": "Jackson is <img>image_1</img>\n In the image: <img>image_2</img>\n Identify Jackson with grounding.", |
|
"prediction": "<ref>Jackson</ref><box>(421,104),(735,956)</box>" |
|
}, |
|
{ |
|
"id": 18, |
|
"question": "Dukchoon is <img>image_1</img>\n Kim is <img>image_2</img>\n In the image: <img>image_3</img>\n Please give a description.", |
|
"prediction": "Dukchoon is kneeling beside Kim, who is also kneeling, wearing a firefighter's uniform. They appear to be in a sandy area with no structures visible." |
|
}, |
|
{ |
|
"id": 19, |
|
"question": "Kim is <img>image_1</img>\n In the image: <img>image_2</img>\n Identify Kim with grounding", |
|
"prediction": "<ref>Kim</ref><box>(199,226),(493,996)</box>" |
|
}, |
|
{ |
|
"id": 20, |
|
"question": "Kim is <img>image_1</img>\n Kangrim is <img>image_2</img>\n In the image: <img>image_3</img>\n Who is pushing the bamboo raft nearby?", |
|
"prediction": "Kim is pushing the bamboo raft." |
|
}, |
|
{ |
|
"id": 21, |
|
"question": "Dukchoon is <img>image_1</img>\n In the image: <img>image_2</img>\n What is Dukchoon's expression?", |
|
"prediction": "Dukchoon looks surprised or inquisitive." |
|
}, |
|
{ |
|
"id": 22, |
|
"question": "Ron is <img>image_1</img>\n Brian is <img>image_2</img>\n Champ is <img>image_3</img>\n In the image: <img>image_4</img>\n Who is driving the car?", |
|
"prediction": "Ron is driving the car." |
|
}, |
|
{ |
|
"id": 23, |
|
"question": "Brian is <img>image_1</img>\n In the image: <img>image_2</img>\n Identify Brian with grounding.", |
|
"prediction": "<ref>Brian</ref><box>(645,309),(978,995)</box>" |
|
}, |
|
{ |
|
"id": 24, |
|
"question": "Ron is <img>image_1</img>\n Brick is <img>image_2</img>\n Explain the content of this image: <img>image_3</img>\n", |
|
"prediction": "Ron is sitting on the left, holding a can, and gesturing with his right hand. Brick is sitting on the right, wearing a patterned jacket. They appear to be in a room with blinds on the window behind them." |
|
}, |
|
{ |
|
"id": 25, |
|
"question": "Veronica is <img>image_1</img>\n In the image: <img>image_2</img>\n Identify Veronica with grounding.", |
|
"prediction": "<ref>Veronica</ref><box>(15,175),(303,995)</box>" |
|
}, |
|
{ |
|
"id": 26, |
|
"question": "Ron is <img>image_1</img>\n In the image: <img>image_2</img>\n What is Ron doing?", |
|
"prediction": "Ron is sitting on a chair and interacting with a young boy." |
|
}, |
|
{ |
|
"id": 27, |
|
"question": "Ron is <img>image_1</img>\n Veronica is <img>image_2</img>\n In the image: <img>image_3</img>\n Describe the image.", |
|
"prediction": "Veronica, wearing a yellow coat and pink hat, stands to the left with her arm extended towards a young boy, Ron, who is standing to her right. Both are facing forward, with a sandy beach and greenery in the background." |
|
}, |
|
{ |
|
"id": 28, |
|
"question": "Bill is <img>image_1</img>\n Barbara is <img>image_2</img>\n Violet is <img>image_3</img>\n In the image: <img>image_4</img>\n Who is sitting at the middle of the table?", |
|
"prediction": "Bill is sitting at the middle of the table." |
|
}, |
|
{ |
|
"id": 29, |
|
"question": "Barbara is <img>image_1</img>\n Violet is <img>image_2</img>\n Mattie is <img>image_3</img>\n Explain the content of the image: <img>image_4</img>\n", |
|
"prediction": "Barbara stands holding papers, facing away from the camera. Violet sits to the right, looking at papers. Mattie sits to the left, also looking at papers. They appear to be in a discussion in an ornately decorated room." |
|
}, |
|
{ |
|
"id": 30, |
|
"question": "Barbara is <img>image_1</img>\n In the image: <img>image_2</img>\n Identify Barbara with grounding.", |
|
"prediction": "<ref>Barbara</ref><box>(660,86),(929,968)</box>" |
|
}, |
|
{ |
|
"id": 31, |
|
"question": "Barbara is <img>image_1</img>\n Mattie is <img>image_2</img>\n In the image: <img>image_3</img>\n What is Mattie doing?", |
|
"prediction": "Mattie is sitting at a table with a glass of wine." |
|
}, |
|
{ |
|
"id": 32, |
|
"question": "Bill is <img>image_1</img>\n Charlie is <img>image_2</img>\n Barbara is <img>image_3</img>\n In the image: <img>image_4</img>\n Identify Bill with grounding.", |
|
"prediction": "<ref>Bill</ref><box>(0,20),(357,981)</box>" |
|
}, |
|
{ |
|
"id": 33, |
|
"question": "Lynn is <img>image_1</img>\n Lynn's father is <img>image_2</img>\n In the image: <img>image_3</img>\n Identify Lynn's father with grounding.", |
|
"prediction": "<ref>Lynn's father</ref><box>(465,75),(732,736)</box>" |
|
}, |
|
{ |
|
"id": 34, |
|
"question": "Grace is <img>image_1</img>\n In the image: <img>image_2</img>\n Describe Grace's state.", |
|
"prediction": "Grace is in a school uniform." |
|
}, |
|
{ |
|
"id": 35, |
|
"question": "Bank is <img>image_1</img>\n Lynn is <img>image_2</img>\n In the image: <img>image_3</img>\n Give a description.", |
|
"prediction": "Bank stands on the left, wearing a white shirt with a black tie and carrying a bag, while Lynn is on the right, also in a white shirt with a black tie, both facing forward. They appear to be in a room with wooden furnishings and a mirror reflecting another person." |
|
}, |
|
{ |
|
"id": 36, |
|
"question": "Lynn is <img>image_1</img>\n Grace is <img>image_2</img>\n In the image: <img>image_3</img>\n Identify Lynn with grounding.", |
|
"prediction": "<ref>Lynn</ref><box>(439,44),(867,981)</box>" |
|
}, |
|
{ |
|
"id": 37, |
|
"question": "Tong is <img>image_1</img>\n In the image: <img>image_2</img>\n What color is Tong's clothes?", |
|
"prediction": "Tong is wearing a blue shirt." |
|
}, |
|
{ |
|
"id": 38, |
|
"question": "Grace is <img>image_1</img>\n Pat is <img>image_2</img>\n Please describe the image: <img>image_3</img>\n", |
|
"prediction": "Grace is sitting on a table looking away, wearing a pink shirt. Pat is reclining next to her with his head resting on a arm, wearing a blue shirt. They appear to be in a room with various equipment." |
|
}, |
|
{ |
|
"id": 39, |
|
"question": "Scott is <img>image_1</img>\n Elizabeth is <img>image_2</img>\n In the image: <img>image_3</img>\n What does Scott wear?", |
|
"prediction": "Scott wears a beige jacket with a checked tie." |
|
}, |
|
{ |
|
"id": 40, |
|
"question": "Amy is <img>image_1</img>\n Lynn is <img>image_2</img>\n In the image: <img>image_3</img>\n Identify Amy with grounding.", |
|
"prediction": "<ref>Amy</ref><box>(112,36),(525,948)</box>" |
|
}, |
|
{ |
|
"id": 41, |
|
"question": "Wally is <img>image_1</img>\n In the image: <img>image_2</img>\n Identify Wally with grounding.", |
|
"prediction": "<ref>Wally</ref><box>(149,283),(603,980)</box>" |
|
}, |
|
{ |
|
"id": 42, |
|
"question": "Bei Zhai is <img>image_1</img>\n Shen Lian is <img>image_2</img>\n In the image: <img>image_3</img>\n Describe the visual content.", |
|
"prediction": "Bei Zhai stands to the left, holding an umbrella, dressed in traditional attire. Shen Lian is on the right, also in traditional clothing, facing her. They appear to be in a bamboo forest." |
|
}, |
|
{ |
|
"id": 43, |
|
"question": "Shen lian is <img>image_1</img>\n Lu Wenzhao is <img>image_2</img>\n In the image: <img>image_3</img>\n What is Lu Wenzhao doing?", |
|
"prediction": "Lu Wenzhao is placing his hand on Shen lian's shoulder." |
|
}, |
|
{ |
|
"id": 44, |
|
"question": "Bei Zhai is <img>image_1</img>\n Shen Lian is <img>image_2</img>\n In the image: <img>image_3</img>\n Describe the state of Bei Zhai.", |
|
"prediction": "Bei Zhai is sitting and looking downwards." |
|
}, |
|
{ |
|
"id": 45, |
|
"question": "Bei Zhai is <img>image_1</img>\n Shen Lian is <img>image_2</img>\n In the image: <img>image_3</img>\n Identify Shen Lian with grounding.", |
|
"prediction": "<ref>Shen Lian</ref><box>(713,31),(913,987)</box>" |
|
}, |
|
{ |
|
"id": 46, |
|
"question": "Bei Zhai is <img>image_1</img>\n In the image: <img>image_2</img>\n Identify Bei Zhai with grounding.", |
|
"prediction": "<ref>Bei Zhai</ref><box>(460,219),(757,981)</box>" |
|
}, |
|
{ |
|
"id": 47, |
|
"question": "Lu Wenzhao is <img>image_1</img>\n Ding Baiying is <img>image_2</img>\n Describe the image: <img>image_3</img>\n", |
|
"prediction": "Lu Wenzhao is standing with a sword in hand, looking to the side. Ding Baiying is behind him, holding onto her shoulder. They are surrounded by fallen soldiers in a battle-torn area." |
|
}, |
|
{ |
|
"id": 48, |
|
"question": "Haskell is <img>image_1</img>\n In the image: <img>image_2</img>\n What is he doing?", |
|
"prediction": "He is sitting at a dining table." |
|
}, |
|
{ |
|
"id": 49, |
|
"question": "Molyneux is <img>image_1</img>\n In the image: <img>image_2</img>\n Describe the content.", |
|
"prediction": "Molyneux is seated on the left side of a car, wearing a dark suit and tie, while another passenger is visible on the right side. They appear to be engaged in a conversation or looking forward, inside a vehicle with visible steering wheel and windows." |
|
}, |
|
{ |
|
"id": 50, |
|
"question": "Henry Goose is <img>image_1</img>\n Native Woman is <img>image_2</img>\n In the image: <img>image_3</img>\n Identify Henry Goose with grounding.", |
|
"prediction": "<ref>Henry Goose</ref><box>(109,0),(539,977)</box>" |
|
}, |
|
{ |
|
"id": 51, |
|
"question": "Molyneux is <img>image_1</img>\n In the image: <img>image_2</img>\n Describe the state of Molyneux.", |
|
"prediction": "Molyneux is seated and appears to be drinking wine." |
|
}, |
|
{ |
|
"id": 52, |
|
"question": "Mr. Griffith is <img>image_1</img>\n Mrs. Griffith is <img>image_2</img>\n In the image: <img>image_3</img>\n What is Mr. Griffith doing?", |
|
"prediction": "Mr. Griffith is sitting and looking at papers." |
|
}, |
|
{ |
|
"id": 53, |
|
"question": "Gibbons is <img>image_1</img>\n Describe the image: <img>image_2</img>\n", |
|
"prediction": "Gibbons, an elderly man in a suit, is dancing with a young woman in a red and black outfit. They are in a gymnasium with other people around them, including cheerleaders and basketball players." |
|
}, |
|
{ |
|
"id": 54, |
|
"question": "Micah is <img>image_1</img>\n In the image: <img>image_2</img>\n Describe the image.", |
|
"prediction": "Two men are sitting next to each other; one is playing the acoustic guitar while the other is holding a harmonica. They are outdoors, possibly on a bench or a similar low seating surface." |
|
}, |
|
{ |
|
"id": 55, |
|
"question": "Rhiannon is <img>image_1</img>\n In the image: <img>image_2</img>\n Identify Rhiannon with grounding.", |
|
"prediction": "<ref>Rhiannon</ref><box>(25,125),(410,990)</box>" |
|
}, |
|
{ |
|
"id": 56, |
|
"question": "Olive is <img>image_1</img>\n Rhiannon is <img>image_2</img>\n In the image: <img>image_3</img>\n Who is carrying a handbag?", |
|
"prediction": "Olive is carrying a handbag." |
|
}, |
|
{ |
|
"id": 57, |
|
"question": "Brandon is <img>image_1</img>\n In the image: <img>image_2</img>\n Identify Brandon with grounding.", |
|
"prediction": "<ref>Brandon</ref><box>(485,30),(767,981)</box>" |
|
}, |
|
{ |
|
"id": 58, |
|
"question": "Walt is <img>image_1</img>\n Sue is <img>image_2</img>\n In the image: <img>image_3</img>\n Explain the content.", |
|
"prediction": "Walt, an elderly man, stands on a porch with a woman, Sue, to his left, gesturing towards him with her arm raised. Both are in front of a house." |
|
}, |
|
{ |
|
"id": 59, |
|
"question": "Karen is <img>image_1</img>\n Mitch is <img>image_2</img>\n In the image: <img>image_3</img>\n Identify Karen with grounding.", |
|
"prediction": "<ref>Karen</ref><box>(566,125),(966,985)</box>" |
|
}, |
|
{ |
|
"id": 60, |
|
"question": "Walt is <img>image_1</img>\n Thao is <img>image_2</img>\n In the image: <img>image_3</img>\n Please reason out what role of Thao is in this scene.", |
|
"prediction": "Thao is standing across the table from Walt, facing each other." |
|
}, |
|
{ |
|
"id": 61, |
|
"question": "Mitch is <img>image_1</img>\n Walt is <img>image_2</img>\n In the image: <img>image_3</img>\n What color is Walt's clothes?", |
|
"prediction": "Walt is wearing a striped shirt." |
|
}, |
|
{ |
|
"id": 62, |
|
"question": "Thao is <img>image_1</img>\n Sue is <img>image_2</img>\n In the image: <img>image_3</img>\n Identify Sue with grounding.", |
|
"prediction": "<ref>Sue</ref><box>(714,106),(998,985)</box>" |
|
}, |
|
{ |
|
"id": 63, |
|
"question": "Harry is <img>image_1</img>\n Hermione is <img>image_2</img>\n In the image: <img>image_3</img>\n Give a description.", |
|
"prediction": "Harry stands in the center wearing a blue shirt, while Hermione is to his left, partially behind him. They appear to be in a dimly lit, rustic room." |
|
}, |
|
{ |
|
"id": 64, |
|
"question": "Hermione is <img>image_1</img>\n Ron is <img>image_2</img>\n In the image: <img>image_3</img>\n What is the spatial relation between Hermione and Ron?", |
|
"prediction": "Hermione is standing to the right of Ron." |
|
}, |
|
{ |
|
"id": 65, |
|
"question": "Harry is <img>image_1</img>\n Albus is <img>image_2</img>\n In the image: <img>image_3</img>\n Identify Albus with grounding.", |
|
"prediction": "<ref>Albus</ref><box>(582,38),(829,986)</box>" |
|
}, |
|
{ |
|
"id": 66, |
|
"question": "Hermione is <img>image_1</img>\n Harry is <img>image_2</img>\n In the image: <img>image_3</img>\n Identify Hermione with grounding.", |
|
"prediction": "<ref>Hermione</ref><box>(307,11),(757,983)</box>" |
|
}, |
|
{ |
|
"id": 67, |
|
"question": "Ron is <img>image_1</img>\n In the image: <img>image_2</img>\n Identify Ron with grounding.", |
|
"prediction": "<ref>Ron</ref><box>(6,166),(275,988)</box>" |
|
}, |
|
{ |
|
"id": 68, |
|
"question": "Ariadne is <img>image_1</img>\n Mal is <img>image_2</img>\n In the image: <img>image_3</img>\n Identify Mal with grounding.", |
|
"prediction": "<ref>Mal</ref><box>(710,22),(899,981)</box>" |
|
}, |
|
{ |
|
"id": 69, |
|
"question": "Eames is <img>image_1</img>\n Cobb is <img>image_2</img>\n In the image: <img>image_3</img>\n Identify Cobb with grounding.", |
|
"prediction": "<ref>Cobb</ref><box>(649,90),(877,988)</box>" |
|
}, |
|
{ |
|
"id": 70, |
|
"question": "Ariadne is <img>image_1</img>\n Yusuf is <img>image_2</img>\n In the image: <img>image_3</img>\n Please describe the content.", |
|
"prediction": "Ariadne is reclining on a chair with her arm resting on a table, facing towards the right. Yusuf is also reclined on a chair with his arm extended along the backrest, facing towards the left. Both appear to be in a relaxed posture." |
|
}, |
|
{ |
|
"id": 71, |
|
"question": "Ariadne is <img>image_1</img>\n In the image: <img>image_2</img>\n What is she doing?", |
|
"prediction": "Ariadne is walking and looking at something or someone to her right." |
|
}, |
|
{ |
|
"id": 72, |
|
"question": "Cobb is <img>image_1</img>\n Ariadne is <img>image_2</img>\n In the image: <img>image_3</img>\n Who is walking in front?", |
|
"prediction": "Cobb is walking in front." |
|
}, |
|
{ |
|
"id": 73, |
|
"question": "Cobb is <img>image_1</img>\n Saito is <img>image_2</img>\n In the image: <img>image_3</img>\n Give a description.", |
|
"prediction": "Cobb is seated on the left side of a train, dressed in a suit, with his left arm resting on the back of the seat. Saito is seated on the right side, also in a suit, facing towards Cobb. They appear to be in conversation." |
|
}, |
|
{ |
|
"id": 74, |
|
"question": "Tony is <img>image_1</img>\n Pepper is <img>image_2</img>\n Natalie is <img>image_3</img>\n In the image: <img>image_4</img>\n Who is the person standing?", |
|
"prediction": "Pepper Potts is the person standing." |
|
}, |
|
{ |
|
"id": 75, |
|
"question": "Agent is <img>image_1</img>\n Justin is <img>image_2</img>\n Please provide an overview of the visual information in this image: <img>image_3</img>\n", |
|
"prediction": "Agent is standing on the right, wearing a suit and holding a case, while Justin is on the left, also in a suit, facing Agent. They appear to be in a factory setting." |
|
}, |
|
{ |
|
"id": 76, |
|
"question": "Nick is <img>image_1</img>\n Tony is <img>image_2</img>\n In the image: <img>image_3</img>\n Identify Nick with grounding.", |
|
"prediction": "<ref>Nick</ref><box>(273,26),(579,868)</box>" |
|
}, |
|
{ |
|
"id": 77, |
|
"question": "Tony is <img>image_1</img>\n Justin is <img>image_2</img>\n In the image: <img>image_3</img>\n Identify Justin with grounding.", |
|
"prediction": "<ref>Justin</ref><box>(462,106),(692,988)</box>" |
|
}, |
|
{ |
|
"id": 78, |
|
"question": "Pepper is <img>image_1</img>\n Natalie is <img>image_2</img>\n In the image: <img>image_3</img>\n Whose clothes color is gray?", |
|
"prediction": "Pepper's clothes are gray." |
|
}, |
|
{ |
|
"id": 79, |
|
"question": "Tony is <img>image_1</img>\n In the image: <img>image_2</img>\n Give a description.", |
|
"prediction": "Tony, wearing a pinstriped suit and striped tie, is seated at a table with his hands clasped, attentively looking forward. Behind him is a crowded room with various attendees, some in military uniform." |
|
}, |
|
{ |
|
"id": 80, |
|
"question": "Mrs. Fairfax is <img>image_1</img>\n Jane is <img>image_2</img>\n In the image: <img>image_3</img>\n What color is Jane's dress?", |
|
"prediction": "Jane's dress is blue." |
|
}, |
|
{ |
|
"id": 81, |
|
"question": "Rochester is <img>image_1</img>\n Jane is <img>image_2</img>\n In the image: <img>image_3</img>\n Describe Rochester's clothes.", |
|
"prediction": "Rochester is wearing a brown coat, white shirt, and black vest." |
|
}, |
|
{ |
|
"id": 82, |
|
"question": "Jane is <img>image_1</img>\n Varens is <img>image_2</img>\n In the image: <img>image_3</img>\n Identify Varens with grounding.", |
|
"prediction": "<ref>Varens</ref><box>(592,175),(928,995)</box>" |
|
}, |
|
{ |
|
"id": 83, |
|
"question": "Jane is <img>image_1</img>\n Mrs. Fairfax is <img>image_2</img>\n In the image: <img>image_3</img>\n Identify Mrs. Fairfax with grounding.", |
|
"prediction": "<ref>Mrs. Fairfax</ref><box>(575,109),(998,994)</box>" |
|
}, |
|
{ |
|
"id": 84, |
|
"question": "Bai Letian is <img>image_1</img>\n Kukai is <img>image_2</img>\n In the image: <img>image_3</img>\n Give a description.", |
|
"prediction": "Bai Letian is seated on the left, wearing a brown robe, while Kukai is on the right, clad in a blue robe with a yellow belt, holding a wooden tablet. They are sitting against a brick wall, with what appears to be a basket of fruit between them." |
|
}, |
|
{ |
|
"id": 85, |
|
"question": "Bai Letian is <img>image_1</img>\n Kukai is <img>image_2</img>\n In the image: <img>image_3</img>\n Identify Bai Letian with grounding.", |
|
"prediction": "<ref>Bai Letian</ref><box>(503,211),(729,1022)</box>" |
|
}, |
|
{ |
|
"id": 86, |
|
"question": "Bai Letian is <img>image_1</img>\n Kukai is <img>image_2</img>\n In the image: <img>image_3</img>\n Please provide an overview of the visual information.", |
|
"prediction": "Bai Letian is seated on the left side of a wooden table, facing slightly right, while Kukai is seated on the right side, both with bowls in front of them. A standing man is in the center, appearing to be serving food." |
|
}, |
|
{ |
|
"id": 87, |
|
"question": "Gennady is <img>image_1</img>\n Eddie is <img>image_2</img>\n In the image: <img>image_3</img>\n Please provide an image caption.", |
|
"prediction": "Gennady is seated on the right side of a bench, holding a brown bag, while Eddie is seated to his left, both in a park setting." |
|
}, |
|
{ |
|
"id": 88, |
|
"question": "Eddie is <img>image_1</img>\n In the image: <img>image_2</img>\n Identify Eddie with grounding.", |
|
"prediction": "<ref>Eddie</ref><box>(582,166),(935,996)</box>" |
|
}, |
|
{ |
|
"id": 89, |
|
"question": "Lindy is <img>image_1</img>\n Eddie is <img>image_2</img>\n In the image: <img>image_3</img>\n Give a description.", |
|
"prediction": "Lindy is holding a newspaper with the headline \" Poll Vault \" and standing on the left, while Eddie is on the right, wearing a black leather jacket. They appear to be on a street with a man in the background looking at a newspaper stand." |
|
}, |
|
{ |
|
"id": 90, |
|
"question": "Gennady is <img>image_1</img>\n In the image: <img>image_2</img>\n What is Gennady doing?", |
|
"prediction": "Gennady is standing and looking to his right." |
|
}, |
|
{ |
|
"id": 91, |
|
"question": "Eddie is <img>image_1</img>\n Carl is <img>image_2</img>\n In the image: <img>image_3</img>\n Identify Carl with grounding.", |
|
"prediction": "<ref>Carl</ref><box>(63,219),(300,995)</box>" |
|
}, |
|
{ |
|
"id": 92, |
|
"question": "Old Joe is <img>image_1</img>\n Joe is <img>image_2</img>\n In the image: <img>image_3</img>\n Who is on the left side of the table?", |
|
"prediction": "Old Joe is on the left side of the table." |
|
}, |
|
{ |
|
"id": 93, |
|
"question": "Sara is <img>image_1</img>\n Cid is <img>image_2</img>\n In the image: <img>image_3</img>\n Identify Cid with grounding.", |
|
"prediction": "<ref>Cid</ref><box>(264,406),(535,994)</box>" |
|
}, |
|
{ |
|
"id": 94, |
|
"question": "Ye Jin is <img>image_1</img>\n Vivian is <img>image_2</img>\n In the image: <img>image_3</img>\n Who just got out of the car?", |
|
"prediction": "Ye Jin just got out of the car." |
|
}, |
|
{ |
|
"id": 95, |
|
"question": "Vivian is <img>image_1</img>\n Ye Jin is <img>image_2</img>\n In the image: <img>image_3</img>\n What does Vivian wear?", |
|
"prediction": "Vivian wears a green skirt and a white blouse." |
|
}, |
|
{ |
|
"id": 96, |
|
"question": "Vivian is <img>image_1</img>\n Ye Jin is <img>image_2</img>\n In the image: <img>image_3</img>\n Identify Vivian with grounding.", |
|
"prediction": "<ref>Vivian</ref><box>(416,175),(697,994)</box>" |
|
}, |
|
{ |
|
"id": 97, |
|
"question": "Vivian is <img>image_1</img>\n In the image: <img>image_2</img>\n What is Vivian doing?", |
|
"prediction": "Vivian is holding up a phone." |
|
}, |
|
{ |
|
"id": 98, |
|
"question": "Ye Jin is <img>image_1</img>\n Please describe the image: <img>image_2</img>\n", |
|
"prediction": "Ye Jin, wearing a white blazer, is walking away from the camera towards the right side of the image in a modern, brightly lit living room. A man in a grey suit stands behind her, holding a bouquet of flowers." |
|
}, |
|
{ |
|
"id": 99, |
|
"question": "Boris' Girlfriend is <img>image_1</img>\n Boris is <img>image_2</img>\n In the image: <img>image_3</img>\n Who is carrying the cake?", |
|
"prediction": "Boris' girlfriend is carrying the cake." |
|
}, |
|
{ |
|
"id": 100, |
|
"question": "Agent K is <img>image_1</img>\n Agent J is <img>image_2</img>\n In the image: <img>image_3</img>\n Identify Agent K with grounding.", |
|
"prediction": "<ref>Agent K</ref><box>(583,100),(969,705)</box>" |
|
}, |
|
{ |
|
"id": 101, |
|
"question": "Agent J is <img>image_1</img>\n Agent O is <img>image_2</img>\n In the image: <img>image_3</img>\n What is Agent O doing?", |
|
"prediction": "Agent O is standing and facing Agent J." |
|
}, |
|
{ |
|
"id": 102, |
|
"question": "Young Agent K is <img>image_1</img>\n Young Agent O is <img>image_2</img>\n In the image: <img>image_3</img>\n Give a description.", |
|
"prediction": "Young Agent K is seated on the left, facing slightly right, wearing a black suit. Young Agent O stands on the right, holding a clipboard, dressed in a black dress with a white collar. They appear to be in a busy office setting." |
|
}, |
|
{ |
|
"id": 103, |
|
"question": "Young Agent K is <img>image_1</img>\n Agent J is <img>image_2</img>\n In the image: <img>image_3</img>\n Identify Agent J with grounding.", |
|
"prediction": "<ref>Agent J</ref><box>(648,58),(899,980)</box>" |
|
}, |
|
{ |
|
"id": 104, |
|
"question": "Agent J is <img>image_1</img>\n Young Agent K is <img>image_2</img>\n Griffin is <img>image_3</img>\n In the image: <img>image_4</img>\n Please provide a description.", |
|
"prediction": "Agent J stands on the left, facing Young Agent K who is on the right. Griffin, in the center, is handing something to Agent J. They are in a room with other people, some in the background and one close to the camera." |
|
}, |
|
{ |
|
"id": 105, |
|
"question": "Boris is <img>image_1</img>\n Griffin is <img>image_2</img>\n In the image: <img>image_3</img>\n Identify Griffin with grounding.", |
|
"prediction": "<ref>Griffin</ref><box>(532,236),(984,988)</box>" |
|
}, |
|
{ |
|
"id": 106, |
|
"question": "Billy Beane is <img>image_1</img>\n In the image: <img>image_2</img>\n Identify Billy Beane with grounding.", |
|
"prediction": "<ref>Billy Beane</ref><box>(476,45),(848,939)</box>" |
|
}, |
|
{ |
|
"id": 107, |
|
"question": "Peter Brand is <img>image_1</img>\n In the image: <img>image_2</img>\n Identify Peter Brand with grounding.", |
|
"prediction": "<ref>Peter Brand</ref><box>(10,43),(635,986)</box>" |
|
}, |
|
{ |
|
"id": 108, |
|
"question": "Billy is <img>image_1</img>\n Peter is <img>image_2</img>\n In the image: <img>image_3</img>\n Please give a description.", |
|
"prediction": "Billy is seated at a desk, talking on the phone, while Peter is sitting across, appearing to be in a conversation or thinking. They are in a room with various items, including a computer, books, and papers." |
|
}, |
|
{ |
|
"id": 109, |
|
"question": "Sharp is <img>image_1</img>\n Scout is <img>image_2</img>\n In the image: <img>image_3</img>\n Identify Scout with grounding.", |
|
"prediction": "<ref>Scout</ref><box>(539,172),(798,761)</box>" |
|
}, |
|
{ |
|
"id": 110, |
|
"question": "Sam is <img>image_1</img>\n Suzy is <img>image_2</img>\n Please describe the image: <img>image_3</img>\n", |
|
"prediction": "Sam is sitting on the ground outside, wearing a yellow scout uniform and holding a frying pan, while Suzy is sitting on the left, partially visible and holding a camera. There's a tent and various items in the background." |
|
}, |
|
{ |
|
"id": 111, |
|
"question": "Suzy is <img>image_1</img>\n Sam is <img>image_2</img>\n In the image: <img>image_3</img>\n Describe Suzy's state.", |
|
"prediction": "Suzy is sitting and looking at something in her hands." |
|
}, |
|
{ |
|
"id": 112, |
|
"question": "Sharp is <img>image_1</img>\n Scout is <img>image_2</img>\n In the image: <img>image_3</img>\n Identify Sharp with grounding.", |
|
"prediction": "<ref>Sharp</ref><box>(665,79),(928,988)</box>" |
|
}, |
|
{ |
|
"id": 113, |
|
"question": "Sam is <img>image_1</img>\n Suzy is <img>image_2</img>\n In the image: <img>image_3</img>\n Identify Suzy with grounding.", |
|
"prediction": "<ref>Suzy</ref><box>(133,248),(402,989)</box>" |
|
}, |
|
{ |
|
"id": 114, |
|
"question": "Sam is <img>image_1</img>\n Suzy is <img>image_2</img>\n In the image: <img>image_3</img>\n Describe the visual content.", |
|
"prediction": "Sam is seated at a table, looking forward with hands clasped, while Suzy is sitting next to him, also looking forward with hands near her chin. They appear to be in a room with a wooden interior and large windows." |
|
}, |
|
{ |
|
"id": 115, |
|
"question": "Sharp is <img>image_1</img>\n Scout is <img>image_2</img>\n In the image: <img>image_3</img>\n What is Sharp doing?", |
|
"prediction": "Sharp is wiping his face with his hand." |
|
}, |
|
{ |
|
"id": 116, |
|
"question": "Social Services is <img>image_1</img>\n Scout is <img>image_2</img>\n Sharp is <img>image_3</img>\n In the image: <img>image_4</img>\n Give a description.", |
|
"prediction": "Social Services, wearing a blue uniform, is gesturing with her hand while holding a book. Scout, in a brown uniform, stands with his hands by his sides. Sharp, partially visible on the right, appears to be in a conversation. Other individuals are present in the background." |
|
}, |
|
{ |
|
"id": 117, |
|
"question": "Chigusa is <img>image_1</img>\n Shimada is <img>image_2</img>\n Kawai is <img>image_3</img>\n In the image: <img>image_4</img>\n Please give a description.", |
|
"prediction": "Chigusa is seated on the left, wearing a white blouse with a red tie, looking towards the right. Shimada is seated in the center, also in a white blouse with a red tie, holding an object and looking downwards. Kawai is seated on the right, in a white shirt and dark pants, leaning forward with hands on his thighs." |
|
}, |
|
{ |
|
"id": 118, |
|
"question": "Shimada is <img>image_1</img>\n Chigusa is <img>image_2</img>\n In the image: <img>image_3</img>\n Identify Chigusa with grounding.", |
|
"prediction": "<ref>Chigusa</ref><box>(396,205),(600,996)</box>" |
|
}, |
|
{ |
|
"id": 119, |
|
"question": "Chigusa is <img>image_1</img>\n In the image: <img>image_2</img>\n What is her emotion?", |
|
"prediction": "Chigusa appears to be distressed or in distress." |
|
}, |
|
{ |
|
"id": 120, |
|
"question": "Kosaku is <img>image_1</img>\n Shimada is <img>image_2</img>\n For the image: <img>image_3</img>\n Give a description.", |
|
"prediction": "Kosaku stands to the right, extending a water bottle towards Shimada, who is seated to the left on a red bench in a dimly lit waiting area." |
|
}, |
|
{ |
|
"id": 121, |
|
"question": "Kosuke is <img>image_1</img>\n Sachiko is <img>image_2</img>\n In the image: <img>image_3</img>\n Identify Sachiko with grounding.", |
|
"prediction": "<ref>Sachiko</ref><box>(550,566),(759,994)</box>" |
|
}, |
|
{ |
|
"id": 122, |
|
"question": "Chigusa is <img>image_1</img>\n Kosuke is <img>image_2</img>\n Shimada is <img>image_3</img>\n In the image: <img>image_4</img>\n Who is raising hand?", |
|
"prediction": "Shimada is raising hand." |
|
}, |
|
{ |
|
"id": 123, |
|
"question": "Sachiko is <img>image_1</img>\n In the image: <img>image_2</img>\n Identify Sachiko with grounding.", |
|
"prediction": "<ref>Sachiko</ref><box>(582,151),(840,996)</box>" |
|
}, |
|
{ |
|
"id": 124, |
|
"question": "Chigusa is <img>image_1</img>\n Shimada is <img>image_2</img>\n In the image: <img>image_3</img>\n What is Shimada doing?", |
|
"prediction": "Shimada is writing in a notebook." |
|
}, |
|
{ |
|
"id": 125, |
|
"question": "Kosaku is <img>image_1</img>\n Shimada is <img>image_2</img>\n In the image: <img>image_3</img>\n Give a description.", |
|
"prediction": "Kosaku, wearing a suit, stands in a crowded train, holding onto a pole. Next to him, Shimada, in a school uniform, looks down, adjusting her tie. Other passengers are visible around them." |
|
}, |
|
{ |
|
"id": 126, |
|
"question": "Kosaku is <img>image_1</img>\n Shimada is <img>image_2</img>\n In the image: <img>image_3</img>\n What is Kosaku doing?", |
|
"prediction": "Kosaku is sitting and reading a book." |
|
}, |
|
{ |
|
"id": 127, |
|
"question": "Kosaku is <img>image_1</img>\n Shimada is <img>image_2</img>\n Please describe the image: <img>image_3</img>\n", |
|
"prediction": "Kosaku is seated on a bench, looking down at a book, while Shimada stands behind him with her hand on his head, both dressed in school uniforms." |
|
}, |
|
{ |
|
"id": 128, |
|
"question": "Shimada is <img>image_1</img>\n Kosaku is <img>image_2</img>\n In the image: <img>image_3</img>\n Give an image caption.", |
|
"prediction": "Shimada, wearing a school uniform with a white blouse and dark skirt, stands under an umbrella. Kosaku, in a suit, holds the other side of the umbrella. They appear to be on an escalator." |
|
}, |
|
{ |
|
"id": 129, |
|
"question": "Shimada is <img>image_1</img>\n Yusuke is <img>image_2</img>\n In the image: <img>image_3</img>\n Identify Shimada with grounding.", |
|
"prediction": "<ref>Shimada</ref><box>(106,18),(514,981)</box>" |
|
}, |
|
{ |
|
"id": 130, |
|
"question": "Kosaku Ito is <img>image_1</img>\n In the image: <img>image_2</img>\n Identify Kosaku Ito with grounding.", |
|
"prediction": "<ref>Kosaku Ito</ref><box>(46,191),(450,996)</box>" |
|
}, |
|
{ |
|
"id": 131, |
|
"question": "Hibiki Shimada is <img>image_1</img>\n Megumi Chigusa is <img>image_2</img>\n In the image: <img>image_3</img>\n Who is holding a cylinder object?", |
|
"prediction": "Megumi Chigusa is holding a cylinder object." |
|
}, |
|
{ |
|
"id": 132, |
|
"question": "Kosuke is <img>image_1</img>\n Shimada is <img>image_2</img>\n Describe the image: <img>image_3</img>\n", |
|
"prediction": "Kosuke, wearing a black suit with a red flower on the lapel, stands to the left. To his right, Shimada, also in a black suit with a red flower, appears to be waving. They are both in front of cherry blossom trees in bloom." |
|
}, |
|
{ |
|
"id": 133, |
|
"question": "Kosaku Ito is <img>image_1</img>\n Hibiki Shimada is <img>image_2</img>\n In the image: <img>image_3</img>\n Give a description.", |
|
"prediction": "Kosaku Ito stands on the left, facing Hibiki Shimada, who is holding a bouquet of flowers on the right. Both are dressed in school uniforms and are standing outdoors with a car and trees in the background." |
|
}, |
|
{ |
|
"id": 134, |
|
"question": "Emma is <img>image_1</img>\n In the image: <img>image_2</img>\n Identify Emma with grounding.", |
|
"prediction": "<ref>Emma</ref><box>(382,61),(780,988)</box>" |
|
}, |
|
{ |
|
"id": 135, |
|
"question": "Adam is <img>image_1</img>\n Alvin is <img>image_2</img>\n In the image: <img>image_3</img>\n Is Adam standing?", |
|
"prediction": "Yes, Adam is standing." |
|
}, |
|
{ |
|
"id": 136, |
|
"question": "Emma is <img>image_1</img>\n In the image: <img>image_2</img>\n Identify Emma with grounding.", |
|
"prediction": "<ref>Emma</ref><box>(278,226),(495,995)</box>" |
|
}, |
|
{ |
|
"id": 137, |
|
"question": "Adam is <img>image_1</img>\n In the image: <img>image_2</img>\n What is Adam doing?", |
|
"prediction": "Adam is standing and holding his jacket while conversing with others." |
|
}, |
|
{ |
|
"id": 138, |
|
"question": "Emma is <img>image_1</img>\n Adam is <img>image_2</img>\n Please describe the image: <img>image_3</img>\n", |
|
"prediction": "Emma, wearing a white coat with a stethoscope, stands to the left of the image. Adam is lying in a hospital bed to the right, with medical equipment and a IV in the background." |
|
}, |
|
{ |
|
"id": 139, |
|
"question": "Alvin is <img>image_1</img>\n Lucy is <img>image_2</img>\n In the image: <img>image_3</img>\n Give a description.", |
|
"prediction": "Alvin is seated at a dining table, holding a martini glass, engaged in conversation with Lucy, who is sitting across from him with a drink in her hand. They appear to be in a restaurant with other patrons in the background." |
|
}, |
|
{ |
|
"id": 140, |
|
"question": "Gao Jian Xiang is <img>image_1</img>\n Liu Hao is <img>image_2</img>\n In the image: <img>image_3</img>\n Identify Gao Jian Xiang with grounding.", |
|
"prediction": "<ref>Gao Jian Xiang</ref><box>(212,87),(567,916)</box>" |
|
}, |
|
{ |
|
"id": 141, |
|
"question": "Chen is <img>image_1</img>\n Gao is <img>image_2</img>\n In the image: <img>image_3</img>\n Describe the scene.", |
|
"prediction": "Chen, dressed in a white suit, is being forcefully held by Gao, who is in a dark shirt and light pants, in a parking lot with cars and a building in the background." |
|
}, |
|
{ |
|
"id": 142, |
|
"question": "Gao is <img>image_1</img>\n Lin is <img>image_2</img>\n In the image: <img>image_3</img>\n Identify Lin with grounding.", |
|
"prediction": "<ref>Lin</ref><box>(25,83),(332,994)</box>" |
|
}, |
|
{ |
|
"id": 143, |
|
"question": "Chen is <img>image_1</img>\n Gao is <img>image_2</img>\n In the image: <img>image_3</img>\n What is the expression of Chen?", |
|
"prediction": "Chen looks surprised or in disbelief." |
|
}, |
|
{ |
|
"id": 144, |
|
"question": "Jack is <img>image_1</img>\n Gibbs is <img>image_2</img>\n In the image: <img>image_3</img>\n Identify Jack with grounding.", |
|
"prediction": "<ref>Jack</ref><box>(184,76),(535,992)</box>" |
|
}, |
|
{ |
|
"id": 145, |
|
"question": "Jack Sparrow is <img>image_1</img>\n In the image: <img>image_2</img>\n Identify Jack with grounding.", |
|
"prediction": "<ref>Jack</ref><box>(346,11),(689,984)</box>" |
|
}, |
|
{ |
|
"id": 146, |
|
"question": "Barbossa is <img>image_1</img>\n In the image: <img>image_2</img>\n Identify Barbossa with grounding.", |
|
"prediction": "<ref>Barbossa</ref><box>(610,137),(803,983)</box>" |
|
}, |
|
{ |
|
"id": 147, |
|
"question": "Barbossa is <img>image_1</img>\n In the image: <img>image_2</img>\n Please give a description.", |
|
"prediction": "Barbossa, dressed in a tricorne hat and elaborate coat, stands to the left, while another individual in similar attire stands to the right, both aboard a ship with visible rigging." |
|
}, |
|
{ |
|
"id": 148, |
|
"question": "Angelica is <img>image_1</img>\n Jack is <img>image_2</img>\n Describe the image: <img>image_3</img>\n", |
|
"prediction": "Angelica, wearing a dark hat, is handing a compass to Jack, who is shirtless and has a chest tattoo, amidst dense green foliage. Other indistinct figures are in the background." |
|
}, |
|
{ |
|
"id": 149, |
|
"question": "Syrena is <img>image_1</img>\n Philip is <img>image_2</img>\n In the image: <img>image_3</img>\n Give a description.", |
|
"prediction": "Syrena is sitting closely behind Philip, both appear to be in a dense jungle setting. Syrena is embracing Philip from behind, and another person is partially visible sitting on the ground in front of them." |
|
}, |
|
{ |
|
"id": 150, |
|
"question": "Angelica is <img>image_1</img>\n In the image: <img>image_2</img>\n Identify Angelica with grounding.", |
|
"prediction": "<ref>Angelica</ref><box>(73,61),(507,990)</box>" |
|
}, |
|
{ |
|
"id": 151, |
|
"question": "Elizabeth is <img>image_1</img>\n William is <img>image_2</img>\n In the image: <img>image_3</img>\n Give a description.", |
|
"prediction": "Elizabeth is seated on the left, wearing a blue blazer and skirt, looking down at a book in her lap. William is seated beside her, wearing a dark suit, also looking down at a book. They appear to be engaged in studying or reading together." |
|
}, |
|
{ |
|
"id": 152, |
|
"question": "William is <img>image_1</img>\n Elizabeth is <img>image_2</img>\n In the image: <img>image_3</img>\n Identify Elizabeth with grounding.", |
|
"prediction": "<ref>Elizabeth</ref><box>(664,0),(998,994)</box>" |
|
}, |
|
{ |
|
"id": 153, |
|
"question": "Brant is <img>image_1</img>\n Olive is <img>image_2</img>\n In the image: <img>image_3</img>\n What color is Olive's hat?", |
|
"prediction": "Olive's hat is brown." |
|
}, |
|
{ |
|
"id": 154, |
|
"question": "Elizabeth is <img>image_1</img>\n Olive is <img>image_2</img>\n In the image: <img>image_3</img>\n Identify Elizabeth with grounding.", |
|
"prediction": "<ref>Elizabeth</ref><box>(603,62),(872,984)</box>" |
|
}, |
|
{ |
|
"id": 155, |
|
"question": "Elizabeth is <img>image_1</img>\n William is <img>image_2</img>\n In the image: <img>image_3</img>\n Describe William's state.", |
|
"prediction": "William is standing with his hands on his thighs." |
|
}, |
|
{ |
|
"id": 156, |
|
"question": "William is <img>image_1</img>\n Elizabeth is <img>image_2</img>\n In the image: <img>image_3</img>\n Is William sitting or lying down?", |
|
"prediction": "William is lying down." |
|
}, |
|
{ |
|
"id": 157, |
|
"question": "Robert is <img>image_1</img>\n In the image: <img>image_2</img>\n Identify Robert with grounding.", |
|
"prediction": "<ref>Robert</ref><box>(603,56),(896,981)</box>" |
|
}, |
|
{ |
|
"id": 158, |
|
"question": "Charles Rodman is <img>image_1</img>\n Will Rodman is <img>image_2</img>\n In the image: <img>image_3</img>\n Explain the visual content.", |
|
"prediction": "Charles Rodman is standing behind a table, leaning forward to feed a small chimpanzee, while Will Rodman sits at the table, looking on with a mug in his hand." |
|
}, |
|
{ |
|
"id": 159, |
|
"question": "Will Rodman is <img>image_1</img>\n Caesar is <img>image_2</img>\n In the image: <img>image_3</img>\n Who is sitting in the back seat of the car?", |
|
"prediction": "Caesar is sitting in the back seat of the car." |
|
}, |
|
{ |
|
"id": 160, |
|
"question": "Will Rodman is <img>image_1</img>\n In the image: <img>image_2</img>\n Identify Will Rodman with grounding.", |
|
"prediction": "<ref>Will Rodman</ref><box>(385,22),(648,994)</box>" |
|
}, |
|
{ |
|
"id": 161, |
|
"question": "David Norris is <img>image_1</img>\n Elise Sellas is <img>image_2</img>\n In the image: <img>image_3</img>\n Who is sitting by the window?", |
|
"prediction": "Elise Sellas is sitting by the window." |
|
}, |
|
{ |
|
"id": 162, |
|
"question": "Charlie Traynor is <img>image_1</img>\n David Norris is <img>image_2</img>\n In the image: <img>image_3</img>\n Identify Charlie Traynor with grounding.", |
|
"prediction": "<ref>Charlie Traynor</ref><box>(89,86),(467,987)</box>" |
|
}, |
|
{ |
|
"id": 163, |
|
"question": "Charlie is <img>image_1</img>\n David is <img>image_2</img>\n Elise is <img>image_3</img>\n In the image: <img>image_4</img>\n Give a description.", |
|
"prediction": "Charlie stands behind a dining table, facing David and Elise, who are seated across from each other. David appears to be in conversation with Charlie, while Elise is looking down, possibly at a menu. Other diners are visible in the background." |
|
}, |
|
{ |
|
"id": 164, |
|
"question": "David Norris is <img>image_1</img>\n Jon Stewart is <img>image_2</img>\n In the image: <img>image_3</img>\n Identify Jon Stewart with grounding.", |
|
"prediction": "<ref>Jon Stewart</ref><box>(175,79),(435,988)</box>" |
|
}, |
|
{ |
|
"id": 165, |
|
"question": "Bloom is <img>image_1</img>\n In the image: <img>image_2</img>\n Identify Bloom with grounding.", |
|
"prediction": "<ref>Bloom</ref><box>(625,69),(998,981)</box>" |
|
}, |
|
{ |
|
"id": 166, |
|
"question": "Romeo is <img>image_1</img>\n Murphy is <img>image_2</img>\n Please describe the image: <img>image_3</img>\n", |
|
"prediction": "Murphy, holding a gun, stands on the left, while Romeo, dressed in a white chef's outfit with a feathered hat, stands on the right. They appear to be in a dimly lit bar with festive lights in the background." |
|
}, |
|
{ |
|
"id": 167, |
|
"question": "Romeo is <img>image_1</img>\n In the image: <img>image_2</img>\n What is Romeo doing?", |
|
"prediction": "Romeo is standing at the bar with a drink in his hand." |
|
}, |
|
{ |
|
"id": 168, |
|
"question": "Connor is <img>image_1</img>\n In the image: <img>image_2</img>\n What is Connor doing?", |
|
"prediction": "Connor is sitting at a table, looking at a card." |
|
}, |
|
{ |
|
"id": 169, |
|
"question": "Romeo is <img>image_1</img>\n In the image: <img>image_2</img>\n Give a description.", |
|
"prediction": "Romeo, holding a gun, confronts a man in a room with shelves and a 'No smoking' sign on the wall." |
|
}, |
|
{ |
|
"id": 170, |
|
"question": "Poppa is <img>image_1</img>\n In the image: <img>image_2</img>\n Identify Poppa with grounding.", |
|
"prediction": "<ref>Poppa</ref><box>(278,58),(546,981)</box>" |
|
}, |
|
{ |
|
"id": 171, |
|
"question": "Katsuro Matsuoka is <img>image_1</img>\n In the image: <img>image_2</img>\n Identify Katsuro Matsuoka with grounding.", |
|
"prediction": "<ref>Katsuro Matsuoka</ref><box>(300,172),(535,988)</box>" |
|
}, |
|
{ |
|
"id": 172, |
|
"question": "Zhu Bajie is <img>image_1</img>\n Tangseng is <img>image_2</img>\n Shaseng is <img>image_3</img>\n In the image: <img>image_4</img>\n Identify Tangseng with grounding.", |
|
"prediction": "<ref>Tangseng</ref><box>(25,247),(396,995)</box>" |
|
}, |
|
{ |
|
"id": 173, |
|
"question": "Shaseng is <img>image_1</img>\n Tangseng is <img>image_2</img>\n Sun Wukong is <img>image_3</img>\n In the image: <img>image_4</img>\n Give a description.", |
|
"prediction": "Shaseng stands to the right holding a bow, Tangseng is in the center wearing a crown, and Sun Wukong is on the left with a sword, all in a forest setting." |
|
}, |
|
{ |
|
"id": 174, |
|
"question": "Shaseng is <img>image_1</img>\n Tangseng is <img>image_2</img>\n Sun Wukong is <img>image_3</img>\n In the image: <img>image_4</img>\n Identify Sun Wukong with grounding.", |
|
"prediction": "<ref>Sun Wukong</ref><box>(398,281),(777,981)</box>" |
|
}, |
|
{ |
|
"id": 175, |
|
"question": "Shary is <img>image_1</img>\n In the image: <img>image_2</img>\n Identify Shary with grounding.", |
|
"prediction": "<ref>Shary</ref><box>(7,472),(250,995)</box>" |
|
}, |
|
{ |
|
"id": 176, |
|
"question": "Shaseng is <img>image_1</img>\n In the image: <img>image_2</img>\n What is Shaseng doing?", |
|
"prediction": "Shaseng is standing and seems to be in a conversation or interaction with others." |
|
}, |
|
{ |
|
"id": 177, |
|
"question": "Shaseng is <img>image_1</img>\n Zhu Bajie is <img>image_2</img>\n In the image: <img>image_3</img>\n Who is lying down?", |
|
"prediction": "Zhu Bajie is lying down." |
|
}, |
|
{ |
|
"id": 178, |
|
"question": "Benjam is <img>image_1</img>\n Irene is <img>image_2</img>\n In the image: <img>image_3</img>\n Identify Benjam with grounding.", |
|
"prediction": "<ref>Benjam</ref><box>(160,43),(542,988)</box>" |
|
}, |
|
{ |
|
"id": 179, |
|
"question": "Irene is <img>image_1</img>\n In the image: <img>image_2</img>\n What is Irene doing?", |
|
"prediction": "Irene is standing and holding some papers." |
|
}, |
|
{ |
|
"id": 180, |
|
"question": "Isidoro is <img>image_1</img>\n Benjam is <img>image_2</img>\n Irene is <img>image_3</img>\n In the image: <img>image_4</img>\n Identify Isidoro with grounding.", |
|
"prediction": "<ref>Isidoro</ref><box>(635,319),(998,994)</box>" |
|
}, |
|
{ |
|
"id": 181, |
|
"question": "Sam Witwicky is <img>image_1</img>\n Bruce Brazos is <img>image_2</img>\n In the image: <img>image_3</img>\n What is Bruce Brazos going to do?", |
|
"prediction": "Bruce Brazos is going to place his hand on Sam Witwicky's shoulder." |
|
}, |
|
{ |
|
"id": 182, |
|
"question": "Sam Witwicky is <img>image_1</img>\n In the image: <img>image_2</img>\n Identify Sam Witwicky with grounding.", |
|
"prediction": "<ref>Sam Witwicky</ref><box>(0,0),(385,979)</box>" |
|
}, |
|
{ |
|
"id": 183, |
|
"question": "Lennox is <img>image_1</img>\n In the image: <img>image_2</img>\n Is Lennox the person on the left or the one on the right?", |
|
"prediction": "Lennox is the person on the right." |
|
}, |
|
{ |
|
"id": 184, |
|
"question": "Sam is <img>image_1</img>\n Carly is <img>image_2</img>\n In the image: <img>image_3</img>\n What color is Sam's clothes?", |
|
"prediction": "Sam's clothes are light blue." |
|
}, |
|
{ |
|
"id": 185, |
|
"question": "Dylan is <img>image_1</img>\n Carly is <img>image_2</img>\n In the image: <img>image_3</img>\n Identify Carly with grounding.", |
|
"prediction": "<ref>Carly</ref><box>(118,34),(376,908)</box>" |
|
}, |
|
{ |
|
"id": 186, |
|
"question": "Dylan is <img>image_1</img>\n Carly is <img>image_2</img>\n In the image: <img>image_3</img>\n Identify Dylan with grounding.", |
|
"prediction": "<ref>Dylan</ref><box>(467,125),(725,994)</box>" |
|
}, |
|
{ |
|
"id": 187, |
|
"question": "Rooster is <img>image_1</img>\n LaBoeuf is <img>image_2</img>\n In the image: <img>image_3</img>\n What is Rooster doing?", |
|
"prediction": "Rooster is lighting a cigarette." |
|
}, |
|
{ |
|
"id": 188, |
|
"question": "Mattie Ross is <img>image_1</img>\n In the image: <img>image_2</img>\n Identify Mattie Ross with grounding.", |
|
"prediction": "<ref>Mattie Ross</ref><box>(131,125),(421,995)</box>" |
|
}, |
|
{ |
|
"id": 189, |
|
"question": "Mattie Ross is <img>image_1</img>\n LaBoeuf is <img>image_2</img>\n In the image: <img>image_3</img>\n Give a description.", |
|
"prediction": "Mattie Ross, wearing a brown coat and hat, is standing and holding a metal cup. LaBoeuf, also in a brown coat and hat, is seated next to her, appearing to be in a forest setting." |
|
}, |
|
{ |
|
"id": 190, |
|
"question": "Mattie Ross is <img>image_1</img>\n LaBoeuf is <img>image_2</img>\n In the image: <img>image_3</img>\n Who is hiding beside a rock?", |
|
"prediction": "LaBoeuf is hiding beside a rock." |
|
}, |
|
{ |
|
"id": 191, |
|
"question": "Qin is <img>image_1</img>\n Lord Ximen is <img>image_2</img>\n In the image: <img>image_3</img>\n Identify Qin with grounding.", |
|
"prediction": "<ref>Qin</ref><box>(485,1),(900,981)</box>" |
|
}, |
|
{ |
|
"id": 192, |
|
"question": "Qin is <img>image_1</img>\n In the image: <img>image_2</img>\n Describe Qin's state.", |
|
"prediction": "Qin is standing with his hand on another person's shoulder, appearing to be in a conversation or interaction." |
|
}, |
|
{ |
|
"id": 193, |
|
"question": "Lord is <img>image_1</img>\n In the image: <img>image_2</img>\n What color is Lord's clothes?", |
|
"prediction": "Lord's clothes are red and black." |
|
}, |
|
{ |
|
"id": 194, |
|
"question": "Lord Ximen is <img>image_1</img>\n Ho Sum-on is <img>image_2</img>\n In the image: <img>image_3</img>\n What color is Ho Sum-on's clothes?", |
|
"prediction": "Ho Sum-on's clothes are yellow." |
|
}, |
|
{ |
|
"id": 195, |
|
"question": "Qin is <img>image_1</img>\n Big Brother is <img>image_2</img>\n Please describe the image: <img>image_3</img>\n", |
|
"prediction": "Big Brother, wearing a pink shirt and gray vest, is seated at a table facing Qin, who is dressed in a black suit. They appear to be in a serious conversation across a table covered with books and surrounded by bookshelves." |
|
}, |
|
{ |
|
"id": 196, |
|
"question": "Qin is <img>image_1</img>\n SoSo is <img>image_2</img>\n In the image: <img>image_3</img>\n What does SoSo wear?", |
|
"prediction": "SoSo wears a black blouse with white polka dots." |
|
}, |
|
{ |
|
"id": 197, |
|
"question": "Qin Kwai is <img>image_1</img>\n Qin is <img>image_2</img>\n In the image: <img>image_3</img>\n Who is waving hand?", |
|
"prediction": "Qin Kwai is waving hand." |
|
}, |
|
{ |
|
"id": 198, |
|
"question": "Qin is <img>image_1</img>\n Qin Kwai is <img>image_2</img>\n In the image: <img>image_3</img>\n Identify Qin Kwai with grounding.", |
|
"prediction": "<ref>Qin Kwai</ref><box>(612,216),(998,995)</box>" |
|
}, |
|
{ |
|
"id": 199, |
|
"question": "Big Brother is <img>image_1</img>\n In the image: <img>image_2</img>\n Give a description.", |
|
"prediction": "Big Brother, wearing a light blue shirt, is embracing a young child in a blue shirt with a white patterned skirt. They are standing in a room with traditional Chinese decor. Other individuals are present in the background." |
|
}, |
|
{ |
|
"id": 200, |
|
"question": "Qin is <img>image_1</img>\n SoSo is <img>image_2</img>\n Provide a description for the image: <img>image_3</img>\n", |
|
"prediction": "Qin is on the right, wearing a white shirt and pointing forward with his right hand. SoSo is on the left, wearing a white tank top, facing towards Qin. They are surrounded by blue and green balloons." |
|
}, |
|
{ |
|
"id": 201, |
|
"question": "Dr. Martin Harris is <img>image_1</img>\n Herr Strauss is <img>image_2</img>\n In the image: <img>image_3</img>\n Identify Herr Strauss with grounding.", |
|
"prediction": "<ref>Herr Strauss</ref><box>(610,83),(884,983)</box>" |
|
}, |
|
{ |
|
"id": 202, |
|
"question": "Herr Strauss is <img>image_1</img>\n Dr. Martin Harris is <img>image_2</img>\n In the image: <img>image_3</img>\n Who is leaning against the table?", |
|
"prediction": "Dr. Martin Harris is leaning against the table." |
|
}, |
|
{ |
|
"id": 203, |
|
"question": "Martin is <img>image_1</img>\n Gina is <img>image_2</img>\n In the image: <img>image_3</img>\n Does Martin wear a hat?", |
|
"prediction": "No, Martin does not wear a hat." |
|
}, |
|
{ |
|
"id": 204, |
|
"question": "Martin is <img>image_1</img>\n Ernst is <img>image_2</img>\n Gina is <img>image_3</img>\n In the image: <img>image_4</img>\n Give a description.", |
|
"prediction": "Martin is standing on the left, facing a woman, Gina, who is turned towards him. Ernst stands to the right, looking in their direction. They are on a bridge with a historic building in the background and it's snowing." |
|
}, |
|
{ |
|
"id": 205, |
|
"question": "Martin is <img>image_1</img>\n Elizabeth is <img>image_2</img>\n In the image: <img>image_3</img>\n What is on Elizabeth's neck?", |
|
"prediction": "Elizabeth is wearing a pearl necklace." |
|
}, |
|
{ |
|
"id": 206, |
|
"question": "Professor Bressler is <img>image_1</img>\n Provide a description for the image: <img>image_2</img>\n", |
|
"prediction": "Professor Bressler is standing in a crowded room, wearing a dark suit and appears to be in conversation. A young girl in a white dress is standing to his right, holding a stuffed animal. Other individuals are blurred and unidentifiable." |
|
}, |
|
{ |
|
"id": 207, |
|
"question": "Natalie is <img>image_1</img>\n Craig is <img>image_2</img>\n In the image: <img>image_3</img>\n Is Natalie the person standing closer to Craig or farther away?", |
|
"prediction": "Natalie is standing closer to Craig." |
|
}, |
|
{ |
|
"id": 208, |
|
"question": "Craig is <img>image_1</img>\n In the image: <img>image_2</img>\n Identify Craig with grounding.", |
|
"prediction": "<ref>Craig</ref><box>(496,47),(898,905)</box>" |
|
}, |
|
{ |
|
"id": 209, |
|
"question": "Ryan is <img>image_1</img>\n Natalie is <img>image_2</img>\n In the image: <img>image_3</img>\n Give a description.", |
|
"prediction": "Ryan, in a suit, is holding a boarding pass while walking through an airport. Natalie, also in a suit, follows behind with a coat over her shoulder. They are surrounded by other travelers." |
|
}, |
|
{ |
|
"id": 210, |
|
"question": "Julie Bingham is <img>image_1</img>\n Kara Bingham is <img>image_2</img>\n In the image: <img>image_3</img>\n Identify Julie Bingham with grounding.", |
|
"prediction": "<ref>Julie Bingham</ref><box>(7,129),(407,992)</box>" |
|
}, |
|
{ |
|
"id": 211, |
|
"question": "Jim is <img>image_1</img>\n Julie is <img>image_2</img>\n In the image: <img>image_3</img>\n Give a description.", |
|
"prediction": "Julie, in a white bridal dress with a veil and holding a bouquet, stands next to Jim, who is in a black suit with a red tie. They appear to be at a wedding ceremony." |
|
}, |
|
{ |
|
"id": 212, |
|
"question": "Ryan Bingham is <img>image_1</img>\n Alex Goran is <img>image_2</img>\n In the image: <img>image_3</img>\n What is Alex Goran doing?", |
|
"prediction": "Alex Goran is holding a champagne glass." |
|
}, |
|
{ |
|
"id": 213, |
|
"question": "Brendan Conlon is <img>image_1</img>\n Frank Campana is <img>image_2</img>\n In the image: <img>image_3</img>\n What is Frank Campana doing?", |
|
"prediction": "Frank Campana is pointing at something or someone." |
|
}, |
|
{ |
|
"id": 214, |
|
"question": "Paddy Conlon is <img>image_1</img>\n In the image: <img>image_2</img>\n Identify Paddy Conlon with grounding.", |
|
"prediction": "<ref>Paddy Conlon</ref><box>(181,40),(625,981)</box>" |
|
}, |
|
{ |
|
"id": 215, |
|
"question": "Principal Zito is <img>image_1</img>\n In the image: <img>image_2</img>\n What does Principal Zito wear?", |
|
"prediction": "Principal Zito is wearing a striped polo shirt." |
|
}, |
|
{ |
|
"id": 216, |
|
"question": "Fenroy is <img>image_1</img>\n In the image: <img>image_2</img>\n Identify Fenroy with grounding.", |
|
"prediction": "<ref>Fenroy</ref><box>(245,170),(603,995)</box>" |
|
}, |
|
{ |
|
"id": 217, |
|
"question": "Juan Lian is <img>image_1</img>\n Zi Xia is <img>image_2</img>\n Please describe the image: <img>image_3</img>\n", |
|
"prediction": "Juan Lian is on the left, wearing a dark outfit with a white sash, gesturing with his right hand near his head. Zi Xia is on the right, dressed in a white robe with a purple detail, standing calmly. They appear to be in a dimly lit room with shelves in the background." |
|
}, |
|
{ |
|
"id": 218, |
|
"question": "Sun Wukong is <img>image_1</img>\n In the image: <img>image_2</img>\n Give a description.", |
|
"prediction": "Sun Wukong is engaged in a fierce battle, wielding a weapon with both hands and defending against multiple opponents." |
|
}, |
|
{ |
|
"id": 219, |
|
"question": "Juan Lian is <img>image_1</img>\n Zi Xia is <img>image_2</img>\n In the image: <img>image_3</img>\n What is Zi Xia doing?", |
|
"prediction": "Zi Xia is clapping her hands." |
|
}, |
|
{ |
|
"id": 220, |
|
"question": "Sun Wukong is <img>image_1</img>\n Zi Xia is <img>image_2</img>\n In the image: <img>image_3</img>\n Who is sitting on top?", |
|
"prediction": "Sun Wukong is sitting on top." |
|
}, |
|
{ |
|
"id": 221, |
|
"question": "Erlang Shen is <img>image_1</img>\n Juan Lian is <img>image_2</img>\n In the image: <img>image_3</img>\n Identify Erlang Shen with grounding.", |
|
"prediction": "<ref>Erlang Shen</ref><box>(26,0),(662,994)</box>" |
|
}, |
|
{ |
|
"id": 222, |
|
"question": "Sun Wukong is <img>image_1</img>\n Zi Xia is <img>image_2</img>\n In the image: <img>image_3</img>\n Identify Zi Xia with grounding.", |
|
"prediction": "<ref>Zi Xia</ref><box>(189,236),(465,988)</box>" |
|
}, |
|
{ |
|
"id": 223, |
|
"question": "Royce is <img>image_1</img>\n In the image: <img>image_2</img>\n Identify Royce with grounding.", |
|
"prediction": "<ref>Royce</ref><box>(617,0),(979,956)</box>" |
|
}, |
|
{ |
|
"id": 224, |
|
"question": "Edwin is <img>image_1</img>\n Isabelle is <img>image_2</img>\n In the image: <img>image_3</img>\n Identify Isabelle with grounding.", |
|
"prediction": "<ref>Isabelle</ref><box>(386,195),(582,996)</box>" |
|
}, |
|
{ |
|
"id": 225, |
|
"question": "Elizabeth Shaw is <img>image_1</img>\n In the image: <img>image_2</img>\n Identify Elizabeth Shaw with grounding.", |
|
"prediction": "<ref>Elizabeth Shaw</ref><box>(98,131),(311,993)</box>" |
|
}, |
|
{ |
|
"id": 226, |
|
"question": "David is <img>image_1</img>\n Elizabeth Shaw is <img>image_2</img>\n In the image: <img>image_3</img>\n What is David doing?", |
|
"prediction": "David is standing and looking at a screen." |
|
}, |
|
{ |
|
"id": 227, |
|
"question": "David is <img>image_1</img>\n Elizabeth Shaw is <img>image_2</img>\n In the image: <img>image_3</img>\n Give a description.", |
|
"prediction": "David is lying on a table, facing away from the camera, with his arm around Elizabeth Shaw, who is also lying down, visible from the waist up, in a dimly lit room with industrial surroundings." |
|
}, |
|
{ |
|
"id": 228, |
|
"question": "Hilly Holbrook is <img>image_1</img>\n Jolene French is <img>image_2</img>\n Elizabeth Leefolt is <img>image_3</img>\n In the image: <img>image_4</img>\n Identify Elizabeth Leefolt with grounding.", |
|
"prediction": "<ref>Elizabeth Leefolt</ref><box>(547,110),(825,983)</box>" |
|
}, |
|
{ |
|
"id": 229, |
|
"question": "Hilly Holbrook is <img>image_1</img>\n Skeeter Phelan is <img>image_2</img>\n In the image: <img>image_3</img>\n Who is holding the other person's arms?", |
|
"prediction": "Hilly Holbrook is holding Skeeter Phelan's arms." |
|
}, |
|
{ |
|
"id": 230, |
|
"question": "Skeeter Phelan is <img>image_1</img>\n Elizabeth Leefolt is <img>image_2</img>\n In the image: <img>image_3</img>\n who has a drink in front of herself?", |
|
"prediction": "Elizabeth Leefolt has a drink in front of herself." |
|
}, |
|
{ |
|
"id": 231, |
|
"question": "Skeeter Phelan is <img>image_1</img>\n Aibileen Clark is <img>image_2</img>\n In the image: <img>image_3</img>\n Give a description.", |
|
"prediction": "Skeeter Phelan is seated at a kitchen table, looking at papers, while Aibileen Clark stands nearby, holding a spoon and wearing an apron." |
|
}, |
|
{ |
|
"id": 232, |
|
"question": "Hilly Holbrook is <img>image_1</img>\n Elizabeth Leefolt is <img>image_2</img>\n Jolene French is <img>image_3</img>\n In the image: <img>image_4</img>\n What does Jolene French wear?", |
|
"prediction": "Jolene French wears a black dress with a patterned design." |
|
}, |
|
{ |
|
"id": 233, |
|
"question": "Aibileen Clark is <img>image_1</img>\n Minny Jackson is <img>image_2</img>\n In the image: <img>image_3</img>\n Identify Minny Jackson with grounding.", |
|
"prediction": "<ref>Minny Jackson</ref><box>(650,20),(837,985)</box>" |
|
}, |
|
{ |
|
"id": 234, |
|
"question": "Aibileen is <img>image_1</img>\n In the image: <img>image_2</img>\n What is Aibileen doing?", |
|
"prediction": "Aibileen is holding a picture and a purse." |
|
}, |
|
{ |
|
"id": 235, |
|
"question": "Hilly Holbrook is <img>image_1</img>\n Elizabeth Leefolt is <img>image_2</img>\n Describe the content of the image: <img>image_3</img>\n", |
|
"prediction": "Hilly Holbrook stands with her hands on her hips facing forward, while Elizabeth Leefolt holds a baby, both in a room." |
|
}, |
|
{ |
|
"id": 236, |
|
"question": "Meiqin is <img>image_1</img>\n Heizi is <img>image_2</img>\n Leizi is <img>image_3</img>\n Chuchun is <img>image_4</img>\n In the image: <img>image_5</img>\n Identify Leizi with grounding.", |
|
"prediction": "<ref>Leizi</ref><box>(10,260),(372,995)</box>" |
|
}, |
|
{ |
|
"id": 237, |
|
"question": "Heizi is <img>image_1</img>\n Chuchun is <img>image_2</img>\n Leizi is <img>image_3</img>\n In the image: <img>image_4</img>\n Who is standing behind?", |
|
"prediction": "Heizi is standing behind Chuchun." |
|
}, |
|
{ |
|
"id": 238, |
|
"question": "Meiqin is <img>image_1</img>\n Shifeng is <img>image_2</img>\n In the image: <img>image_3</img>\n Give a description.", |
|
"prediction": "Shifeng is standing and leaning forward to hand a book to Meiqin, who is sitting at a table in a library with other students in the background." |
|
}, |
|
{ |
|
"id": 239, |
|
"question": "Meiqin is <img>image_1</img>\n Heizi is <img>image_2</img>\n Leizi is <img>image_3</img>\n Chuchun is <img>image_4</img>\n In the image: <img>image_5</img>\n Who is squatting?", |
|
"prediction": "Leizi is squatting." |
|
}, |
|
{ |
|
"id": 240, |
|
"question": "Pei is <img>image_1</img>\n Heizi is <img>image_2</img>\n Leizi is <img>image_3</img>\n Chuchun is <img>image_4</img>\n In the image: <img>image_5</img>\n What is Chuchun doing?", |
|
"prediction": "Chuchun is standing and looking towards Heizi." |
|
}, |
|
{ |
|
"id": 241, |
|
"question": "Meiqin is <img>image_1</img>\n Heizi is <img>image_2</img>\n Pei is <img>image_3</img>\n Describe the image: <img>image_4</img>\n", |
|
"prediction": "Heizi is sitting on the left, facing towards a girl standing on the right, identified as Pei. Both characters appear to be conversing against a backdrop of a city skyline and a clear sky with clouds." |
|
}, |
|
{ |
|
"id": 242, |
|
"question": "Meiqin is <img>image_1</img>\n Pei is <img>image_2</img>\n Leizi is <img>image_3</img>\n Chuchun is <img>image_4</img>\n In the image: <img>image_5</img>\n Who is carrying Pei on her back?", |
|
"prediction": "Leizi is carrying Pei on her back." |
|
}, |
|
{ |
|
"id": 243, |
|
"question": "Leizi is <img>image_1</img>\n Chuchun is <img>image_2</img>\n In the image: <img>image_3</img>\n What is Chuchun's experssion?", |
|
"prediction": "Chuchun looks surprised or amused." |
|
}, |
|
{ |
|
"id": 244, |
|
"question": "Meiqin is <img>image_1</img>\n Pei is <img>image_2</img>\n In the image: <img>image_3</img>\n Give a description.", |
|
"prediction": "Pei is in a blue dress, leaping to the left, while Meiqin is in a brown shirt and grey skirt, seated and reaching out towards Pei." |
|
}, |
|
{ |
|
"id": 245, |
|
"question": "Meiqin is <img>image_1</img>\n Dangma is <img>image_2</img>\n In the image: <img>image_3</img>\n Identify Dangma with grounding.", |
|
"prediction": "<ref>Dangma</ref><box>(306,248),(525,994)</box>" |
|
}, |
|
{ |
|
"id": 246, |
|
"question": "Meiqin is <img>image_1</img>\n Heizi is <img>image_2</img>\n Leizi is <img>image_3</img>\n Chuchun is <img>image_4</img>\n In the image: <img>image_5</img>\n Identify Heizi with grounding.", |
|
"prediction": "<ref>Heizi</ref><box>(623,292),(803,825)</box>" |
|
}, |
|
{ |
|
"id": 247, |
|
"question": "Meiqin is <img>image_1</img>\n Heizi is <img>image_2</img>\n In the image: <img>image_3</img>\n Give a description.", |
|
"prediction": "Heizi is seated at a table reaching out to touch Meiqin, who is standing across the table with a surprised expression. They are outdoors with a flower garden and trees in the background." |
|
}, |
|
{ |
|
"id": 248, |
|
"question": "Meiqin is <img>image_1</img>\n Shifeng is <img>image_2</img>\n In the image: <img>image_3</img>\n What does Meiqin wear?", |
|
"prediction": "Meiqin wears a black tank top with a white strap top." |
|
}, |
|
{ |
|
"id": 249, |
|
"question": "Dangma is <img>image_1</img>\n Leizi is <img>image_2</img>\n Describe the content of the image: <img>image_3</img>\n", |
|
"prediction": "Dangma is standing on the left, facing Leizi, who is holding a necklace in her hand. They appear to be in a cityscape with buildings and billboards in the background." |
|
}, |
|
{ |
|
"id": 250, |
|
"question": "Heizi is <img>image_1</img>\n Leizi is <img>image_2</img>\n Chuchun is <img>image_3</img>\n In the image: <img>image_4</img>\n What is Chuchun doing?", |
|
"prediction": "Chuchun is pushing Heizi in a wheelchair." |
|
}, |
|
{ |
|
"id": 251, |
|
"question": "Runzi is <img>image_1</img>\n In the image: <img>image_2</img>\n Identify Runzi with grounding.", |
|
"prediction": "<ref>Runzi</ref><box>(109,170),(359,994)</box>" |
|
}, |
|
{ |
|
"id": 252, |
|
"question": "Meiqin is <img>image_1</img>\n Heizi is <img>image_2</img>\n In the image: <img>image_3</img>\n Give a description.", |
|
"prediction": "Heizi is holding up a photo to the camera with both hands, while Meiqin is looking at the photo with interest. Both are in a corridor." |
|
}, |
|
{ |
|
"id": 253, |
|
"question": "Meiqin is <img>image_1</img>\n Heizi is <img>image_2</img>\n In the image: <img>image_3</img>\n Who is holding the umbrella?", |
|
"prediction": "Heizi is holding the umbrella." |
|
}, |
|
{ |
|
"id": 254, |
|
"question": "Leizi is <img>image_1</img>\n In the image: <img>image_2</img>\n What color is Leizi's clothes?", |
|
"prediction": "Leizi is wearing a white top and a blue vest." |
|
}, |
|
{ |
|
"id": 255, |
|
"question": "Meiqin is <img>image_1</img>\n Heizi is <img>image_2</img>\n Leizi is <img>image_3</img>\n Chuchun is <img>image_4</img>\n In the image: <img>image_5</img>\n Identify Heizi with grounding.", |
|
"prediction": "<ref>Heizi</ref><box>(229,539),(426,980)</box>" |
|
}, |
|
{ |
|
"id": 256, |
|
"question": "Tangsan is <img>image_1</img>\n Xiaowu is <img>image_2</img>\n Rongrong is <img>image_3</img>\n Zhuqing is <img>image_4</img>\n In the image: <img>image_5</img>\n Identify Rongrong with grounding.", |
|
"prediction": "<ref>Rongrong</ref><box>(658,193),(840,933)</box>" |
|
}, |
|
{ |
|
"id": 257, |
|
"question": "Daimubai is <img>image_1</img>\n In the image: <img>image_2</img>\n What is Daimubai doing?", |
|
"prediction": "Daimubai is standing with his arms crossed." |
|
}, |
|
{ |
|
"id": 258, |
|
"question": "Tangsan is <img>image_1</img>\n Xiaowu is <img>image_2</img>\n In the image: <img>image_3</img>\n Give a description.", |
|
"prediction": "Tangsan, dressed in a blue outfit, stands to the left, while Xiaowu, wearing a pink bunny costume, is on the right. They appear to be in a forest at night with glowing plants and lights in the background." |
|
}, |
|
{ |
|
"id": 259, |
|
"question": "Tangsan is <img>image_1</img>\n Xiaowu is <img>image_2</img>\n Rongrong is <img>image_3</img>\n Aosika is <img>image_4</img>\n In the image: <img>image_5</img>\n Give a description.", |
|
"prediction": "Tangsan, in a blue outfit, stands next to Xiaowu, who is fixing his clothes. Rongrong, with bunny ears, stands behind them. Aosika is partially visible on the right side. They appear to be at a lively event with lights in the background." |
|
}, |
|
{ |
|
"id": 260, |
|
"question": "Xiaose is <img>image_1</img>\n Wuxin is <img>image_2</img>\n In the image: <img>image_3</img>\n What is Wuxin doing?", |
|
"prediction": "Wuxin is embracing Xiaose." |
|
}, |
|
{ |
|
"id": 261, |
|
"question": "Xiaose is <img>image_1</img>\n Wuxin is <img>image_2</img>\n Leiwujie is <img>image_3</img>\n In the image: <img>image_4</img>\n Provide description of visual content.", |
|
"prediction": "Wuxin is sitting by a campfire, looking to her left, while Xiaose is standing behind her, holding a staff and looking towards the right. Leiwujie is not visible within the given coordinates." |
|
}, |
|
{ |
|
"id": 262, |
|
"question": "Xiaose is <img>image_1</img>\n Wuxin is <img>image_2</img>\n Baifa is <img>image_3</img>\n Leiwujie is <img>image_4</img>\n In the image: <img>image_5</img>\n Identify Baifa with grounding.", |
|
"prediction": "<ref>Baifa</ref><box>(789,164),(998,995)</box>" |
|
}, |
|
{ |
|
"id": 263, |
|
"question": "Tanglian is <img>image_1</img>\n In the image: <img>image_2</img>\n Identify Tanglian with grounding.", |
|
"prediction": "<ref>Tanglian</ref><box>(210,286),(582,988)</box>" |
|
}, |
|
{ |
|
"id": 264, |
|
"question": "Qianluo is <img>image_1</img>\n Tanglian is <img>image_2</img>\n Rui is <img>image_3</img>\n In the image: <img>image_4</img>\n Give a description.", |
|
"prediction": "Qianluo is seated on the left, holding a sword, Tanglian is seated on the right, holding a plate with food, and Rui is seated between them, appearing to be in conversation." |
|
}, |
|
{ |
|
"id": 265, |
|
"question": "Xiaose is <img>image_1</img>\n Leiwujie is <img>image_2</img>\n In the image: <img>image_3</img>\n What is Xiaose doing?", |
|
"prediction": "Xiaose is sitting and looking to the side." |
|
}, |
|
{ |
|
"id": 266, |
|
"question": "Xiaose is <img>image_1</img>\n Qianluo is <img>image_2</img>\n Tanglian is <img>image_3</img>\n Leiwujie is <img>image_4</img>\n In the image: <img>image_5</img>\n Identify Qianluo with grounding.", |
|
"prediction": "<ref>Qianluo</ref><box>(201,243),(386,869)</box>" |
|
}, |
|
{ |
|
"id": 267, |
|
"question": "Yuechu is <img>image_1</img>\n Susu is <img>image_2</img>\n In the image: <img>image_3</img>\n Identify Susu with grounding.", |
|
"prediction": "<ref>Susu</ref><box>(510,560),(820,998)</box>" |
|
}, |
|
{ |
|
"id": 268, |
|
"question": "Yuechu is <img>image_1</img>\n Susu is <img>image_2</img>\n In the image: <img>image_3</img>\n What is Yuechu doing?", |
|
"prediction": "Yuechu is holding a peach-colored umbrella." |
|
}, |
|
{ |
|
"id": 269, |
|
"question": "Yuechu is <img>image_1</img>\n Susu is <img>image_2</img>\n In the image: <img>image_3</img>\n Give a description.", |
|
"prediction": "Yuechu stands on the left, holding a lollipop, wearing a white shirt with a gray vest. Susu is on the right, dressed in a colorful outfit with a pink bag, both against a clear sky background." |
|
}, |
|
{ |
|
"id": 270, |
|
"question": "Rongrong is <img>image_1</img>\n Yaya is <img>image_2</img>\n In the image: <img>image_3</img>\n Identify Rongrong with grounding.", |
|
"prediction": "<ref>Rongrong</ref><box>(22,226),(482,987)</box>" |
|
}, |
|
{ |
|
"id": 271, |
|
"question": "Fugui is <img>image_1</img>\n Qingtong is <img>image_2</img>\n In the image: <img>image_3</img>\n What is Fugui doing?", |
|
"prediction": "Fugui is embracing Qingtong." |
|
}, |
|
{ |
|
"id": 272, |
|
"question": "Yuechu is <img>image_1</img>\n Susu is <img>image_2</img>\n Describe the image: <img>image_3</img>\n", |
|
"prediction": "Yuechu is holding up a drawing next to Susu, who is pointing at the drawing. Both are standing in a room with warm lighting." |
|
}, |
|
{ |
|
"id": 273, |
|
"question": "Yuechu is <img>image_1</img>\n Susu is <img>image_2</img>\n In the image: <img>image_3</img>\n Give a description.", |
|
"prediction": "Yuechu is sitting on the ground, leaning over Susu who is lying down, seemingly injured. They are in a destroyed village with a dramatic red sky overhead." |
|
}, |
|
{ |
|
"id": 274, |
|
"question": "Aniya is <img>image_1</img>\n Fujie is <img>image_2</img>\n Yueer is <img>image_3</img>\n In the image: <img>image_4</img>\n Who is sitting on the chair?", |
|
"prediction": "Fujie is sitting on the chair." |
|
}, |
|
{ |
|
"id": 275, |
|
"question": "Aniya is <img>image_1</img>\n Fujie is <img>image_2</img>\n In the image: <img>image_3</img>\n What is Aniya doing?", |
|
"prediction": "Aniya is hiding behind a door." |
|
}, |
|
{ |
|
"id": 276, |
|
"question": "Aniya is <img>image_1</img>\n In the image: <img>image_2</img>\n Identify Aniya with grounding.", |
|
"prediction": "<ref>Aniya</ref><box>(102,376),(665,977)</box>" |
|
}, |
|
{ |
|
"id": 277, |
|
"question": "Fujie is <img>image_1</img>\n Yueer is <img>image_2</img>\n In the image: <img>image_3</img>\n What is Yueer doing?", |
|
"prediction": "Yueer is leaning over a couch towards Fujie." |
|
}, |
|
{ |
|
"id": 278, |
|
"question": "Aniya is <img>image_1</img>\n Fujie is <img>image_2</img>\n Yueer is <img>image_3</img>\n In the image: <img>image_4</img>\n What does Yueer hold?", |
|
"prediction": "Yueer holds a picnic basket." |
|
}, |
|
{ |
|
"id": 279, |
|
"question": "Aniya is <img>image_1</img>\n Fujie is <img>image_2</img>\n Yueer is <img>image_3</img>\n Descirbe the image: <img>image_4</img>\n", |
|
"prediction": "Aniya is standing on the left with a shopping bag, Fujie is on the right holding a gift, and Yueer is in the center with a bag of items. They are posing against a striped background with a decorative border." |
|
}, |
|
{ |
|
"id": 280, |
|
"question": "Aniya is <img>image_1</img>\n Fujie is <img>image_2</img>\n Yueer is <img>image_3</img>\n In the image: <img>image_4</img>\n Who is near the window?", |
|
"prediction": "Fujie is near the window." |
|
}, |
|
{ |
|
"id": 281, |
|
"question": "Fujie is <img>image_1</img>\n Yueer is <img>image_2</img>\n In the image: <img>image_3</img>\n Describe Yueer's outfit.", |
|
"prediction": "Yueer is wearing a blue dress with a yellow floral hat." |
|
}, |
|
{ |
|
"id": 282, |
|
"question": "Aniya is <img>image_1</img>\n Fujie is <img>image_2</img>\n Yueer is <img>image_3</img>\n In the image: <img>image_4</img>\n Give a description.", |
|
"prediction": "Aniya is seated on the floor, leaning against a wall with a book in hand. Fujie is sitting on a sofa, reading a document. Yueer is kneeling on the floor, looking at a book. They are in a cozy living room." |
|
}, |
|
{ |
|
"id": 283, |
|
"question": "Aniya is <img>image_1</img>\n Fujie is <img>image_2</img>\n Yueer is <img>image_3</img>\n What do you see in the image: <img>image_4</img>\n", |
|
"prediction": "Aniya is sitting on the lap of Fujie, who is also sitting, while Yueer stands to the side. They are all against a backdrop of a clear sky with some clouds." |
|
}, |
|
{ |
|
"id": 284, |
|
"question": "Fujie is <img>image_1</img>\n Yueer is <img>image_2</img>\n Beiji is <img>image_3</img>\n In the image: <img>image_4</img>\n Give a description.", |
|
"prediction": "Fujie is seated on a couch with a surprised expression, while Yueer is standing next to her, appearing to comfort her. Beiji is seated on the floor, slightly away from the others. The room has a cozy, lived-in atmosphere." |
|
}, |
|
{ |
|
"id": 285, |
|
"question": "Aniya is <img>image_1</img>\n Fujie is <img>image_2</img>\n Provide a description of the image: <img>image_3</img>\n", |
|
"prediction": "Aniya is lying on a surfboard in the water, while Fujie is balancing on the surfboard's nose, holding a wooden board." |
|
}, |
|
{ |
|
"id": 286, |
|
"question": "Aniya is <img>image_1</img>\n Fujie is <img>image_2</img>\n Yueer is <img>image_3</img>\n In the image: <img>image_4</img>\n What expression is on Yueer's face?", |
|
"prediction": "Yueer is smiling with her eyes closed." |
|
}, |
|
{ |
|
"id": 287, |
|
"question": "Aniya is <img>image_1</img>\n Cizi is <img>image_2</img>\n In the image: <img>image_3</img>\n What is Cizi's emotion?", |
|
"prediction": "Cizi is feeling angry." |
|
}, |
|
{ |
|
"id": 288, |
|
"question": "Aniya is <img>image_1</img>\n Fujie is <img>image_2</img>\n In the image: <img>image_3</img>\n Give a description.", |
|
"prediction": "Aniya is lying in bed, seemingly asleep, while Fujie is bending over, looking at a clock." |
|
}, |
|
{ |
|
"id": 289, |
|
"question": "Aniya is <img>image_1</img>\n Fujie is <img>image_2</img>\n Yueer is <img>image_3</img>\n In the image: <img>image_4</img>\n What is Fujie doing?", |
|
"prediction": "Fujie is sitting on a chair with his legs crossed." |
|
}, |
|
{ |
|
"id": 290, |
|
"question": "Aniya is <img>image_1</img>\n Fujie is <img>image_2</img>\n In the image: <img>image_3</img>\n Describe the content.", |
|
"prediction": "Aniya is seated at a table, focused on writing in her notebook. Fujie stands behind her, leaning over to closely examine the papers on the table. They are in a room with a vintage aesthetic, featuring a redwood cabinet and a CRT television." |
|
}, |
|
{ |
|
"id": 291, |
|
"question": "Aniya is <img>image_1</img>\n Beiji is <img>image_2</img>\n Cizi is <img>image_3</img>\n In the image: <img>image_4</img>\n Identify Cizi with grounding.", |
|
"prediction": "<ref>Cizi</ref><box>(322,291),(546,994)</box>" |
|
}, |
|
{ |
|
"id": 292, |
|
"question": "Aniya is <img>image_1</img>\n Fujie is <img>image_2</img>\n Yueer is <img>image_3</img>\n In the image: <img>image_4</img>\n Whose arms is Aniya in?", |
|
"prediction": "Aniya is in Fujie's arms." |
|
}, |
|
{ |
|
"id": 293, |
|
"question": "Aniya is <img>image_1</img>\n Fujie is <img>image_2</img>\n Yueer is <img>image_3</img>\n In the image: <img>image_4</img>\n Give a description.", |
|
"prediction": "Aniya is standing on one foot with a stretched arm, facing a smaller Yueer who is bending forward with a surprised expression. Fujie is partially visible on the right edge, looking towards Aniya and Yueer. They are in a cozy living room." |
|
}, |
|
{ |
|
"id": 294, |
|
"question": "Ranbing is <img>image_1</img>\n In the image: <img>image_2</img>\n Identify Ranbing with grounding.", |
|
"prediction": "<ref>Ranbing</ref><box>(189,296),(350,952)</box>" |
|
}, |
|
{ |
|
"id": 295, |
|
"question": "Make is <img>image_1</img>\n Ranbing is <img>image_2</img>\n In the image: <img>image_3</img>\n Give a description.", |
|
"prediction": "Ranbing, dressed as a bride, stands to the left, facing a man identified as Make, who is dressed in a suit on the right. They appear to be at a wedding ceremony with guests in the background." |
|
}, |
|
{ |
|
"id": 296, |
|
"question": "Ailika is <img>image_1</img>\n In the image: <img>image_2</img>\n What is Ailika doing?", |
|
"prediction": "Ailika is sitting in a vehicle with her arm raised." |
|
}, |
|
{ |
|
"id": 297, |
|
"question": "Baiyuekui is <img>image_1</img>\n Xiadou is <img>image_2</img>\n In the image: <img>image_3</img>\n Identify Xiadou with grounding.", |
|
"prediction": "<ref>Xiadou</ref><box>(465,209),(642,831)</box>" |
|
}, |
|
{ |
|
"id": 298, |
|
"question": "Hongkou is <img>image_1</img>\n In the image: <img>image_2</img>\n What is Hongkou doing?", |
|
"prediction": "Hongkou is standing and holding a weapon with a soldier." |
|
}, |
|
{ |
|
"id": 299, |
|
"question": "Chengxiaoshi is <img>image_1</img>\n Luguang is <img>image_2</img>\n Qiaoling is <img>image_3</img>\n In the image: <img>image_4</img>\n Identify Chengxiaoshi with grounding.", |
|
"prediction": "<ref>Chengxiaoshi</ref><box>(282,188),(492,887)</box>" |
|
}, |
|
{ |
|
"id": 300, |
|
"question": "Chengxiaoshi is <img>image_1</img>\n Qiaoling is <img>image_2</img>\n In the image: <img>image_3</img>\n Give a description.", |
|
"prediction": "Chengxiaoshi stands with his hands behind his head, looking upwards, while Qiaoling sits turned away, appearing to be in conversation with him." |
|
}, |
|
{ |
|
"id": 301, |
|
"question": "Chengxiaoshi is <img>image_1</img>\n Luguang is <img>image_2</img>\n Qiaoling is <img>image_3</img>\n In the image: <img>image_4</img>\n Who is opening the door?", |
|
"prediction": "Qiaoling is opening the door." |
|
}, |
|
{ |
|
"id": 302, |
|
"question": "Chengxiaoshi is <img>image_1</img>\n Luguang is <img>image_2</img>\n In the image: <img>image_3</img>\n What is Chengxiaoshi doing?", |
|
"prediction": "Chengxiaoshi is holding a phone and looking at it with Luguang." |
|
}, |
|
{ |
|
"id": 303, |
|
"question": "Luguang is <img>image_1</img>\n Qiaoling is <img>image_2</img>\n In the image: <img>image_3</img>\n Identify Luguang with grounding.", |
|
"prediction": "<ref>Luguang</ref><box>(37,102),(403,984)</box>" |
|
}, |
|
{ |
|
"id": 304, |
|
"question": "Cody is <img>image_1</img>\n May is <img>image_2</img>\n In the image: <img>image_3</img>\n Identify May with grounding.", |
|
"prediction": "<ref>May</ref><box>(150,184),(422,934)</box>" |
|
}, |
|
{ |
|
"id": 305, |
|
"question": "Cody is <img>image_1</img>\n May is <img>image_2</img>\n In the image: <img>image_3</img>\n What is Cody doing?", |
|
"prediction": "Cody is holding a large hammer and appears to be in a fighting stance." |
|
}, |
|
{ |
|
"id": 306, |
|
"question": "Cody is <img>image_1</img>\n May is <img>image_2</img>\n In the image: <img>image_3</img>\n Who is carrying the red magnet?", |
|
"prediction": "Cody is carrying the red magnet." |
|
}, |
|
{ |
|
"id": 307, |
|
"question": "Bob parr is <img>image_1</img>\n Elastigirl is <img>image_2</img>\n Dashiell is <img>image_3</img>\n Violet parr is <img>image_4</img>\n In the image: <img>image_5</img>\n Identify Elastigirl with grounding.", |
|
"prediction": "<ref>Elastigirl</ref><box>(626,129),(983,958)</box>" |
|
}, |
|
{ |
|
"id": 308, |
|
"question": "Elastigirl is <img>image_1</img>\n Dashiell is <img>image_2</img>\n Violet parr is <img>image_3</img>\n Jack-jack parr is <img>image_4</img>\n In the image: <img>image_5</img>\n Who is holding Jack-jack in arms?", |
|
"prediction": "Violet Parr is holding Jack-jack in arms." |
|
}, |
|
{ |
|
"id": 309, |
|
"question": "Bob parr is <img>image_1</img>\n Dashiell is <img>image_2</img>\n Violet parr is <img>image_3</img>\n In the image: <img>image_4</img>\n Identify Violet parr with grounding.", |
|
"prediction": "<ref>Violet parr</ref><box>(757,341),(982,988)</box>" |
|
}, |
|
{ |
|
"id": 310, |
|
"question": "Elastigirl is <img>image_1</img>\n Jack-jack parr is <img>image_2</img>\n In the image: <img>image_3</img>\n Give a description.", |
|
"prediction": "Elastigirl is standing behind JackJack Parr, who is sitting in a sink filled with bubbles. She is washing his hair. There's a window showing a view of a house in the background." |
|
}, |
|
{ |
|
"id": 311, |
|
"question": "Elastigirl is <img>image_1</img>\n Dashiell is <img>image_2</img>\n Jack-jack parr is <img>image_3</img>\n In the image: <img>image_4</img>\n What is Dashiell doing?", |
|
"prediction": "Dashiell is sitting at the table with his mouth full." |
|
}, |
|
{ |
|
"id": 312, |
|
"question": "Bob parr is <img>image_1</img>\n Elastigirl is <img>image_2</img>\n Dashiell is <img>image_3</img>\n Violet parr is <img>image_4</img>\n Jack-jack parr is <img>image_5</img>\n In the image: <img>image_6</img>\n Identify Bob parr with grounding.", |
|
"prediction": "<ref>Bob parr</ref><box>(116,41),(367,950)</box>" |
|
}, |
|
{ |
|
"id": 313, |
|
"question": "Bob parr is <img>image_1</img>\n/img>\n In the image: <img>image_2</img>\n What is Bob parr doing?", |
|
"prediction": "Bob parr is pouring a drink." |
|
}, |
|
{ |
|
"id": 314, |
|
"question": "Bob parr is <img>image_1</img>\n Elastigirl is <img>image_2</img>\n Jack-jack parr is <img>image_3</img>\n In the image: <img>image_4</img>\n Give a description.", |
|
"prediction": "Elastigirl is seated on a red motorcycle, looking to her left. Bob Parr stands beside the motorcycle, facing forward. Jack-Jack Parr is seated on the back of the motorcycle, holding onto the motorcycle's handlebars." |
|
}, |
|
{ |
|
"id": 315, |
|
"question": "Woody is <img>image_1</img>\n Jessie is <img>image_2</img>\n In the image: <img>image_3</img>\n Identify Jessie with grounding.", |
|
"prediction": "<ref>Jessie</ref><box>(15,25),(525,988)</box>" |
|
}, |
|
{ |
|
"id": 316, |
|
"question": "Buzz is <img>image_1</img>\n Jessie is <img>image_2</img>\n In the image: <img>image_3</img>\n Give a description.", |
|
"prediction": "Buzz Lightyear is playfully pushing Jessie on the floor, both characters dressed as toy action figures." |
|
}, |
|
{ |
|
"id": 317, |
|
"question": "Woody is <img>image_1</img>\n Jessie is <img>image_2</img>\n Describe the content of the image: <img>image_3</img>\n", |
|
"prediction": "Woody and Jessie are standing close together, facing each other with a backdrop of a brightly lit stage." |
|
}, |
|
{ |
|
"id": 318, |
|
"question": "Woody is <img>image_1</img>\n Buzz is <img>image_2</img>\n Lotso is <img>image_3</img>\n In the image: <img>image_4</img>\n Identify Woody with grounding.", |
|
"prediction": "<ref>Woody</ref><box>(795,89),(942,820)</box>" |
|
}, |
|
{ |
|
"id": 319, |
|
"question": "Woody is <img>image_1</img>\n Buzz is <img>image_2</img>\n Jessie is <img>image_3</img>\n In the image: <img>image_4</img>\n Who is Buzz looking at?", |
|
"prediction": "Buzz is looking at Woody." |
|
}, |
|
{ |
|
"id": 320, |
|
"question": "Betty is <img>image_1</img>\n In the image: <img>image_2</img>\n Identify Betty with grounding.", |
|
"prediction": "<ref>Betty</ref><box>(489,106),(898,869)</box>" |
|
}, |
|
{ |
|
"id": 321, |
|
"question": "Woody is <img>image_1</img>\n Buzz is <img>image_2</img>\n In the image: <img>image_3</img>\n Which hand of the boy is Buzz in?", |
|
"prediction": "Buzz is in the boy's right hand." |
|
}, |
|
{ |
|
"id": 322, |
|
"question": "Woody is <img>image_1</img>\n Buzz is <img>image_2</img>\n In the image: <img>image_3</img>\n What is Woody doing?", |
|
"prediction": "Woody is standing with his back facing the camera." |
|
}, |
|
{ |
|
"id": 323, |
|
"question": "Buzz is <img>image_1</img>\n Jessie is <img>image_2</img>\n Rex is <img>image_3</img>\n In the image: <img>image_4</img>\n Who is being pressed at the bottom?", |
|
"prediction": "Rex is being pressed at the bottom." |
|
}, |
|
{ |
|
"id": 324, |
|
"question": "Woody is <img>image_1</img>\n Buzz is <img>image_2</img>\n Jessie is <img>image_3</img>\n In the image: <img>image_4</img>\n Give a description.", |
|
"prediction": "Woody stands on the left with a concerned expression, Buzz is in the center looking to his left, and Jessie is on the right, all facing forward. They are surrounded by various toy characters in a colorful room." |
|
}, |
|
{ |
|
"id": 325, |
|
"question": "Woody is <img>image_1</img>\n Buzz is <img>image_2</img>\n Describe the image: <img>image_3</img>\n", |
|
"prediction": "Woody, wearing a cowboy hat and plaid shirt, is standing with one hand on his head, looking surprised. Buzz, in a green and purple space suit, is standing with one hand outstretched as if pointing or holding something. They appear to be in a colorful room filled with toys." |
|
}, |
|
{ |
|
"id": 326, |
|
"question": "Woody is <img>image_1</img>\n Buzz is <img>image_2</img>\n Bo peep is <img>image_3</img>\n In the image: <img>image_4</img>\n What is Bo peep doing?", |
|
"prediction": "Bo peep is hugging Buzz Lightyear." |
|
}, |
|
{ |
|
"id": 327, |
|
"question": "Woody is <img>image_1</img>\n Bo peep is <img>image_2</img>\n In the image: <img>image_3</img>\n Give a description.", |
|
"prediction": "Woody is lying on the ground, and Bo Peep is sitting on his lap, both positioned on grass under a structure with wooden beams." |
|
}, |
|
{ |
|
"id": 328, |
|
"question": "Woody is <img>image_1</img>\n Buzz is <img>image_2</img>\n Please give a summary of the image: <img>image_3</img>\n", |
|
"prediction": "Woody is seated on the left with his arm resting on a red couch, while Buzz is on the right with his arms spread wide, both against a backdrop of a vibrant alien landscape." |
|
}, |
|
{ |
|
"id": 329, |
|
"question": "Woody is <img>image_1</img>\n Buzz is <img>image_2</img>\n Jessie is <img>image_3</img>\n Rex is <img>image_4</img>\n In the image: <img>image_5</img>\n Identify Rex with grounding.", |
|
"prediction": "<ref>Rex</ref><box>(772,348),(982,828)</box>" |
|
}, |
|
{ |
|
"id": 330, |
|
"question": "Woody is <img>image_1</img>\n Buzz is <img>image_2</img>\n Jessie is <img>image_3</img>\n Bo peep is <img>image_4</img>\n In the image: <img>image_5</img>\n Who is on the right of Bo peep?", |
|
"prediction": "Woody is on the right of Bo peep." |
|
}, |
|
{ |
|
"id": 331, |
|
"question": "Fuheihui is <img>image_1</img>\n Qiangwei is <img>image_2</img>\n Wutiaowu is <img>image_3</img>\n Qihai is <img>image_4</img>\n In the image: <img>image_5</img>\n Identify Fuheihui with grounding.", |
|
"prediction": "<ref>Fuheihui</ref><box>(388,108),(907,991)</box>" |
|
}, |
|
{ |
|
"id": 332, |
|
"question": "Lizi is <img>image_1</img>\n In the image: <img>image_2</img>\n What is Lizi doing?", |
|
"prediction": "Lizi is standing with her hands on her hips." |
|
}, |
|
{ |
|
"id": 333, |
|
"question": "Wutiaowu is <img>image_1</img>\n Xiayoujie is <img>image_2</img>\n In the image: <img>image_3</img>\n Give a description.", |
|
"prediction": "Wutiaowu stands on the left, facing right, dressed in a dark suit with a badge on the left side. Xiayoujie stands on the right, facing left, also in a dark suit with a badge on the right side. They appear to be conversing with a cityscape in the background." |
|
}, |
|
{ |
|
"id": 334, |
|
"question": "Wutiaowu is <img>image_1</img>\n Lizi is <img>image_2</img>\n In the image: <img>image_3</img>\n What is Wutiaowu doing?", |
|
"prediction": "Wutiaowu is sitting and embracing Lizi." |
|
}, |
|
{ |
|
"id": 335, |
|
"question": "Wutiaowu is <img>image_1</img>\n Xiayoujie is <img>image_2</img>\n In the image: <img>image_3</img>\n What is Xiayoujie's expression?", |
|
"prediction": "Xiayoujie looks surprised or in a state of disbelief." |
|
}, |
|
{ |
|
"id": 336, |
|
"question": "Huzhang is <img>image_1</img>\n Fuheihui is <img>image_2</img>\n Qiangwei is <img>image_3</img>\n Wutiaowu is <img>image_4</img>\n In the image: <img>image_5</img>\n Who is sitting on the sofa?", |
|
"prediction": "Huzhang is sitting on the sofa." |
|
}, |
|
{ |
|
"id": 337, |
|
"question": "Dongtang is <img>image_1</img>\n Zhenren is <img>image_2</img>\n In the image: <img>image_3</img>\n What is Zhenren doing?", |
|
"prediction": "Zhenren is dodging an attack." |
|
}, |
|
{ |
|
"id": 338, |
|
"question": "Huzhang is <img>image_1</img>\n Fuheihui is <img>image_2</img>\n Goujuan is <img>image_3</img>\n In the image: <img>image_4</img>\n Give a description.", |
|
"prediction": "Huzhang is on the right, gesturing with both hands near his face. Fuheihui is in the middle, partially obscured and also making a hand gesture. Goujuan is on the left, also making a hand gesture with his fingers. They are all wearing baseball jerseys." |
|
}, |
|
{ |
|
"id": 339, |
|
"question": "Xiayoujie is <img>image_1</img>\n In the image: <img>image_2</img>\n What is Xiayoujie doing?", |
|
"prediction": "Xiayoujie is sitting and reading a book." |
|
}, |
|
{ |
|
"id": 340, |
|
"question": "Qihai is <img>image_1</img>\n In the image: <img>image_2</img>\n Identify Qihai with grounding.", |
|
"prediction": "<ref>Qihai</ref><box>(156,229),(600,986)</box>" |
|
}, |
|
{ |
|
"id": 341, |
|
"question": "Huzhang is <img>image_1</img>\n Mingming is <img>image_2</img>\n In the image: <img>image_3</img>\n Identify Mingming with grounding.", |
|
"prediction": "<ref>Mingming</ref><box>(425,147),(582,848)</box>" |
|
}, |
|
{ |
|
"id": 342, |
|
"question": "Louhu is <img>image_1</img>\n In the image: <img>image_2</img>\n Identify Louhu with grounding.", |
|
"prediction": "<ref>Louhu</ref><box>(264,226),(567,983)</box>" |
|
}, |
|
{ |
|
"id": 343, |
|
"question": "Fuheihui is <img>image_1</img>\n Qiangwei is <img>image_2</img>\n In the image: <img>image_3</img>\n Identify Qiangwei with grounding.", |
|
"prediction": "<ref>Qiangwei</ref><box>(96,129),(447,986)</box>" |
|
}, |
|
{ |
|
"id": 344, |
|
"question": "Huzhang is <img>image_1</img>\n Louhu is <img>image_2</img>\n Give a content description of the image: <img>image_3</img>\n", |
|
"prediction": "Louhu, wearing a spotted jacket, is standing and appears to be in a conversation with Huzhang, who is sitting down wearing a red jacket." |
|
}, |
|
{ |
|
"id": 345, |
|
"question": "Wutiaowu is <img>image_1</img>\n Xiayoujie is <img>image_2</img>\n In the image: <img>image_3</img>\n What does Wutiaowu wear?", |
|
"prediction": "Wutiaowu wears a red jacket with black pants." |
|
}, |
|
{ |
|
"id": 346, |
|
"question": "Wutiaowu is <img>image_1</img>\n Shener is <img>image_2</img>\n In the image: <img>image_3</img>\n Give a description.", |
|
"prediction": "Wutiaowu is engaged in a combat stance with Shener, both characters appear to be in a tense altercation under a red torii gate." |
|
}, |
|
{ |
|
"id": 347, |
|
"question": "Wutiaowu is <img>image_1</img>\n Xiayoujie is <img>image_2</img>\n Lizi is <img>image_3</img>\n In the image: <img>image_4</img>\n Identify Xiayoujie with grounding.", |
|
"prediction": "<ref>Xiayoujie</ref><box>(785,101),(998,979)</box>" |
|
}, |
|
{ |
|
"id": 348, |
|
"question": "Huzhang is <img>image_1</img>\n Qiangwei is <img>image_2</img>\n In the image: <img>image_3</img>\n Give a description.", |
|
"prediction": "Huzhang, on the right, is facing left, seemingly talking to Qiangwei, who is on the left with her back partially turned towards the viewer. Both are in a dimly lit room with pipes in the background." |
|
}, |
|
{ |
|
"id": 349, |
|
"question": "Huzhang is <img>image_1</img>\n Fuheihui is <img>image_2</img>\n Qiangwei is <img>image_3</img>\n Please explain what's happening in the photo: <img>image_4</img>\n", |
|
"prediction": "Huzhang, with pink hair and a red scarf, stands on the left. \nFuheihui, wearing a navy uniform with a purple collar, is on the right. \nQiangwei, with short brown hair and a navy uniform, is partially visible between them." |
|
}, |
|
{ |
|
"id": 350, |
|
"question": "Huzhang is <img>image_1</img>\n Fuheihui is <img>image_2</img>\n Qiangwei is <img>image_3</img>\n In the image: <img>image_4</img>\n Identify Huzhang with grounding.", |
|
"prediction": "<ref>Huzhang</ref><box>(150,108),(600,986)</box>" |
|
}, |
|
{ |
|
"id": 351, |
|
"question": "Ningguang is <img>image_1</img>\n Beidou is <img>image_2</img>\n In the image: <img>image_3</img>\n Give a description.", |
|
"prediction": "Ningguang, with white hair and a golden armor, stands to the left, while Beidou, in a red outfit with black boots, is seated to the right across a table in a forest setting." |
|
}, |
|
{ |
|
"id": 352, |
|
"question": "Zhongli is <img>image_1</img>\n Leishen is <img>image_2</img>\n Funingna is <img>image_3</img>\n In the image: <img>image_4</img>\n Identify Leishen with grounding.", |
|
"prediction": "<ref>Leishen</ref><box>(562,214),(802,994)</box>" |
|
}, |
|
{ |
|
"id": 353, |
|
"question": "Hutao is <img>image_1</img>\n Yelan is <img>image_2</img>\n Xiao is <img>image_3</img>\n In the image: <img>image_4</img>\n What is Xiao doing?", |
|
"prediction": "Xiao is holding a sword with both hands." |
|
}, |
|
{ |
|
"id": 354, |
|
"question": "Linghua is <img>image_1</img>\n Lingren is <img>image_2</img>\n In the image: <img>image_3</img>\n What is in Lingren's hand?", |
|
"prediction": "Lingren is holding a teapot." |
|
}, |
|
{ |
|
"id": 355, |
|
"question": "Wulang is <img>image_1</img>\n In the image: <img>image_2</img>\n Identify Wulang with grounding.", |
|
"prediction": "<ref>Wulang</ref><box>(265,175),(467,909)</box>" |
|
}, |
|
{ |
|
"id": 356, |
|
"question": "Abeiduo is <img>image_1</img>\n Kong is <img>image_2</img>\n In the image: <img>image_3</img>\n Who is holding a sword?", |
|
"prediction": "Kong is holding a sword." |
|
}, |
|
{ |
|
"id": 357, |
|
"question": "Diluke is <img>image_1</img>\n Qin is <img>image_2</img>\n In the image: <img>image_3</img>\n Identify Qin with grounding.", |
|
"prediction": "<ref>Qin</ref><box>(145,210),(358,972)</box>" |
|
}, |
|
{ |
|
"id": 358, |
|
"question": "Ningguang is <img>image_1</img>\n Kong is <img>image_2</img>\n Describe the image: <img>image_3</img>\n", |
|
"prediction": "Ningguang is sitting to the left, holding a torch, and Kong is seated to the right, both in front of a campfire." |
|
}, |
|
{ |
|
"id": 359, |
|
"question": "Keqing is <img>image_1</img>\n Ying is <img>image_2</img>\n Give a content description of the image: <img>image_3</img>\n", |
|
"prediction": "Keqing is on the left, wearing a purple gown with a cat ears headband, standing beside Ying, who is in a white and blue outfit with a curly hair braid. They are both looking forward, set against a sky background with clouds and mountains." |
|
}, |
|
{ |
|
"id": 360, |
|
"question": "Regina Lampert is <img>image_0</img>\n In the following four images, Which is Regina Lampert? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 1" |
|
}, |
|
{ |
|
"id": 361, |
|
"question": "Peter Joshua is <img>image_0</img>\n In the following four images, Which is Peter Joshua? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 3" |
|
}, |
|
{ |
|
"id": 362, |
|
"question": "Peter Joshua is <img>image_0</img>\n In the following four images, Which is Peter Joshua? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 1" |
|
}, |
|
{ |
|
"id": 363, |
|
"question": "Hamilton Bartholomew is <img>image_0</img>\n In the following four images, Which is Hamilton Bartholomew? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 1" |
|
}, |
|
{ |
|
"id": 364, |
|
"question": "Kazan is <img>image_0</img>\n In the following four images, Which is Kazan? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 3" |
|
}, |
|
{ |
|
"id": 365, |
|
"question": "Worth is <img>image_0</img>\n In the following four images, Which is Worth? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 4" |
|
}, |
|
{ |
|
"id": 366, |
|
"question": "Worth is <img>image_0</img>\n In the following four images, Which is Worth? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 2" |
|
}, |
|
{ |
|
"id": 367, |
|
"question": "Worth is <img>image_0</img>\n In the following four images, Which is Worth? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 2" |
|
}, |
|
{ |
|
"id": 368, |
|
"question": "Quentin is <img>image_0</img>\n In the following four images, Which is Quentin? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 1" |
|
}, |
|
{ |
|
"id": 369, |
|
"question": "Holloway is <img>image_0</img>\n In the following four images, Which is Holloway? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 1" |
|
}, |
|
{ |
|
"id": 370, |
|
"question": "Leaven is <img>image_0</img>\n In the following four images, Which is Leaven? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 4" |
|
}, |
|
{ |
|
"id": 371, |
|
"question": "Leaven is <img>image_0</img>\n In the following four images, Which is Leaven? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 4" |
|
}, |
|
{ |
|
"id": 372, |
|
"question": "Agent Fox Mulder is <img>image_0</img>\n In the following four images, Which is Agent Fox Mulder? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 2" |
|
}, |
|
{ |
|
"id": 373, |
|
"question": "Agent Dana Scully is <img>image_0</img>\n In the following four images, Which is Agent Dana Scully? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 3" |
|
}, |
|
{ |
|
"id": 374, |
|
"question": "Reed Richards is <img>image_0</img>\n In the following four images, Which is Reed Richards? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 2" |
|
}, |
|
{ |
|
"id": 375, |
|
"question": "Johnny Storm is <img>image_0</img>\n In the following four images, Which is Johnny Storm? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 1" |
|
}, |
|
{ |
|
"id": 376, |
|
"question": "Sue Storm is <img>image_0</img>\n In the following four images, Which is Sue Storm? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 4" |
|
}, |
|
{ |
|
"id": 377, |
|
"question": "Victor Von Doom is <img>image_0</img>\n In the following four images, Which is Victor Von Doom? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 1" |
|
}, |
|
{ |
|
"id": 378, |
|
"question": "Sharon is <img>image_0</img>\n In the following four images, Which is Sharon? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 4" |
|
}, |
|
{ |
|
"id": 379, |
|
"question": "Burke Dennings is <img>image_0</img>\n In the following four images, Which is Burke Dennings? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 1" |
|
}, |
|
{ |
|
"id": 380, |
|
"question": "Jen Yu (Mandarin version) is <img>image_0</img>\n In the following four images, Which is Jen Yu (Mandarin version)? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 4" |
|
}, |
|
{ |
|
"id": 381, |
|
"question": "Master Li Mu Bai is <img>image_0</img>\n In the following four images, Which is Master Li Mu Bai? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 1" |
|
}, |
|
{ |
|
"id": 382, |
|
"question": "Yu Shu Lien is <img>image_0</img>\n In the following four images, Which is Yu Shu Lien? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 1" |
|
}, |
|
{ |
|
"id": 383, |
|
"question": "Lo 'Dark Cloud' is <img>image_0</img>\n In the following four images, Which is Lo 'Dark Cloud'? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 1" |
|
}, |
|
{ |
|
"id": 384, |
|
"question": "Evan is <img>image_0</img>\n In the following four images, Which is Evan? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 2" |
|
}, |
|
{ |
|
"id": 385, |
|
"question": "Andrea is <img>image_0</img>\n In the following four images, Which is Andrea? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 3" |
|
}, |
|
{ |
|
"id": 386, |
|
"question": "Lenny is <img>image_0</img>\n In the following four images, Which is Lenny? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 3" |
|
}, |
|
{ |
|
"id": 387, |
|
"question": "Kayleigh is <img>image_0</img>\n In the following four images, Which is Kayleigh? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 1" |
|
}, |
|
{ |
|
"id": 388, |
|
"question": "antelope is <img>image_0</img>\n In the following four images, Which is antelope? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 1" |
|
}, |
|
{ |
|
"id": 389, |
|
"question": "appaloosa is <img>image_0</img>\n In the following four images, Which is appaloosa? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 2" |
|
}, |
|
{ |
|
"id": 390, |
|
"question": "arabiancamel is <img>image_0</img>\n In the following four images, Which is arabiancamel? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 3" |
|
}, |
|
{ |
|
"id": 391, |
|
"question": "asiancrocodile is <img>image_0</img>\n In the following four images, Which is asiancrocodile? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 4" |
|
}, |
|
{ |
|
"id": 392, |
|
"question": "belgianhare is <img>image_0</img>\n In the following four images, Which is belgianhare? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 3" |
|
}, |
|
{ |
|
"id": 393, |
|
"question": "bighorn is <img>image_0</img>\n In the following four images, Which is bighorn? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 3" |
|
}, |
|
{ |
|
"id": 394, |
|
"question": "bovine is <img>image_0</img>\n In the following four images, Which is bovine? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 4" |
|
}, |
|
{ |
|
"id": 395, |
|
"question": "cheetah is <img>image_0</img>\n In the following four images, Which is cheetah? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 2" |
|
}, |
|
{ |
|
"id": 396, |
|
"question": "cheviot is <img>image_0</img>\n In the following four images, Which is cheviot? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 1" |
|
}, |
|
{ |
|
"id": 397, |
|
"question": "dallsheep is <img>image_0</img>\n In the following four images, Which is dallsheep? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 1" |
|
}, |
|
{ |
|
"id": 398, |
|
"question": "elk is <img>image_0</img>\n In the following four images, Which is elk? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 2" |
|
}, |
|
{ |
|
"id": 399, |
|
"question": "forestgoat is <img>image_0</img>\n In the following four images, Which is forestgoat? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 1" |
|
}, |
|
{ |
|
"id": 400, |
|
"question": "The reference vehicle is <img>image_0</img>\n In the following four images, Which is the reference vehicle? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 3" |
|
}, |
|
{ |
|
"id": 401, |
|
"question": "The reference vehicle is <img>image_0</img>\n In the following four images, Which is the reference vehicle? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 3" |
|
}, |
|
{ |
|
"id": 402, |
|
"question": "The reference vehicle is <img>image_0</img>\n In the following four images, Which is the reference vehicle? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 1" |
|
}, |
|
{ |
|
"id": 403, |
|
"question": "The reference vehicle is <img>image_0</img>\n In the following four images, Which is the reference vehicle? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 2" |
|
}, |
|
{ |
|
"id": 404, |
|
"question": "The reference vehicle is <img>image_0</img>\n In the following four images, Which is the reference vehicle? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 1" |
|
}, |
|
{ |
|
"id": 405, |
|
"question": "The reference vehicle is <img>image_0</img>\n In the following four images, Which is the reference vehicle? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 1" |
|
}, |
|
{ |
|
"id": 406, |
|
"question": "The reference vehicle is <img>image_0</img>\n In the following four images, Which is the reference vehicle? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 1" |
|
}, |
|
{ |
|
"id": 407, |
|
"question": "The reference vehicle is <img>image_0</img>\n In the following four images, Which is the reference vehicle? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 1" |
|
}, |
|
{ |
|
"id": 408, |
|
"question": "The reference vehicle is <img>image_0</img>\n In the following four images, Which is the reference vehicle? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 3" |
|
}, |
|
{ |
|
"id": 409, |
|
"question": "The reference vehicle is <img>image_0</img>\n In the following four images, Which is the reference vehicle? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 1" |
|
}, |
|
{ |
|
"id": 410, |
|
"question": "Willem_Merkxtuin is <img>image_0</img>\n In the following four images, Which is Willem_Merkxtuin? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 4" |
|
}, |
|
{ |
|
"id": 411, |
|
"question": "Ch%C3%A2teau_de_Chenonceau is <img>image_0</img>\n In the following four images, Which is Ch%C3%A2teau_de_Chenonceau? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 4" |
|
}, |
|
{ |
|
"id": 412, |
|
"question": "Munshi_Ghat is <img>image_0</img>\n In the following four images, Which is Munshi_Ghat? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 3" |
|
}, |
|
{ |
|
"id": 413, |
|
"question": "Burg_Heidenreichstein is <img>image_0</img>\n In the following four images, Which is Burg_Heidenreichstein? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 3" |
|
}, |
|
{ |
|
"id": 414, |
|
"question": "Santa_Maria_in_Cappella_(Rome) is <img>image_0</img>\n In the following four images, Which is Santa_Maria_in_Cappella_(Rome)? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 1" |
|
}, |
|
{ |
|
"id": 415, |
|
"question": "%C3%89glise_Saint-Martin_(Laon) is <img>image_0</img>\n In the following four images, Which is %C3%89glise_Saint-Martin_(Laon)? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 4" |
|
}, |
|
{ |
|
"id": 416, |
|
"question": "Bizzell_Memorial_Library is <img>image_0</img>\n In the following four images, Which is Bizzell_Memorial_Library? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 4" |
|
}, |
|
{ |
|
"id": 417, |
|
"question": "Hiyoshi_Taisha is <img>image_0</img>\n In the following four images, Which is Hiyoshi_Taisha? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 3" |
|
}, |
|
{ |
|
"id": 418, |
|
"question": "Michelangelo's_Moses is <img>image_0</img>\n In the following four images, Which is Michelangelo's_Moses? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 2" |
|
}, |
|
{ |
|
"id": 419, |
|
"question": "%C4%BDubov%C5%88a_Castle is <img>image_0</img>\n In the following four images, Which is %C4%BDubov%C5%88a_Castle? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 3" |
|
}, |
|
{ |
|
"id": 420, |
|
"question": "Coll%C3%A9giale_Notre-Dame_de_Vernon is <img>image_0</img>\n In the following four images, Which is Coll%C3%A9giale_Notre-Dame_de_Vernon? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 2" |
|
}, |
|
{ |
|
"id": 421, |
|
"question": "Cathedral_of_Guadalajara,_Mexico is <img>image_0</img>\n In the following four images, Which is Cathedral_of_Guadalajara,_Mexico? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 3" |
|
}, |
|
{ |
|
"id": 422, |
|
"question": "Kankalini_Temple,_Saptari is <img>image_0</img>\n In the following four images, Which is Kankalini_Temple,_Saptari? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 3" |
|
}, |
|
{ |
|
"id": 423, |
|
"question": "Wat_Thewarat_Kunchon is <img>image_0</img>\n In the following four images, Which is Wat_Thewarat_Kunchon? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 3" |
|
}, |
|
{ |
|
"id": 424, |
|
"question": "Moszna_Castle is <img>image_0</img>\n In the following four images, Which is Moszna_Castle? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 3" |
|
}, |
|
{ |
|
"id": 425, |
|
"question": "Cathedral-Basilica_of_Mary,_Queen_of_the_World is <img>image_0</img>\n In the following four images, Which is Cathedral-Basilica_of_Mary,_Queen_of_the_World? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 3" |
|
}, |
|
{ |
|
"id": 426, |
|
"question": "Helsinki_Lutheran_Cathedral is <img>image_0</img>\n In the following four images, Which is Helsinki_Lutheran_Cathedral? Image 1: <img>image_1</img>\n Image 2: <img>image_2</img>\n Image 3: <img>image_3</img>\n Image 4: <img>image_4</img>\n", |
|
"prediction": "Image 2" |
|
} |
|
] |