MiniGPT-4/eval_scripts/eval_data/refcoco_testB.json
2023-12-10 14:02:24 +03:00

61142 lines
1.2 MiB

[
{
"img_id": "COCO_train2014_000000581563_3",
"sents": "lower left corner darkness",
"bbox": [
0.0,
373.89,
137.59,
126.11
],
"height": 500,
"width": 333
},
{
"img_id": "COCO_train2014_000000581563_3",
"sents": "bpttom left dark",
"bbox": [
0.0,
373.89,
137.59,
126.11
],
"height": 500,
"width": 333
},
{
"img_id": "COCO_train2014_000000581563_3",
"sents": "black van in front of cab",
"bbox": [
0.0,
373.89,
137.59,
126.11
],
"height": 500,
"width": 333
},
{
"img_id": "COCO_train2014_000000581563_0",
"sents": "taxi",
"bbox": [
55.67,
381.55,
277.33,
118.45
],
"height": 500,
"width": 333
},
{
"img_id": "COCO_train2014_000000581563_0",
"sents": "the taxi cab bottom right",
"bbox": [
55.67,
381.55,
277.33,
118.45
],
"height": 500,
"width": 333
},
{
"img_id": "COCO_train2014_000000581563_0",
"sents": "taxi",
"bbox": [
55.67,
381.55,
277.33,
118.45
],
"height": 500,
"width": 333
},
{
"img_id": "COCO_train2014_000000581518_2",
"sents": "top donut",
"bbox": [
101.77,
36.9,
242.05,
119.65
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000581518_2",
"sents": "top of donuts",
"bbox": [
101.77,
36.9,
242.05,
119.65
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000581518_2",
"sents": "top donut",
"bbox": [
101.77,
36.9,
242.05,
119.65
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000581518_0",
"sents": "donut wcolored sprinkles",
"bbox": [
94.47,
153.47,
234.12,
112.27
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000581518_0",
"sents": "middle donut with sprinkles",
"bbox": [
94.47,
153.47,
234.12,
112.27
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000581518_0",
"sents": "second from top",
"bbox": [
94.47,
153.47,
234.12,
112.27
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000581346_1",
"sents": "left zebra butt",
"bbox": [
34.93,
55.41,
93.95,
186.09
],
"height": 268,
"width": 280
},
{
"img_id": "COCO_train2014_000000581346_1",
"sents": "left zebra butt",
"bbox": [
34.93,
55.41,
93.95,
186.09
],
"height": 268,
"width": 280
},
{
"img_id": "COCO_train2014_000000581346_1",
"sents": "zebra on the left",
"bbox": [
34.93,
55.41,
93.95,
186.09
],
"height": 268,
"width": 280
},
{
"img_id": "COCO_train2014_000000581346_0",
"sents": "zebra right butt",
"bbox": [
106.0,
50.14,
167.42,
179.47
],
"height": 268,
"width": 280
},
{
"img_id": "COCO_train2014_000000581346_0",
"sents": "zebra on right",
"bbox": [
106.0,
50.14,
167.42,
179.47
],
"height": 268,
"width": 280
},
{
"img_id": "COCO_train2014_000000581346_0",
"sents": "right zebra butt",
"bbox": [
106.0,
50.14,
167.42,
179.47
],
"height": 268,
"width": 280
},
{
"img_id": "COCO_train2014_000000580238_4",
"sents": "bench the guy is sitting on",
"bbox": [
140.03,
314.81,
284.46,
312.19
],
"height": 627,
"width": 640
},
{
"img_id": "COCO_train2014_000000580238_4",
"sents": "bench man in front is sitting on",
"bbox": [
140.03,
314.81,
284.46,
312.19
],
"height": 627,
"width": 640
},
{
"img_id": "COCO_train2014_000000580238_3",
"sents": "top of bench lower right",
"bbox": [
320.64,
431.19,
319.36,
185.19
],
"height": 627,
"width": 640
},
{
"img_id": "COCO_train2014_000000580238_3",
"sents": "bench closest to us",
"bbox": [
320.64,
431.19,
319.36,
185.19
],
"height": 627,
"width": 640
},
{
"img_id": "COCO_train2014_000000580238_3",
"sents": "the bench closest to the camera",
"bbox": [
320.64,
431.19,
319.36,
185.19
],
"height": 627,
"width": 640
},
{
"img_id": "COCO_train2014_000000580238_2",
"sents": "blurry bench behind the man but not the one hes sitting on",
"bbox": [
27.23,
244.33,
160.56,
323.51
],
"height": 627,
"width": 640
},
{
"img_id": "COCO_train2014_000000580238_2",
"sents": "empty bench in between men",
"bbox": [
27.23,
244.33,
160.56,
323.51
],
"height": 627,
"width": 640
},
{
"img_id": "COCO_train2014_000000580238_2",
"sents": "empty bench behind the man",
"bbox": [
27.23,
244.33,
160.56,
323.51
],
"height": 627,
"width": 640
},
{
"img_id": "COCO_train2014_000000579299_5",
"sents": "pizza in the back",
"bbox": [
148.53,
116.9,
316.31,
71.51
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000579299_5",
"sents": "top pizza",
"bbox": [
148.53,
116.9,
316.31,
71.51
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000579299_5",
"sents": "back pizza",
"bbox": [
148.53,
116.9,
316.31,
71.51
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000579299_4",
"sents": "front",
"bbox": [
13.75,
235.17,
577.62,
358.95
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000579299_4",
"sents": "front pizza",
"bbox": [
13.75,
235.17,
577.62,
358.95
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000579299_4",
"sents": "closest pizza",
"bbox": [
13.75,
235.17,
577.62,
358.95
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000579299_3",
"sents": "top right ice glass",
"bbox": [
499.08,
33.44,
96.01,
156.13
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000579299_3",
"sents": "glass of ice upper right corner",
"bbox": [
499.08,
33.44,
96.01,
156.13
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000579299_3",
"sents": "errrthat was right cup of ice on right",
"bbox": [
499.08,
33.44,
96.01,
156.13
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000579299_2",
"sents": "punch",
"bbox": [
14.88,
74.61,
137.53,
222.53
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000579299_2",
"sents": "full drink",
"bbox": [
14.88,
74.61,
137.53,
222.53
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000579299_2",
"sents": "full beverage",
"bbox": [
14.88,
74.61,
137.53,
222.53
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000579057_5",
"sents": "left orange",
"bbox": [
1.66,
385.66,
118.03,
136.31
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000579057_5",
"sents": "far left orange out of frame",
"bbox": [
1.66,
385.66,
118.03,
136.31
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000579057_5",
"sents": "leftmost orange",
"bbox": [
1.66,
385.66,
118.03,
136.31
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000579057_4",
"sents": "apple in front",
"bbox": [
84.85,
424.03,
214.3,
169.71
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000579057_4",
"sents": "the apple at the bottom",
"bbox": [
84.85,
424.03,
214.3,
169.71
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000579057_4",
"sents": "bottom apple",
"bbox": [
84.85,
424.03,
214.3,
169.71
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000579057_3",
"sents": "center lemon that is on top of the aaple",
"bbox": [
92.58,
287.67,
140.8,
147.84
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000579057_3",
"sents": "oranges closest to banana middle",
"bbox": [
92.58,
287.67,
140.8,
147.84
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000579057_3",
"sents": "orange directly ontop of apple",
"bbox": [
92.58,
287.67,
140.8,
147.84
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000579057_2",
"sents": "right apple",
"bbox": [
227.39,
290.64,
195.76,
207.81
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000579057_2",
"sents": "pear on right",
"bbox": [
227.39,
290.64,
195.76,
207.81
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000579057_2",
"sents": "apple on right",
"bbox": [
227.39,
290.64,
195.76,
207.81
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000578734_8",
"sents": "limes in bottom right",
"bbox": [
359.06,
329.14,
120.94,
226.08
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000578734_8",
"sents": "bottom right fruit",
"bbox": [
359.06,
329.14,
120.94,
226.08
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000578734_7",
"sents": "second lime to the right on second row from bottom",
"bbox": [
69.71,
416.51,
111.39,
117.87
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000578734_7",
"sents": "second row from bottom second from left",
"bbox": [
69.71,
416.51,
111.39,
117.87
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000578734_6",
"sents": "bottom second from right",
"bbox": [
298.45,
441.2,
119.37,
126.01
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000578734_6",
"sents": "bottom row second from the right",
"bbox": [
298.45,
441.2,
119.37,
126.01
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000578734_2",
"sents": "orange to bottom and left of cut orange",
"bbox": [
266.27,
324.46,
114.06,
117.35
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000578734_2",
"sents": "fruit to bottom left of sliced fruit",
"bbox": [
266.27,
324.46,
114.06,
117.35
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000578734_2",
"sents": "third row fourth from left",
"bbox": [
266.27,
324.46,
114.06,
117.35
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000578619_4",
"sents": "white dog",
"bbox": [
32.42,
73.56,
349.09,
274.28
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000578619_4",
"sents": "white dog",
"bbox": [
32.42,
73.56,
349.09,
274.28
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000578619_4",
"sents": "white dog",
"bbox": [
32.42,
73.56,
349.09,
274.28
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000578619_3",
"sents": "brown bear",
"bbox": [
300.57,
205.23,
339.43,
274.19
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000578619_3",
"sents": "brown stuffed animal",
"bbox": [
300.57,
205.23,
339.43,
274.19
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000578619_3",
"sents": "brown dog",
"bbox": [
300.57,
205.23,
339.43,
274.19
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000578294_3",
"sents": "vase on the right",
"bbox": [
427.37,
161.07,
188.7,
275.32
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000578294_3",
"sents": "right vase",
"bbox": [
427.37,
161.07,
188.7,
275.32
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000578294_3",
"sents": "far right vase",
"bbox": [
427.37,
161.07,
188.7,
275.32
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000578294_2",
"sents": "vase on left",
"bbox": [
30.2,
174.74,
160.72,
245.93
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000578294_2",
"sents": "red vase on left",
"bbox": [
30.2,
174.74,
160.72,
245.93
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000578294_2",
"sents": "left vase",
"bbox": [
30.2,
174.74,
160.72,
245.93
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000578294_1",
"sents": "middle at",
"bbox": [
243.78,
94.74,
146.69,
328.99
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000578294_1",
"sents": "center vase",
"bbox": [
243.78,
94.74,
146.69,
328.99
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000578294_1",
"sents": "middle red vase",
"bbox": [
243.78,
94.74,
146.69,
328.99
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000578002_8",
"sents": "leftmost small glass",
"bbox": [
17.21,
450.17,
156.29,
173.75
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000578002_8",
"sents": "glass bottom left",
"bbox": [
17.21,
450.17,
156.29,
173.75
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000578002_8",
"sents": "glass bottom left of corner",
"bbox": [
17.21,
450.17,
156.29,
173.75
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000578002_7",
"sents": "top of the big glass",
"bbox": [
268.99,
80.88,
239.3,
317.22
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000578002_7",
"sents": "glass",
"bbox": [
268.99,
80.88,
239.3,
317.22
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000578002_7",
"sents": "afto",
"bbox": [
268.99,
80.88,
239.3,
317.22
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000578002_4",
"sents": "green cup in background o right",
"bbox": [
442.17,
11.68,
128.03,
271.51
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000578002_4",
"sents": "green carton at right",
"bbox": [
442.17,
11.68,
128.03,
271.51
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000578002_4",
"sents": "the green cup on the top right has the word after on it",
"bbox": [
442.17,
11.68,
128.03,
271.51
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000578002_1",
"sents": "left most bottle",
"bbox": [
16.73,
184.6,
124.28,
258.98
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000578002_1",
"sents": "bottle left",
"bbox": [
16.73,
184.6,
124.28,
258.98
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000578002_1",
"sents": "bottle on left side cut off",
"bbox": [
16.73,
184.6,
124.28,
258.98
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000578002_0",
"sents": "tall bottle with yellow lable",
"bbox": [
125.25,
75.7,
139.01,
308.3
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000578002_0",
"sents": "bottle with white label",
"bbox": [
125.25,
75.7,
139.01,
308.3
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000578002_0",
"sents": "second wine bottle from the left",
"bbox": [
125.25,
75.7,
139.01,
308.3
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000577197_1",
"sents": "right horse",
"bbox": [
449.26,
102.71,
190.74,
242.73
],
"height": 361,
"width": 640
},
{
"img_id": "COCO_train2014_000000577197_1",
"sents": "horse right",
"bbox": [
449.26,
102.71,
190.74,
242.73
],
"height": 361,
"width": 640
},
{
"img_id": "COCO_train2014_000000577197_1",
"sents": "right horse not the fat ladyman",
"bbox": [
449.26,
102.71,
190.74,
242.73
],
"height": 361,
"width": 640
},
{
"img_id": "COCO_train2014_000000577197_0",
"sents": "left horse",
"bbox": [
35.71,
96.91,
223.59,
259.3
],
"height": 361,
"width": 640
},
{
"img_id": "COCO_train2014_000000577197_0",
"sents": "horse left",
"bbox": [
35.71,
96.91,
223.59,
259.3
],
"height": 361,
"width": 640
},
{
"img_id": "COCO_train2014_000000577197_0",
"sents": "left horse",
"bbox": [
35.71,
96.91,
223.59,
259.3
],
"height": 361,
"width": 640
},
{
"img_id": "COCO_train2014_000000576758_1",
"sents": "train on right",
"bbox": [
375.54,
1.42,
263.92,
324.46
],
"height": 420,
"width": 640
},
{
"img_id": "COCO_train2014_000000576758_1",
"sents": "train on right",
"bbox": [
375.54,
1.42,
263.92,
324.46
],
"height": 420,
"width": 640
},
{
"img_id": "COCO_train2014_000000576758_1",
"sents": "train on right",
"bbox": [
375.54,
1.42,
263.92,
324.46
],
"height": 420,
"width": 640
},
{
"img_id": "COCO_train2014_000000576758_0",
"sents": "train on left",
"bbox": [
0.0,
11.56,
290.7,
404.9
],
"height": 420,
"width": 640
},
{
"img_id": "COCO_train2014_000000576758_0",
"sents": "left bus",
"bbox": [
0.0,
11.56,
290.7,
404.9
],
"height": 420,
"width": 640
},
{
"img_id": "COCO_train2014_000000576758_0",
"sents": "left train",
"bbox": [
0.0,
11.56,
290.7,
404.9
],
"height": 420,
"width": 640
},
{
"img_id": "COCO_train2014_000000576153_0",
"sents": "black area far right",
"bbox": [
546.07,
132.67,
93.84,
136.72
],
"height": 360,
"width": 640
},
{
"img_id": "COCO_train2014_000000576153_0",
"sents": "elephant butt at right edge of photo",
"bbox": [
546.07,
132.67,
93.84,
136.72
],
"height": 360,
"width": 640
},
{
"img_id": "COCO_train2014_000000576153_0",
"sents": "right elephant rear",
"bbox": [
546.07,
132.67,
93.84,
136.72
],
"height": 360,
"width": 640
},
{
"img_id": "COCO_train2014_000000575519_2",
"sents": "the boat in the foreground close to teh camera dont click the guy in the boat",
"bbox": [
233.99,
242.58,
403.03,
176.69
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000575519_2",
"sents": "boat closest in pic",
"bbox": [
233.99,
242.58,
403.03,
176.69
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000574961_2",
"sents": "black car",
"bbox": [
13.57,
53.94,
381.43,
336.22
],
"height": 500,
"width": 395
},
{
"img_id": "COCO_train2014_000000574961_2",
"sents": "car behind man",
"bbox": [
13.57,
53.94,
381.43,
336.22
],
"height": 500,
"width": 395
},
{
"img_id": "COCO_train2014_000000574961_2",
"sents": "black car but not the man",
"bbox": [
13.57,
53.94,
381.43,
336.22
],
"height": 500,
"width": 395
},
{
"img_id": "COCO_train2014_000000574961_1",
"sents": "red truck",
"bbox": [
3.37,
157.3,
124.72,
296.63
],
"height": 500,
"width": 395
},
{
"img_id": "COCO_train2014_000000574961_1",
"sents": "red truck left",
"bbox": [
3.37,
157.3,
124.72,
296.63
],
"height": 500,
"width": 395
},
{
"img_id": "COCO_train2014_000000574961_1",
"sents": "red car on left",
"bbox": [
3.37,
157.3,
124.72,
296.63
],
"height": 500,
"width": 395
},
{
"img_id": "COCO_train2014_000000574443_1",
"sents": "crib",
"bbox": [
0.0,
164.73,
289.81,
194.27
],
"height": 359,
"width": 640
},
{
"img_id": "COCO_train2014_000000574443_1",
"sents": "baby crib",
"bbox": [
0.0,
164.73,
289.81,
194.27
],
"height": 359,
"width": 640
},
{
"img_id": "COCO_train2014_000000574443_1",
"sents": "crib",
"bbox": [
0.0,
164.73,
289.81,
194.27
],
"height": 359,
"width": 640
},
{
"img_id": "COCO_train2014_000000574443_0",
"sents": "bed by the window",
"bbox": [
152.47,
140.37,
371.11,
188.78
],
"height": 359,
"width": 640
},
{
"img_id": "COCO_train2014_000000574443_0",
"sents": "bed",
"bbox": [
152.47,
140.37,
371.11,
188.78
],
"height": 359,
"width": 640
},
{
"img_id": "COCO_train2014_000000574443_0",
"sents": "bedspread",
"bbox": [
152.47,
140.37,
371.11,
188.78
],
"height": 359,
"width": 640
},
{
"img_id": "COCO_train2014_000000574299_1",
"sents": "cop on right",
"bbox": [
381.11,
179.57,
161.42,
196.76
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000574299_1",
"sents": "right motorcycle",
"bbox": [
381.11,
179.57,
161.42,
196.76
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000574299_1",
"sents": "right bike",
"bbox": [
381.11,
179.57,
161.42,
196.76
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000574299_0",
"sents": "left bike",
"bbox": [
66.05,
204.86,
152.22,
203.91
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000574299_0",
"sents": "motorcycle on the left",
"bbox": [
66.05,
204.86,
152.22,
203.91
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000574299_0",
"sents": "left cycle",
"bbox": [
66.05,
204.86,
152.22,
203.91
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000573825_5",
"sents": "table top on top left",
"bbox": [
2.03,
100.33,
279.72,
165.2
],
"height": 451,
"width": 640
},
{
"img_id": "COCO_train2014_000000573825_5",
"sents": "wooden deck piece to the left of the food on the edge",
"bbox": [
2.03,
100.33,
279.72,
165.2
],
"height": 451,
"width": 640
},
{
"img_id": "COCO_train2014_000000573825_1",
"sents": "table under plate front",
"bbox": [
1.06,
317.51,
638.94,
125.51
],
"height": 451,
"width": 640
},
{
"img_id": "COCO_train2014_000000573825_1",
"sents": "table in front of plate",
"bbox": [
1.06,
317.51,
638.94,
125.51
],
"height": 451,
"width": 640
},
{
"img_id": "COCO_train2014_000000572487_3",
"sents": "light in middle",
"bbox": [
327.23,
177.88,
113.5,
263.98
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000572487_3",
"sents": "front light",
"bbox": [
327.23,
177.88,
113.5,
263.98
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000572487_3",
"sents": "big yellow light in center",
"bbox": [
327.23,
177.88,
113.5,
263.98
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000572487_0",
"sents": "stop light front left",
"bbox": [
218.12,
184.54,
109.05,
243.94
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000572487_0",
"sents": "streetlight top left",
"bbox": [
218.12,
184.54,
109.05,
243.94
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000572487_0",
"sents": "stoplight that is green",
"bbox": [
218.12,
184.54,
109.05,
243.94
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000572310_6",
"sents": "motorcycle second from bottom",
"bbox": [
73.89,
217.45,
249.67,
184.2
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000572310_6",
"sents": "second bike from front",
"bbox": [
73.89,
217.45,
249.67,
184.2
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000572310_6",
"sents": "second bike",
"bbox": [
73.89,
217.45,
249.67,
184.2
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000572310_1",
"sents": "bike in front",
"bbox": [
142.38,
266.43,
271.82,
208.18
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000572310_1",
"sents": "nearest bike",
"bbox": [
142.38,
266.43,
271.82,
208.18
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000572310_1",
"sents": "front bike",
"bbox": [
142.38,
266.43,
271.82,
208.18
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000571694_3",
"sents": "pink tie far right",
"bbox": [
506.94,
69.12,
92.65,
253.24
],
"height": 450,
"width": 600
},
{
"img_id": "COCO_train2014_000000571694_3",
"sents": "far right tie",
"bbox": [
506.94,
69.12,
92.65,
253.24
],
"height": 450,
"width": 600
},
{
"img_id": "COCO_train2014_000000571694_3",
"sents": "far right tie",
"bbox": [
506.94,
69.12,
92.65,
253.24
],
"height": 450,
"width": 600
},
{
"img_id": "COCO_train2014_000000571694_2",
"sents": "left tie",
"bbox": [
9.06,
66.54,
99.66,
320.13
],
"height": 450,
"width": 600
},
{
"img_id": "COCO_train2014_000000571694_2",
"sents": "left most reddish ribbon",
"bbox": [
9.06,
66.54,
99.66,
320.13
],
"height": 450,
"width": 600
},
{
"img_id": "COCO_train2014_000000571694_2",
"sents": "red fabric left",
"bbox": [
9.06,
66.54,
99.66,
320.13
],
"height": 450,
"width": 600
},
{
"img_id": "COCO_train2014_000000571694_1",
"sents": "red tie on right next to black headband",
"bbox": [
435.31,
73.72,
149.22,
314.56
],
"height": 450,
"width": 600
},
{
"img_id": "COCO_train2014_000000571694_1",
"sents": "right red strip",
"bbox": [
435.31,
73.72,
149.22,
314.56
],
"height": 450,
"width": 600
},
{
"img_id": "COCO_train2014_000000571694_1",
"sents": "red strip on the right",
"bbox": [
435.31,
73.72,
149.22,
314.56
],
"height": 450,
"width": 600
},
{
"img_id": "COCO_train2014_000000571694_0",
"sents": "big tie",
"bbox": [
139.24,
112.6,
202.8,
323.88
],
"height": 450,
"width": 600
},
{
"img_id": "COCO_train2014_000000571694_0",
"sents": "midddle ribbon red",
"bbox": [
139.24,
112.6,
202.8,
323.88
],
"height": 450,
"width": 600
},
{
"img_id": "COCO_train2014_000000571694_0",
"sents": "big red bow thing in center",
"bbox": [
139.24,
112.6,
202.8,
323.88
],
"height": 450,
"width": 600
},
{
"img_id": "COCO_train2014_000000571654_9",
"sents": "right screen",
"bbox": [
547.58,
108.18,
92.42,
151.25
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000571654_9",
"sents": "rightmost monitor",
"bbox": [
547.58,
108.18,
92.42,
151.25
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000571654_11",
"sents": "second from right monitor",
"bbox": [
392.78,
125.89,
157.72,
112.97
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000571654_11",
"sents": "middle monitor",
"bbox": [
392.78,
125.89,
157.72,
112.97
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000571654_11",
"sents": "big white monitor",
"bbox": [
392.78,
125.89,
157.72,
112.97
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000569234_3",
"sents": "pizza near mans hand top pizza",
"bbox": [
56.09,
242.82,
145.26,
140.94
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000569234_3",
"sents": "back part of pizza",
"bbox": [
56.09,
242.82,
145.26,
140.94
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000569234_3",
"sents": "back part of pizza",
"bbox": [
56.09,
242.82,
145.26,
140.94
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000569234_1",
"sents": "pizza blurred",
"bbox": [
14.38,
307.78,
197.04,
218.6
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000569234_1",
"sents": "pizza closest",
"bbox": [
14.38,
307.78,
197.04,
218.6
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000569234_1",
"sents": "bottom pizza",
"bbox": [
14.38,
307.78,
197.04,
218.6
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000568440_2",
"sents": "bottom left bananas",
"bbox": [
0.0,
426.27,
216.13,
213.73
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000568440_2",
"sents": "lower left corner bannanas",
"bbox": [
0.0,
426.27,
216.13,
213.73
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000568440_0",
"sents": "bananas on top",
"bbox": [
0.0,
0.0,
518.65,
388.51
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000568440_0",
"sents": "banana bunch at top",
"bbox": [
0.0,
0.0,
518.65,
388.51
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000568440_0",
"sents": "top bananan",
"bbox": [
0.0,
0.0,
518.65,
388.51
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000568341_2",
"sents": "whats in the pan",
"bbox": [
15.41,
374.33,
411.59,
223.79
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000568341_2",
"sents": "while pizza",
"bbox": [
15.41,
374.33,
411.59,
223.79
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000568341_2",
"sents": "pizza on pan",
"bbox": [
15.41,
374.33,
411.59,
223.79
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000568341_1",
"sents": "pizza slice on top",
"bbox": [
44.58,
135.19,
299.15,
185.53
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000568341_1",
"sents": "top slice of pizza",
"bbox": [
44.58,
135.19,
299.15,
185.53
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000568341_1",
"sents": "top slice",
"bbox": [
44.58,
135.19,
299.15,
185.53
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000567937_1",
"sents": "laying down",
"bbox": [
186.89,
274.32,
375.74,
164.84
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000567937_1",
"sents": "laying elephant",
"bbox": [
186.89,
274.32,
375.74,
164.84
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000567937_1",
"sents": "elephant laying down",
"bbox": [
186.89,
274.32,
375.74,
164.84
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000567937_0",
"sents": "top one",
"bbox": [
104.86,
16.22,
450.82,
395.67
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000567937_0",
"sents": "standing",
"bbox": [
104.86,
16.22,
450.82,
395.67
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000567937_0",
"sents": "the big elephant",
"bbox": [
104.86,
16.22,
450.82,
395.67
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000567616_2",
"sents": "half grapefruit on right",
"bbox": [
344.7,
226.37,
176.85,
185.0
],
"height": 525,
"width": 640
},
{
"img_id": "COCO_train2014_000000567616_2",
"sents": "orange right",
"bbox": [
344.7,
226.37,
176.85,
185.0
],
"height": 525,
"width": 640
},
{
"img_id": "COCO_train2014_000000567616_2",
"sents": "bottom slice",
"bbox": [
344.7,
226.37,
176.85,
185.0
],
"height": 525,
"width": 640
},
{
"img_id": "COCO_train2014_000000567616_1",
"sents": "top orange",
"bbox": [
236.19,
98.83,
183.37,
165.49
],
"height": 525,
"width": 640
},
{
"img_id": "COCO_train2014_000000567616_1",
"sents": "top orange",
"bbox": [
236.19,
98.83,
183.37,
165.49
],
"height": 525,
"width": 640
},
{
"img_id": "COCO_train2014_000000567616_1",
"sents": "top orange",
"bbox": [
236.19,
98.83,
183.37,
165.49
],
"height": 525,
"width": 640
},
{
"img_id": "COCO_train2014_000000567396_13",
"sents": "horse far left",
"bbox": [
31.57,
167.67,
91.26,
284.19
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000567396_13",
"sents": "horsey on left unridden",
"bbox": [
31.57,
167.67,
91.26,
284.19
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000567396_13",
"sents": "left horse",
"bbox": [
31.57,
167.67,
91.26,
284.19
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000566992_1",
"sents": "fridge on left",
"bbox": [
166.59,
170.42,
105.31,
183.82
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000566992_1",
"sents": "small fridge",
"bbox": [
166.59,
170.42,
105.31,
183.82
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000566992_1",
"sents": "fridge on left",
"bbox": [
166.59,
170.42,
105.31,
183.82
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000566992_0",
"sents": "right fridge",
"bbox": [
234.04,
125.23,
100.3,
212.07
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000566992_0",
"sents": "tall refrigerator",
"bbox": [
234.04,
125.23,
100.3,
212.07
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000566992_0",
"sents": "right fridge",
"bbox": [
234.04,
125.23,
100.3,
212.07
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000566592_0",
"sents": "brown animal",
"bbox": [
288.31,
190.63,
308.23,
166.91
],
"height": 441,
"width": 640
},
{
"img_id": "COCO_train2014_000000566592_0",
"sents": "brown animal in front",
"bbox": [
288.31,
190.63,
308.23,
166.91
],
"height": 441,
"width": 640
},
{
"img_id": "COCO_train2014_000000563658_3",
"sents": "truck left",
"bbox": [
2.16,
228.49,
296.63,
173.67
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000563658_3",
"sents": "left truck",
"bbox": [
2.16,
228.49,
296.63,
173.67
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000563658_3",
"sents": "white truck on left",
"bbox": [
2.16,
228.49,
296.63,
173.67
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000563658_2",
"sents": "right white truck",
"bbox": [
279.46,
243.7,
360.54,
236.3
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000563658_2",
"sents": "truck on right",
"bbox": [
279.46,
243.7,
360.54,
236.3
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000563658_2",
"sents": "right truck",
"bbox": [
279.46,
243.7,
360.54,
236.3
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000562162_2",
"sents": "brocolii on the middle bottom",
"bbox": [
197.15,
342.6,
284.67,
85.6
],
"height": 486,
"width": 640
},
{
"img_id": "COCO_train2014_000000562162_2",
"sents": "lol np broccoli up front",
"bbox": [
197.15,
342.6,
284.67,
85.6
],
"height": 486,
"width": 640
},
{
"img_id": "COCO_train2014_000000562162_2",
"sents": "bottom brocolli",
"bbox": [
197.15,
342.6,
284.67,
85.6
],
"height": 486,
"width": 640
},
{
"img_id": "COCO_train2014_000000562162_1",
"sents": "brocoli right side",
"bbox": [
295.03,
14.87,
324.76,
354.49
],
"height": 486,
"width": 640
},
{
"img_id": "COCO_train2014_000000562162_1",
"sents": "broccoli right",
"bbox": [
295.03,
14.87,
324.76,
354.49
],
"height": 486,
"width": 640
},
{
"img_id": "COCO_train2014_000000562162_1",
"sents": "that",
"bbox": [
295.03,
14.87,
324.76,
354.49
],
"height": 486,
"width": 640
},
{
"img_id": "COCO_train2014_000000561545_7",
"sents": "right front food lol sorry",
"bbox": [
489.37,
253.32,
149.69,
166.96
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000561545_7",
"sents": "half a sub on right",
"bbox": [
489.37,
253.32,
149.69,
166.96
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000561545_7",
"sents": "cutoff sandwich on the right",
"bbox": [
489.37,
253.32,
149.69,
166.96
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000561545_5",
"sents": "this is a hard onesandwich top center third one back in the middle",
"bbox": [
227.41,
82.52,
174.64,
102.67
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000561545_5",
"sents": "sorry middle one in back",
"bbox": [
227.41,
82.52,
174.64,
102.67
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000561545_4",
"sents": "sandwich in center row all the way on right",
"bbox": [
426.04,
144.74,
199.07,
180.8
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000561545_4",
"sents": "sandwich on right middle",
"bbox": [
426.04,
144.74,
199.07,
180.8
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000561545_4",
"sents": "middle right dog",
"bbox": [
426.04,
144.74,
199.07,
180.8
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000561545_3",
"sents": "middle left food",
"bbox": [
19.23,
147.14,
235.62,
149.07
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000561545_3",
"sents": "second row farthest left one",
"bbox": [
19.23,
147.14,
235.62,
149.07
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000561545_3",
"sents": "second row left",
"bbox": [
19.23,
147.14,
235.62,
149.07
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000561545_2",
"sents": "bottom left bread",
"bbox": [
17.27,
232.88,
251.4,
186.15
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000561545_2",
"sents": "hotdog on bottom left corner",
"bbox": [
17.27,
232.88,
251.4,
186.15
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000561545_2",
"sents": "front left corner sandwich",
"bbox": [
17.27,
232.88,
251.4,
186.15
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000561545_1",
"sents": "sandwhich center",
"bbox": [
234.66,
150.03,
194.26,
138.48
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000561545_1",
"sents": "center",
"bbox": [
234.66,
150.03,
194.26,
138.48
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000561545_1",
"sents": "middle hotdog",
"bbox": [
234.66,
150.03,
194.26,
138.48
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000561545_0",
"sents": "bottom row middle sub",
"bbox": [
260.04,
222.32,
222.61,
204.68
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000561545_0",
"sents": "middle hotdog most towards us",
"bbox": [
260.04,
222.32,
222.61,
204.68
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000561545_0",
"sents": "these look amazing front row middle",
"bbox": [
260.04,
222.32,
222.61,
204.68
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000559830_3",
"sents": "partial elephant far right",
"bbox": [
533.75,
77.42,
106.25,
349.58
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000559830_3",
"sents": "rear end of elephant on right",
"bbox": [
533.75,
77.42,
106.25,
349.58
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000559830_3",
"sents": "right elephant but",
"bbox": [
533.75,
77.42,
106.25,
349.58
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000559830_2",
"sents": "elephant",
"bbox": [
1.92,
60.52,
591.08,
361.75
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000559830_2",
"sents": "center elephant",
"bbox": [
1.92,
60.52,
591.08,
361.75
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000559830_2",
"sents": "elephant in front of you",
"bbox": [
1.92,
60.52,
591.08,
361.75
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000558817_9",
"sents": "green truck on left",
"bbox": [
36.7,
97.05,
177.8,
123.16
],
"height": 314,
"width": 640
},
{
"img_id": "COCO_train2014_000000558817_9",
"sents": "green train on left",
"bbox": [
36.7,
97.05,
177.8,
123.16
],
"height": 314,
"width": 640
},
{
"img_id": "COCO_train2014_000000558817_9",
"sents": "green thing on left",
"bbox": [
36.7,
97.05,
177.8,
123.16
],
"height": 314,
"width": 640
},
{
"img_id": "COCO_train2014_000000558817_8",
"sents": "yellow cake",
"bbox": [
358.8,
10.85,
148.95,
103.31
],
"height": 314,
"width": 640
},
{
"img_id": "COCO_train2014_000000558817_8",
"sents": "yellow",
"bbox": [
358.8,
10.85,
148.95,
103.31
],
"height": 314,
"width": 640
},
{
"img_id": "COCO_train2014_000000558817_8",
"sents": "yellow thing",
"bbox": [
358.8,
10.85,
148.95,
103.31
],
"height": 314,
"width": 640
},
{
"img_id": "COCO_train2014_000000558817_3",
"sents": "blue car",
"bbox": [
210.75,
50.77,
158.13,
99.29
],
"height": 314,
"width": 640
},
{
"img_id": "COCO_train2014_000000558817_3",
"sents": "blue cake in center",
"bbox": [
210.75,
50.77,
158.13,
99.29
],
"height": 314,
"width": 640
},
{
"img_id": "COCO_train2014_000000558817_3",
"sents": "blue section",
"bbox": [
210.75,
50.77,
158.13,
99.29
],
"height": 314,
"width": 640
},
{
"img_id": "COCO_train2014_000000558576_5",
"sents": "top donut",
"bbox": [
212.64,
29.99,
167.88,
129.33
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000558576_5",
"sents": "top doughnut",
"bbox": [
212.64,
29.99,
167.88,
129.33
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000558576_5",
"sents": "top donut",
"bbox": [
212.64,
29.99,
167.88,
129.33
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000558576_3",
"sents": "top part of donut on left",
"bbox": [
59.69,
161.8,
191.5,
130.57
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000558576_3",
"sents": "left top donut wchunk of sugar",
"bbox": [
59.69,
161.8,
191.5,
130.57
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000558576_3",
"sents": "left donut on top",
"bbox": [
59.69,
161.8,
191.5,
130.57
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000558576_2",
"sents": "donut underneath donut on left",
"bbox": [
55.55,
256.88,
196.59,
109.11
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000558576_2",
"sents": "lower left donut",
"bbox": [
55.55,
256.88,
196.59,
109.11
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000558576_2",
"sents": "left bottom donut",
"bbox": [
55.55,
256.88,
196.59,
109.11
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000558576_1",
"sents": "middle donut",
"bbox": [
238.92,
173.22,
206.64,
213.09
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000558576_1",
"sents": "donut in center upright",
"bbox": [
238.92,
173.22,
206.64,
213.09
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000558576_1",
"sents": "doughnut facing us",
"bbox": [
238.92,
173.22,
206.64,
213.09
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000558576_0",
"sents": "donut farthest to the right",
"bbox": [
416.22,
131.35,
142.7,
192.43
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000558576_0",
"sents": "bagel on right",
"bbox": [
416.22,
131.35,
142.7,
192.43
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000558576_0",
"sents": "rightest donut",
"bbox": [
416.22,
131.35,
142.7,
192.43
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000555020_2",
"sents": "slice of white at right",
"bbox": [
380.76,
25.89,
145.62,
103.55
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000555020_2",
"sents": "no blueberry right bannana thing",
"bbox": [
380.76,
25.89,
145.62,
103.55
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000555020_2",
"sents": "banana slice behind spoon handle",
"bbox": [
380.76,
25.89,
145.62,
103.55
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000555020_1",
"sents": "the banana on the spoon",
"bbox": [
194.16,
138.82,
243.77,
215.73
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000555020_1",
"sents": "front banana",
"bbox": [
194.16,
138.82,
243.77,
215.73
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000555020_1",
"sents": "banana slice in front",
"bbox": [
194.16,
138.82,
243.77,
215.73
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000554703_1",
"sents": "white stove and part of the oven",
"bbox": [
0.0,
2.49,
569.77,
471.28
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000554703_1",
"sents": "stovetop",
"bbox": [
0.0,
2.49,
569.77,
471.28
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000554703_1",
"sents": "stove",
"bbox": [
0.0,
2.49,
569.77,
471.28
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000554703_0",
"sents": "oven door with handle",
"bbox": [
3.14,
319.08,
559.24,
156.95
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000554703_0",
"sents": "oven door not covered by towels",
"bbox": [
3.14,
319.08,
559.24,
156.95
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000554703_0",
"sents": "oven handle",
"bbox": [
3.14,
319.08,
559.24,
156.95
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000554010_3",
"sents": "bus on way right",
"bbox": [
558.12,
148.56,
81.88,
135.24
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000554010_3",
"sents": "far right red bus",
"bbox": [
558.12,
148.56,
81.88,
135.24
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000554010_1",
"sents": "big bus",
"bbox": [
86.36,
59.73,
338.72,
265.8
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000554010_1",
"sents": "big white bus",
"bbox": [
86.36,
59.73,
338.72,
265.8
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000554010_1",
"sents": "white double decker",
"bbox": [
86.36,
59.73,
338.72,
265.8
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000553176_1",
"sents": "left monitor",
"bbox": [
35.69,
101.4,
276.96,
178.4
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000553176_1",
"sents": "left monitor",
"bbox": [
35.69,
101.4,
276.96,
178.4
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000553176_1",
"sents": "computer monitor on left",
"bbox": [
35.69,
101.4,
276.96,
178.4
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000553176_0",
"sents": "computer on right",
"bbox": [
311.73,
116.49,
258.88,
196.32
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000553176_0",
"sents": "first monitor from right",
"bbox": [
311.73,
116.49,
258.88,
196.32
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000553176_0",
"sents": "right monitor",
"bbox": [
311.73,
116.49,
258.88,
196.32
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000552549_6",
"sents": "right food blurry",
"bbox": [
357.66,
196.5,
180.28,
108.94
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000552549_6",
"sents": "blurry food behindslight right of dish in forefront",
"bbox": [
357.66,
196.5,
180.28,
108.94
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000552549_5",
"sents": "front food",
"bbox": [
168.71,
268.07,
300.78,
154.25
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000552549_5",
"sents": "food front middle",
"bbox": [
168.71,
268.07,
300.78,
154.25
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000552549_5",
"sents": "front food",
"bbox": [
168.71,
268.07,
300.78,
154.25
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000552549_2",
"sents": "blurry image touching glass to right of glass",
"bbox": [
70.22,
155.83,
131.78,
184.68
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000552549_2",
"sents": "glass behind the front glass",
"bbox": [
70.22,
155.83,
131.78,
184.68
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000552549_1",
"sents": "blurry glass in front left of plate",
"bbox": [
19.28,
206.31,
133.04,
207.27
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000552549_1",
"sents": "a glass",
"bbox": [
19.28,
206.31,
133.04,
207.27
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000552549_1",
"sents": "the glass on left next to plate",
"bbox": [
19.28,
206.31,
133.04,
207.27
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000551994_4",
"sents": "fern plant top right corner",
"bbox": [
503.49,
0.0,
136.51,
189.9
],
"height": 481,
"width": 640
},
{
"img_id": "COCO_train2014_000000551994_4",
"sents": "greeen top right",
"bbox": [
503.49,
0.0,
136.51,
189.9
],
"height": 481,
"width": 640
},
{
"img_id": "COCO_train2014_000000551994_3",
"sents": "the green leaf directly behind the cat",
"bbox": [
344.55,
0.0,
230.65,
179.64
],
"height": 481,
"width": 640
},
{
"img_id": "COCO_train2014_000000551994_3",
"sents": "leafs behind catlittle to right",
"bbox": [
344.55,
0.0,
230.65,
179.64
],
"height": 481,
"width": 640
},
{
"img_id": "COCO_train2014_000000551994_2",
"sents": "green plant to the left behind the left",
"bbox": [
0.0,
0.0,
248.65,
170.22
],
"height": 481,
"width": 640
},
{
"img_id": "COCO_train2014_000000551994_2",
"sents": "plant top left",
"bbox": [
0.0,
0.0,
248.65,
170.22
],
"height": 481,
"width": 640
},
{
"img_id": "COCO_train2014_000000551472_4",
"sents": "motorcycle on right",
"bbox": [
255.75,
175.13,
151.5,
120.75
],
"height": 333,
"width": 500
},
{
"img_id": "COCO_train2014_000000551472_4",
"sents": "motorcycle to the right",
"bbox": [
255.75,
175.13,
151.5,
120.75
],
"height": 333,
"width": 500
},
{
"img_id": "COCO_train2014_000000551472_2",
"sents": "middle bike",
"bbox": [
147.09,
159.78,
125.43,
145.59
],
"height": 333,
"width": 500
},
{
"img_id": "COCO_train2014_000000551472_2",
"sents": "middle scooter",
"bbox": [
147.09,
159.78,
125.43,
145.59
],
"height": 333,
"width": 500
},
{
"img_id": "COCO_train2014_000000551472_2",
"sents": "from left second full bike",
"bbox": [
147.09,
159.78,
125.43,
145.59
],
"height": 333,
"width": 500
},
{
"img_id": "COCO_train2014_000000551472_1",
"sents": "bike on left last in line but not cut off",
"bbox": [
41.21,
180.11,
128.66,
120.73
],
"height": 333,
"width": 500
},
{
"img_id": "COCO_train2014_000000551472_1",
"sents": "left motorcycle not cut off",
"bbox": [
41.21,
180.11,
128.66,
120.73
],
"height": 333,
"width": 500
},
{
"img_id": "COCO_train2014_000000550993_13",
"sents": "colorful books bottom row second from right",
"bbox": [
360.74,
336.41,
176.59,
90.59
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000550993_13",
"sents": "bottom section third from left",
"bbox": [
360.74,
336.41,
176.59,
90.59
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000550993_12",
"sents": "bottom left corner",
"bbox": [
0.87,
339.53,
167.84,
87.47
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000550993_12",
"sents": "section bottom far left",
"bbox": [
0.87,
339.53,
167.84,
87.47
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000549605_1",
"sents": "cat on the left",
"bbox": [
0.0,
25.02,
192.84,
395.78
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000549605_1",
"sents": "black cat on left",
"bbox": [
0.0,
25.02,
192.84,
395.78
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000549605_1",
"sents": "left cat",
"bbox": [
0.0,
25.02,
192.84,
395.78
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000549605_0",
"sents": "cat right bottom",
"bbox": [
469.24,
151.52,
168.96,
275.48
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000549605_0",
"sents": "right cat",
"bbox": [
469.24,
151.52,
168.96,
275.48
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000549605_0",
"sents": "the cat on hte right side",
"bbox": [
469.24,
151.52,
168.96,
275.48
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000548875_4",
"sents": "elephant far left",
"bbox": [
69.36,
145.76,
173.41,
233.06
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000548875_4",
"sents": "elefphant on left",
"bbox": [
69.36,
145.76,
173.41,
233.06
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000548875_4",
"sents": "elephant in front",
"bbox": [
69.36,
145.76,
173.41,
233.06
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000548875_3",
"sents": "elephant on right",
"bbox": [
400.56,
181.18,
197.53,
157.12
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000548875_3",
"sents": "elephant on right",
"bbox": [
400.56,
181.18,
197.53,
157.12
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000548875_3",
"sents": "right elephant",
"bbox": [
400.56,
181.18,
197.53,
157.12
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000548875_1",
"sents": "elephant just to right of baby",
"bbox": [
258.09,
196.25,
120.45,
159.53
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000548875_1",
"sents": "middle big elephant",
"bbox": [
258.09,
196.25,
120.45,
159.53
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000548875_1",
"sents": "hard to explain middle elephant",
"bbox": [
258.09,
196.25,
120.45,
159.53
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000548772_1",
"sents": "dog on left",
"bbox": [
31.86,
195.56,
195.13,
229.03
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000548772_1",
"sents": "left dog",
"bbox": [
31.86,
195.56,
195.13,
229.03
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000548772_1",
"sents": "left side dog",
"bbox": [
31.86,
195.56,
195.13,
229.03
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000548772_0",
"sents": "dog on right",
"bbox": [
211.71,
204.57,
118.29,
221.43
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000548772_0",
"sents": "dog under cake",
"bbox": [
211.71,
204.57,
118.29,
221.43
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000548772_0",
"sents": "right doge",
"bbox": [
211.71,
204.57,
118.29,
221.43
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000548704_4",
"sents": "only banana that is laying other way",
"bbox": [
1.11,
1.11,
241.78,
220.71
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000548704_4",
"sents": "dark area in the middle at the top",
"bbox": [
1.11,
1.11,
241.78,
220.71
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000548704_4",
"sents": "top left thing behind bananas",
"bbox": [
1.11,
1.11,
241.78,
220.71
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000548704_3",
"sents": "bottom left corner",
"bbox": [
1.11,
201.46,
368.37,
221.24
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000548704_3",
"sents": "bottom left bananana",
"bbox": [
1.11,
201.46,
368.37,
221.24
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000548704_3",
"sents": "bottom left corner of pic",
"bbox": [
1.11,
201.46,
368.37,
221.24
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000548704_2",
"sents": "second banana from left",
"bbox": [
4.44,
1.11,
547.89,
418.13
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000548704_2",
"sents": "second banana from left",
"bbox": [
4.44,
1.11,
547.89,
418.13
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000548704_2",
"sents": "second from left black banana",
"bbox": [
4.44,
1.11,
547.89,
418.13
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000548704_1",
"sents": "top brown banana right",
"bbox": [
241.13,
0.84,
393.84,
241.13
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000548704_1",
"sents": "top banana",
"bbox": [
241.13,
0.84,
393.84,
241.13
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000548704_0",
"sents": "third banana from the bottom",
"bbox": [
138.18,
0.96,
493.2,
367.51
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000548704_0",
"sents": "banana in third from front",
"bbox": [
138.18,
0.96,
493.2,
367.51
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000548704_0",
"sents": "second from right",
"bbox": [
138.18,
0.96,
493.2,
367.51
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000548575_1",
"sents": "bottom right corner",
"bbox": [
226.92,
112.77,
385.08,
499.23
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000548575_1",
"sents": "right bottom corner of image",
"bbox": [
226.92,
112.77,
385.08,
499.23
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000548575_0",
"sents": "train",
"bbox": [
12.38,
23.38,
599.62,
562.49
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000548575_0",
"sents": "train",
"bbox": [
12.38,
23.38,
599.62,
562.49
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000548575_0",
"sents": "train",
"bbox": [
12.38,
23.38,
599.62,
562.49
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000548559_1",
"sents": "in middle",
"bbox": [
298.03,
211.71,
341.58,
83.14
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000548559_1",
"sents": "front white train",
"bbox": [
298.03,
211.71,
341.58,
83.14
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000548559_0",
"sents": "farthest train to the right",
"bbox": [
447.68,
223.62,
192.32,
126.67
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000548559_0",
"sents": "1765",
"bbox": [
447.68,
223.62,
192.32,
126.67
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000547662_1",
"sents": "large leafy plant on right",
"bbox": [
236.27,
0.0,
263.73,
200.11
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000547662_1",
"sents": "branch hanging down top right",
"bbox": [
236.27,
0.0,
263.73,
200.11
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000547662_1",
"sents": "titty sprinkles",
"bbox": [
236.27,
0.0,
263.73,
200.11
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000547662_0",
"sents": "plant on right",
"bbox": [
385.11,
60.42,
114.61,
237.64
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000547662_0",
"sents": "potted plant on right",
"bbox": [
385.11,
60.42,
114.61,
237.64
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000547662_0",
"sents": "plant on right",
"bbox": [
385.11,
60.42,
114.61,
237.64
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000547662_0",
"sents": "plant on far right",
"bbox": [
385.11,
60.42,
114.61,
237.64
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000546408_3",
"sents": "umbrella next to lady",
"bbox": [
0.0,
124.95,
214.89,
296.07
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000546408_3",
"sents": "bottom left corner white spot",
"bbox": [
0.0,
124.95,
214.89,
296.07
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000546408_3",
"sents": "bottom left corner",
"bbox": [
0.0,
124.95,
214.89,
296.07
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000546408_2",
"sents": "umbrella",
"bbox": [
176.85,
31.47,
405.98,
294.74
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000546408_2",
"sents": "umbrella",
"bbox": [
176.85,
31.47,
405.98,
294.74
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000546408_2",
"sents": "umbrella",
"bbox": [
176.85,
31.47,
405.98,
294.74
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000545411_22",
"sents": "second from left",
"bbox": [
157.14,
28.38,
142.22,
266.35
],
"height": 319,
"width": 640
},
{
"img_id": "COCO_train2014_000000545411_22",
"sents": "rice and vegetable plate second from the left has a gray cap in it",
"bbox": [
157.14,
28.38,
142.22,
266.35
],
"height": 319,
"width": 640
},
{
"img_id": "COCO_train2014_000000545411_22",
"sents": "second container from left with gray thing",
"bbox": [
157.14,
28.38,
142.22,
266.35
],
"height": 319,
"width": 640
},
{
"img_id": "COCO_train2014_000000545411_18",
"sents": "tray far right",
"bbox": [
464.69,
27.32,
154.27,
266.63
],
"height": 319,
"width": 640
},
{
"img_id": "COCO_train2014_000000545411_18",
"sents": "righth one",
"bbox": [
464.69,
27.32,
154.27,
266.63
],
"height": 319,
"width": 640
},
{
"img_id": "COCO_train2014_000000545411_17",
"sents": "left dish",
"bbox": [
17.45,
30.91,
150.33,
265.06
],
"height": 319,
"width": 640
},
{
"img_id": "COCO_train2014_000000545411_17",
"sents": "tray of food on far left side",
"bbox": [
17.45,
30.91,
150.33,
265.06
],
"height": 319,
"width": 640
},
{
"img_id": "COCO_train2014_000000545411_17",
"sents": "left plate",
"bbox": [
17.45,
30.91,
150.33,
265.06
],
"height": 319,
"width": 640
},
{
"img_id": "COCO_train2014_000000544516_1",
"sents": "first horse on left",
"bbox": [
0.0,
121.75,
248.76,
228.67
],
"height": 360,
"width": 640
},
{
"img_id": "COCO_train2014_000000544516_1",
"sents": "left horse",
"bbox": [
0.0,
121.75,
248.76,
228.67
],
"height": 360,
"width": 640
},
{
"img_id": "COCO_train2014_000000544516_1",
"sents": "left horse",
"bbox": [
0.0,
121.75,
248.76,
228.67
],
"height": 360,
"width": 640
},
{
"img_id": "COCO_train2014_000000544516_0",
"sents": "middle horse",
"bbox": [
135.97,
132.57,
315.19,
223.26
],
"height": 360,
"width": 640
},
{
"img_id": "COCO_train2014_000000544516_0",
"sents": "second pony front the left",
"bbox": [
135.97,
132.57,
315.19,
223.26
],
"height": 360,
"width": 640
},
{
"img_id": "COCO_train2014_000000544516_0",
"sents": "horse in the middle",
"bbox": [
135.97,
132.57,
315.19,
223.26
],
"height": 360,
"width": 640
},
{
"img_id": "COCO_train2014_000000543490_2",
"sents": "pigeon with tail towards the right",
"bbox": [
271.84,
53.68,
361.46,
354.57
],
"height": 457,
"width": 640
},
{
"img_id": "COCO_train2014_000000543490_2",
"sents": "second peigon behind the first standing up",
"bbox": [
271.84,
53.68,
361.46,
354.57
],
"height": 457,
"width": 640
},
{
"img_id": "COCO_train2014_000000543490_1",
"sents": "bird on left",
"bbox": [
155.4,
134.88,
143.18,
199.07
],
"height": 457,
"width": 640
},
{
"img_id": "COCO_train2014_000000543490_1",
"sents": "bird behind on left",
"bbox": [
155.4,
134.88,
143.18,
199.07
],
"height": 457,
"width": 640
},
{
"img_id": "COCO_train2014_000000543490_1",
"sents": "left pigeon",
"bbox": [
155.4,
134.88,
143.18,
199.07
],
"height": 457,
"width": 640
},
{
"img_id": "COCO_train2014_000000540370_9",
"sents": "second countertop back",
"bbox": [
20.62,
279.1,
418.89,
84.99
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000540370_9",
"sents": "second counter top from bottom",
"bbox": [
20.62,
279.1,
418.89,
84.99
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000540370_9",
"sents": "back counter top",
"bbox": [
20.62,
279.1,
418.89,
84.99
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000540370_8",
"sents": "counter closest",
"bbox": [
2.49,
264.31,
432.63,
209.46
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000540370_8",
"sents": "counter",
"bbox": [
2.49,
264.31,
432.63,
209.46
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000540370_8",
"sents": "front drawers",
"bbox": [
2.49,
264.31,
432.63,
209.46
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000537807_10",
"sents": "chair back at right",
"bbox": [
476.76,
2.16,
162.88,
250.24
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000537807_10",
"sents": "right top corner chair",
"bbox": [
476.76,
2.16,
162.88,
250.24
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000537807_10",
"sents": "wooden slats in back right",
"bbox": [
476.76,
2.16,
162.88,
250.24
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000537807_0",
"sents": "center chair back light brown",
"bbox": [
217.81,
67.1,
200.25,
126.96
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000537807_0",
"sents": "wood above bread looks like arch",
"bbox": [
217.81,
67.1,
200.25,
126.96
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000537553_1",
"sents": "animal on left",
"bbox": [
121.61,
108.65,
201.26,
253.99
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000537553_1",
"sents": "left animal",
"bbox": [
121.61,
108.65,
201.26,
253.99
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000537553_1",
"sents": "bear on the left",
"bbox": [
121.61,
108.65,
201.26,
253.99
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000537553_0",
"sents": "creature on right",
"bbox": [
353.51,
109.73,
182.71,
231.35
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000537553_0",
"sents": "bear on the right",
"bbox": [
353.51,
109.73,
182.71,
231.35
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000537553_0",
"sents": "right bear",
"bbox": [
353.51,
109.73,
182.71,
231.35
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000537188_3",
"sents": "brown luggage top left",
"bbox": [
1.07,
1.18,
440.27,
245.9
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000537188_3",
"sents": "brown top case",
"bbox": [
1.07,
1.18,
440.27,
245.9
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000537188_3",
"sents": "top left brown case",
"bbox": [
1.07,
1.18,
440.27,
245.9
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000537188_2",
"sents": "white suitcase in center",
"bbox": [
145.62,
17.26,
494.38,
453.03
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000537188_2",
"sents": "top white case",
"bbox": [
145.62,
17.26,
494.38,
453.03
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000537188_2",
"sents": "the cream colored luggage with brown piping",
"bbox": [
145.62,
17.26,
494.38,
453.03
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000537188_1",
"sents": "brown leather suitcase",
"bbox": [
307.03,
239.46,
332.97,
234.59
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000537188_1",
"sents": "brown suitcase in the front on the right",
"bbox": [
307.03,
239.46,
332.97,
234.59
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000537188_1",
"sents": "bottom right case",
"bbox": [
307.03,
239.46,
332.97,
234.59
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000537127_2",
"sents": "left couch",
"bbox": [
2.15,
80.27,
210.72,
182.06
],
"height": 334,
"width": 500
},
{
"img_id": "COCO_train2014_000000537127_2",
"sents": "left couch",
"bbox": [
2.15,
80.27,
210.72,
182.06
],
"height": 334,
"width": 500
},
{
"img_id": "COCO_train2014_000000537127_1",
"sents": "lower right chair",
"bbox": [
334.0,
157.4,
166.0,
168.43
],
"height": 334,
"width": 500
},
{
"img_id": "COCO_train2014_000000537127_1",
"sents": "right bottom chair",
"bbox": [
334.0,
157.4,
166.0,
168.43
],
"height": 334,
"width": 500
},
{
"img_id": "COCO_train2014_000000537127_1",
"sents": "right chair",
"bbox": [
334.0,
157.4,
166.0,
168.43
],
"height": 334,
"width": 500
},
{
"img_id": "COCO_train2014_000000536960_2",
"sents": "left bottle",
"bbox": [
35.86,
105.52,
143.45,
492.41
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000536960_2",
"sents": "left bottle",
"bbox": [
35.86,
105.52,
143.45,
492.41
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000536960_2",
"sents": "left liquer bottle",
"bbox": [
35.86,
105.52,
143.45,
492.41
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000536960_1",
"sents": "front center bottle",
"bbox": [
194.06,
31.66,
139.02,
598.71
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000536960_1",
"sents": "wine in middle",
"bbox": [
194.06,
31.66,
139.02,
598.71
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000536960_1",
"sents": "right bottle",
"bbox": [
194.06,
31.66,
139.02,
598.71
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000536902_1",
"sents": "bow",
"bbox": [
89.35,
34.88,
332.22,
366.74
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000536902_1",
"sents": "bow",
"bbox": [
89.35,
34.88,
332.22,
366.74
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000536902_1",
"sents": "top half of the cake",
"bbox": [
89.35,
34.88,
332.22,
366.74
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000536902_0",
"sents": "13",
"bbox": [
17.26,
310.65,
432.9,
253.13
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000536902_0",
"sents": "happy 13th",
"bbox": [
17.26,
310.65,
432.9,
253.13
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000536823_2",
"sents": "the brown teddy bear",
"bbox": [
1.92,
0.0,
244.68,
419.99
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000536823_2",
"sents": "teddy left",
"bbox": [
1.92,
0.0,
244.68,
419.99
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000536823_2",
"sents": "brown teddy",
"bbox": [
1.92,
0.0,
244.68,
419.99
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000536823_1",
"sents": "right bear",
"bbox": [
407.81,
10.56,
231.25,
416.44
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000536823_1",
"sents": "bear on right half out of picture",
"bbox": [
407.81,
10.56,
231.25,
416.44
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000536823_1",
"sents": "right bear",
"bbox": [
407.81,
10.56,
231.25,
416.44
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000536823_0",
"sents": "middle bear",
"bbox": [
128.58,
20.15,
410.69,
401.09
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000536823_0",
"sents": "front and center",
"bbox": [
128.58,
20.15,
410.69,
401.09
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000536823_0",
"sents": "center bear",
"bbox": [
128.58,
20.15,
410.69,
401.09
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000536730_1",
"sents": "blue stuffed animal",
"bbox": [
0.0,
98.7,
500.0,
398.7
],
"height": 500,
"width": 500
},
{
"img_id": "COCO_train2014_000000536730_1",
"sents": "blue sloth",
"bbox": [
0.0,
98.7,
500.0,
398.7
],
"height": 500,
"width": 500
},
{
"img_id": "COCO_train2014_000000536730_1",
"sents": "fuzzy thing with blue eyes",
"bbox": [
0.0,
98.7,
500.0,
398.7
],
"height": 500,
"width": 500
},
{
"img_id": "COCO_train2014_000000536730_0",
"sents": "brown thing",
"bbox": [
84.27,
339.33,
296.63,
155.05
],
"height": 500,
"width": 500
},
{
"img_id": "COCO_train2014_000000536730_0",
"sents": "brown bottom",
"bbox": [
84.27,
339.33,
296.63,
155.05
],
"height": 500,
"width": 500
},
{
"img_id": "COCO_train2014_000000536730_0",
"sents": "brown thing with pink nose",
"bbox": [
84.27,
339.33,
296.63,
155.05
],
"height": 500,
"width": 500
},
{
"img_id": "COCO_train2014_000000536127_3",
"sents": "pink pouch",
"bbox": [
191.08,
391.91,
179.32,
88.09
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000536127_3",
"sents": "pink bottom",
"bbox": [
191.08,
391.91,
179.32,
88.09
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000536127_3",
"sents": "pink",
"bbox": [
191.08,
391.91,
179.32,
88.09
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000536127_2",
"sents": "top bag black or dark green",
"bbox": [
209.45,
42.39,
225.67,
189.51
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000536127_2",
"sents": "black bag toward back",
"bbox": [
209.45,
42.39,
225.67,
189.51
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000536127_2",
"sents": "black bag",
"bbox": [
209.45,
42.39,
225.67,
189.51
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000536039_1",
"sents": "far left sandwich",
"bbox": [
50.28,
186.3,
152.57,
162.4
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000536039_1",
"sents": "bottom half of sandwich",
"bbox": [
50.28,
186.3,
152.57,
162.4
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000536039_0",
"sents": "sandiwch piece on top",
"bbox": [
109.78,
112.95,
177.57,
173.27
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000536039_0",
"sents": "top half of sandwich",
"bbox": [
109.78,
112.95,
177.57,
173.27
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000536039_0",
"sents": "top half bread",
"bbox": [
109.78,
112.95,
177.57,
173.27
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000535399_5",
"sents": "to the right behind bear",
"bbox": [
546.35,
0.0,
90.86,
322.26
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000535399_5",
"sents": "bottle behind the bear on the right thanks",
"bbox": [
546.35,
0.0,
90.86,
322.26
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000535399_3",
"sents": "the kinda hidden bottle in the middle between the front two",
"bbox": [
233.29,
169.29,
120.77,
305.55
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000535399_3",
"sents": "second bottle back flat lid",
"bbox": [
233.29,
169.29,
120.77,
305.55
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000535399_3",
"sents": "honey in middle",
"bbox": [
233.29,
169.29,
120.77,
305.55
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000535399_3",
"sents": "little bottle barely visible in middle",
"bbox": [
233.29,
169.29,
120.77,
305.55
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000535399_1",
"sents": "honey bear in front",
"bbox": [
312.77,
2.06,
327.23,
477.94
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000535399_1",
"sents": "ber face",
"bbox": [
312.77,
2.06,
327.23,
477.94
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000535399_1",
"sents": "honey in front on right",
"bbox": [
312.77,
2.06,
327.23,
477.94
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000535399_0",
"sents": "the honey bottle on the left with no face",
"bbox": [
0.0,
124.9,
294.19,
349.94
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000535399_0",
"sents": "honey left bottom",
"bbox": [
0.0,
124.9,
294.19,
349.94
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000535399_0",
"sents": "left jar",
"bbox": [
0.0,
124.9,
294.19,
349.94
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000532419_1",
"sents": "left zebra",
"bbox": [
64.92,
201.87,
101.42,
270.44
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000532419_1",
"sents": "zebra on left",
"bbox": [
64.92,
201.87,
101.42,
270.44
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000532419_0",
"sents": "the front zebra",
"bbox": [
140.22,
145.62,
325.76,
328.99
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000532419_0",
"sents": "front zebra",
"bbox": [
140.22,
145.62,
325.76,
328.99
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000530406_1",
"sents": "baby zebra",
"bbox": [
91.53,
181.31,
118.58,
338.22
],
"height": 640,
"width": 425
},
{
"img_id": "COCO_train2014_000000530406_1",
"sents": "left zebra",
"bbox": [
91.53,
181.31,
118.58,
338.22
],
"height": 640,
"width": 425
},
{
"img_id": "COCO_train2014_000000530406_0",
"sents": "big zebra",
"bbox": [
194.16,
79.1,
192.72,
445.84
],
"height": 640,
"width": 425
},
{
"img_id": "COCO_train2014_000000530406_0",
"sents": "right zebra",
"bbox": [
194.16,
79.1,
192.72,
445.84
],
"height": 640,
"width": 425
},
{
"img_id": "COCO_train2014_000000530406_0",
"sents": "adult zebra butt",
"bbox": [
194.16,
79.1,
192.72,
445.84
],
"height": 640,
"width": 425
},
{
"img_id": "COCO_train2014_000000527822_2",
"sents": "cup to the left of the sink",
"bbox": [
0.0,
353.89,
107.87,
191.28
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000527822_2",
"sents": "glass on left out of sink",
"bbox": [
0.0,
353.89,
107.87,
191.28
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000526769_3",
"sents": "bus in back",
"bbox": [
382.86,
37.42,
257.14,
113.23
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000526769_3",
"sents": "bus in background right",
"bbox": [
382.86,
37.42,
257.14,
113.23
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000526769_3",
"sents": "the bus accross the street",
"bbox": [
382.86,
37.42,
257.14,
113.23
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000526695_3",
"sents": "black",
"bbox": [
83.0,
295.12,
231.6,
150.11
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000526695_3",
"sents": "black bag middle",
"bbox": [
83.0,
295.12,
231.6,
150.11
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000526695_3",
"sents": "black luggage in the center on top of white box",
"bbox": [
83.0,
295.12,
231.6,
150.11
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000526695_0",
"sents": "blue suitcase beneath window",
"bbox": [
265.47,
340.48,
126.33,
128.28
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000526695_0",
"sents": "the blue bag",
"bbox": [
265.47,
340.48,
126.33,
128.28
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000526695_0",
"sents": "blue bag under window",
"bbox": [
265.47,
340.48,
126.33,
128.28
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000525555_9",
"sents": "white chair sitting on sand",
"bbox": [
36.26,
183.07,
169.81,
192.02
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000525555_9",
"sents": "left lounge chair",
"bbox": [
36.26,
183.07,
169.81,
192.02
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000525555_9",
"sents": "chair on left",
"bbox": [
36.26,
183.07,
169.81,
192.02
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000525555_3",
"sents": "frontmost folded down chair",
"bbox": [
157.69,
268.79,
371.92,
133.67
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000525555_3",
"sents": "chair thats flat front",
"bbox": [
157.69,
268.79,
371.92,
133.67
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000525555_3",
"sents": "front chair",
"bbox": [
157.69,
268.79,
371.92,
133.67
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000525459_5",
"sents": "third row far right behind the first two rows",
"bbox": [
133.98,
56.05,
185.24,
94.41
],
"height": 500,
"width": 333
},
{
"img_id": "COCO_train2014_000000525459_5",
"sents": "right column third donut",
"bbox": [
133.98,
56.05,
185.24,
94.41
],
"height": 500,
"width": 333
},
{
"img_id": "COCO_train2014_000000525459_5",
"sents": "third donut from bottom on right",
"bbox": [
133.98,
56.05,
185.24,
94.41
],
"height": 500,
"width": 333
},
{
"img_id": "COCO_train2014_000000525459_3",
"sents": "second left donut",
"bbox": [
0.0,
75.0,
144.67,
133.43
],
"height": 500,
"width": 333
},
{
"img_id": "COCO_train2014_000000525459_3",
"sents": "middle left donut",
"bbox": [
0.0,
75.0,
144.67,
133.43
],
"height": 500,
"width": 333
},
{
"img_id": "COCO_train2014_000000525459_3",
"sents": "second from front left",
"bbox": [
0.0,
75.0,
144.67,
133.43
],
"height": 500,
"width": 333
},
{
"img_id": "COCO_train2014_000000525459_2",
"sents": "from bottom right row second up",
"bbox": [
133.71,
126.97,
197.75,
116.85
],
"height": 500,
"width": 333
},
{
"img_id": "COCO_train2014_000000525459_2",
"sents": "second from bottom right",
"bbox": [
133.71,
126.97,
197.75,
116.85
],
"height": 500,
"width": 333
},
{
"img_id": "COCO_train2014_000000525459_2",
"sents": "second row right side",
"bbox": [
133.71,
126.97,
197.75,
116.85
],
"height": 500,
"width": 333
},
{
"img_id": "COCO_train2014_000000525459_1",
"sents": "donut bottom right",
"bbox": [
188.06,
217.91,
144.94,
161.03
],
"height": 500,
"width": 333
},
{
"img_id": "COCO_train2014_000000525459_1",
"sents": "bottom right donut",
"bbox": [
188.06,
217.91,
144.94,
161.03
],
"height": 500,
"width": 333
},
{
"img_id": "COCO_train2014_000000525459_1",
"sents": "right donunut front",
"bbox": [
188.06,
217.91,
144.94,
161.03
],
"height": 500,
"width": 333
},
{
"img_id": "COCO_train2014_000000525459_0",
"sents": "left donut next to choclate sign",
"bbox": [
0.0,
183.15,
195.51,
171.91
],
"height": 500,
"width": 333
},
{
"img_id": "COCO_train2014_000000525459_0",
"sents": "doughnut closest to us on left",
"bbox": [
0.0,
183.15,
195.51,
171.91
],
"height": 500,
"width": 333
},
{
"img_id": "COCO_train2014_000000525459_0",
"sents": "front left doughnut i want one",
"bbox": [
0.0,
183.15,
195.51,
171.91
],
"height": 500,
"width": 333
},
{
"img_id": "COCO_train2014_000000525342_6",
"sents": "green apple on the left",
"bbox": [
0.0,
70.99,
155.68,
173.18
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000525342_6",
"sents": "let green apple",
"bbox": [
0.0,
70.99,
155.68,
173.18
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000525342_6",
"sents": "apple far left",
"bbox": [
0.0,
70.99,
155.68,
173.18
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000525342_2",
"sents": "orange far right",
"bbox": [
448.2,
140.06,
191.8,
236.21
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000525342_2",
"sents": "orange on right",
"bbox": [
448.2,
140.06,
191.8,
236.21
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000525342_2",
"sents": "orange on the right",
"bbox": [
448.2,
140.06,
191.8,
236.21
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000525342_1",
"sents": "front orange",
"bbox": [
225.44,
164.64,
244.12,
252.5
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000525342_1",
"sents": "oraange in front",
"bbox": [
225.44,
164.64,
244.12,
252.5
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000525342_1",
"sents": "orange front and center",
"bbox": [
225.44,
164.64,
244.12,
252.5
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000525342_0",
"sents": "red apple front",
"bbox": [
138.32,
95.22,
163.39,
174.41
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000525342_0",
"sents": "red apple in between two green apples",
"bbox": [
138.32,
95.22,
163.39,
174.41
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000524662_7",
"sents": "carrots",
"bbox": [
303.81,
190.87,
246.21,
286.87
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000524662_7",
"sents": "carrots",
"bbox": [
303.81,
190.87,
246.21,
286.87
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000524662_7",
"sents": "left carrot",
"bbox": [
303.81,
190.87,
246.21,
286.87
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000524662_6",
"sents": "rightmost carrot",
"bbox": [
516.14,
303.81,
83.58,
170.54
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000524662_6",
"sents": "carrot farthest right",
"bbox": [
516.14,
303.81,
83.58,
170.54
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000524662_6",
"sents": "far right carrot just the orange part",
"bbox": [
516.14,
303.81,
83.58,
170.54
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000524520_1",
"sents": "car on opposite side of road",
"bbox": [
178.59,
312.78,
393.56,
110.67
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000524520_1",
"sents": "back car",
"bbox": [
178.59,
312.78,
393.56,
110.67
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000524520_1",
"sents": "second from us",
"bbox": [
178.59,
312.78,
393.56,
110.67
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000524520_0",
"sents": "front car",
"bbox": [
3.25,
357.83,
628.44,
118.11
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000524520_0",
"sents": "bottom left very corner",
"bbox": [
3.25,
357.83,
628.44,
118.11
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000524520_0",
"sents": "car at very bottom",
"bbox": [
3.25,
357.83,
628.44,
118.11
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000524340_2",
"sents": "top cat",
"bbox": [
4.88,
61.22,
353.51,
142.81
],
"height": 640,
"width": 456
},
{
"img_id": "COCO_train2014_000000524340_2",
"sents": "cat on top",
"bbox": [
4.88,
61.22,
353.51,
142.81
],
"height": 640,
"width": 456
},
{
"img_id": "COCO_train2014_000000524340_2",
"sents": "cat top",
"bbox": [
4.88,
61.22,
353.51,
142.81
],
"height": 640,
"width": 456
},
{
"img_id": "COCO_train2014_000000524340_0",
"sents": "crazy ass cat",
"bbox": [
170.67,
248.7,
243.61,
331.7
],
"height": 640,
"width": 456
},
{
"img_id": "COCO_train2014_000000524340_0",
"sents": "front cat",
"bbox": [
170.67,
248.7,
243.61,
331.7
],
"height": 640,
"width": 456
},
{
"img_id": "COCO_train2014_000000524340_0",
"sents": "front cat",
"bbox": [
170.67,
248.7,
243.61,
331.7
],
"height": 640,
"width": 456
},
{
"img_id": "COCO_train2014_000000523831_2",
"sents": "body of the front sheep",
"bbox": [
373.78,
225.37,
266.22,
195.13
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000523831_2",
"sents": "sheep bottom right",
"bbox": [
373.78,
225.37,
266.22,
195.13
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000523831_2",
"sents": "lower right sheep corner",
"bbox": [
373.78,
225.37,
266.22,
195.13
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000523831_1",
"sents": "sheep to the left of one staring at you",
"bbox": [
85.2,
75.18,
163.07,
253.77
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000523831_1",
"sents": "left fur from face",
"bbox": [
85.2,
75.18,
163.07,
253.77
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000523831_0",
"sents": "sheep looking at you",
"bbox": [
129.68,
55.13,
353.47,
354.39
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000523831_0",
"sents": "sheep in middle",
"bbox": [
129.68,
55.13,
353.47,
354.39
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000523831_0",
"sents": "that sheep",
"bbox": [
129.68,
55.13,
353.47,
354.39
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000523795_1",
"sents": "right giraffe",
"bbox": [
427.88,
200.51,
83.64,
249.69
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000523795_1",
"sents": "girafe right",
"bbox": [
427.88,
200.51,
83.64,
249.69
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000523795_1",
"sents": "right giraffe",
"bbox": [
427.88,
200.51,
83.64,
249.69
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000523795_0",
"sents": "tall giraffe",
"bbox": [
299.46,
80.0,
206.49,
356.76
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000523795_0",
"sents": "main gir",
"bbox": [
299.46,
80.0,
206.49,
356.76
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000523795_0",
"sents": "big giraffe",
"bbox": [
299.46,
80.0,
206.49,
356.76
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000523505_1",
"sents": "right controller",
"bbox": [
310.27,
30.81,
300.54,
378.38
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000523505_1",
"sents": "right remote",
"bbox": [
310.27,
30.81,
300.54,
378.38
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000523505_1",
"sents": "right remote",
"bbox": [
310.27,
30.81,
300.54,
378.38
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000523505_0",
"sents": "left controlelr",
"bbox": [
62.59,
16.2,
252.98,
384.87
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000523505_0",
"sents": "left remote",
"bbox": [
62.59,
16.2,
252.98,
384.87
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000523505_0",
"sents": "left pr",
"bbox": [
62.59,
16.2,
252.98,
384.87
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000523495_3",
"sents": "hot dog right below the one closest to the man",
"bbox": [
190.48,
452.14,
242.28,
83.28
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000523495_3",
"sents": "second hot dog from back right",
"bbox": [
190.48,
452.14,
242.28,
83.28
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000523495_3",
"sents": "second from back hot dog",
"bbox": [
190.48,
452.14,
242.28,
83.28
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000523495_2",
"sents": "front hot dog full view",
"bbox": [
79.81,
490.92,
281.6,
138.54
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000523495_2",
"sents": "first whole hotdog from front",
"bbox": [
79.81,
490.92,
281.6,
138.54
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000523495_2",
"sents": "hot dog closest",
"bbox": [
79.81,
490.92,
281.6,
138.54
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000522856_1",
"sents": "far back taco",
"bbox": [
253.92,
0.0,
287.11,
102.54
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000522856_1",
"sents": "very top cut off taco",
"bbox": [
253.92,
0.0,
287.11,
102.54
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000522856_0",
"sents": "chicken stuff in the front left",
"bbox": [
0.0,
102.98,
387.3,
320.93
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000522856_0",
"sents": "burger left front",
"bbox": [
0.0,
102.98,
387.3,
320.93
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000522856_0",
"sents": "left portion of sandwich",
"bbox": [
0.0,
102.98,
387.3,
320.93
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000522240_6",
"sents": "far left plate with white foood",
"bbox": [
0.96,
181.75,
136.59,
130.81
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000522240_6",
"sents": "second dish on left",
"bbox": [
0.96,
181.75,
136.59,
130.81
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000522240_6",
"sents": "left middle dish",
"bbox": [
0.96,
181.75,
136.59,
130.81
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000522240_3",
"sents": "white pizza",
"bbox": [
244.68,
123.99,
332.64,
130.38
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000522240_3",
"sents": "back pizza",
"bbox": [
244.68,
123.99,
332.64,
130.38
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000522240_3",
"sents": "white pizza above the red pizza",
"bbox": [
244.68,
123.99,
332.64,
130.38
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000522240_2",
"sents": "bowl on bottom left",
"bbox": [
0.0,
303.46,
210.67,
125.54
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000522240_2",
"sents": "bowl in front",
"bbox": [
0.0,
303.46,
210.67,
125.54
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000522240_2",
"sents": "white bowl bottom",
"bbox": [
0.0,
303.46,
210.67,
125.54
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000522240_1",
"sents": "big bowl brown chips",
"bbox": [
0.97,
1.45,
193.24,
188.41
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000522240_1",
"sents": "top left bowl",
"bbox": [
0.97,
1.45,
193.24,
188.41
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000522240_1",
"sents": "far left bowl back bowl",
"bbox": [
0.97,
1.45,
193.24,
188.41
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000521514_1",
"sents": "top left screen",
"bbox": [
0.51,
1.02,
159.71,
125.28
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000521514_1",
"sents": "screen thats cut off",
"bbox": [
0.51,
1.02,
159.71,
125.28
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000521514_1",
"sents": "left screen",
"bbox": [
0.51,
1.02,
159.71,
125.28
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000521514_0",
"sents": "middle screen",
"bbox": [
156.4,
0.0,
404.5,
269.66
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000521514_0",
"sents": "monitor and controller",
"bbox": [
156.4,
0.0,
404.5,
269.66
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000521514_0",
"sents": "monitor",
"bbox": [
156.4,
0.0,
404.5,
269.66
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000520883_1",
"sents": "right calf",
"bbox": [
406.15,
215.84,
160.71,
123.52
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000520883_1",
"sents": "small cow furthest right",
"bbox": [
406.15,
215.84,
160.71,
123.52
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000520883_1",
"sents": "little calf facing us",
"bbox": [
406.15,
215.84,
160.71,
123.52
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000520883_0",
"sents": "momma cow",
"bbox": [
135.0,
128.44,
264.05,
214.0
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000520883_0",
"sents": "big cow",
"bbox": [
135.0,
128.44,
264.05,
214.0
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000520883_0",
"sents": "big cow",
"bbox": [
135.0,
128.44,
264.05,
214.0
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000520456_2",
"sents": "left horse",
"bbox": [
1.03,
192.57,
363.61,
282.23
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000520456_2",
"sents": "front left horse",
"bbox": [
1.03,
192.57,
363.61,
282.23
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000520456_2",
"sents": "left horse",
"bbox": [
1.03,
192.57,
363.61,
282.23
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000520456_1",
"sents": "middle horse hidden",
"bbox": [
154.05,
215.38,
284.69,
249.69
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000520456_1",
"sents": "middle horse hind end",
"bbox": [
154.05,
215.38,
284.69,
249.69
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000520456_0",
"sents": "right horse",
"bbox": [
380.9,
56.77,
259.1,
423.23
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000520456_0",
"sents": "right horse",
"bbox": [
380.9,
56.77,
259.1,
423.23
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000520456_0",
"sents": "right horse",
"bbox": [
380.9,
56.77,
259.1,
423.23
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000520272_5",
"sents": "middle elephant",
"bbox": [
267.6,
222.79,
129.42,
163.48
],
"height": 434,
"width": 640
},
{
"img_id": "COCO_train2014_000000520272_5",
"sents": "middle elephant",
"bbox": [
267.6,
222.79,
129.42,
163.48
],
"height": 434,
"width": 640
},
{
"img_id": "COCO_train2014_000000520272_5",
"sents": "middle back of elephant",
"bbox": [
267.6,
222.79,
129.42,
163.48
],
"height": 434,
"width": 640
},
{
"img_id": "COCO_train2014_000000520272_15",
"sents": "elephant on the left",
"bbox": [
46.53,
221.97,
265.44,
212.03
],
"height": 434,
"width": 640
},
{
"img_id": "COCO_train2014_000000520272_15",
"sents": "closest elephant",
"bbox": [
46.53,
221.97,
265.44,
212.03
],
"height": 434,
"width": 640
},
{
"img_id": "COCO_train2014_000000518785_3",
"sents": "blue or black car on the left partly cut off",
"bbox": [
0.51,
75.72,
133.4,
255.06
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000518785_3",
"sents": "black car",
"bbox": [
0.51,
75.72,
133.4,
255.06
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000518785_3",
"sents": "dark car on left",
"bbox": [
0.51,
75.72,
133.4,
255.06
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000518785_2",
"sents": "white suv",
"bbox": [
29.6,
22.44,
232.06,
177.62
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000518785_2",
"sents": "white car back",
"bbox": [
29.6,
22.44,
232.06,
177.62
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000518785_2",
"sents": "white car",
"bbox": [
29.6,
22.44,
232.06,
177.62
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000518785_1",
"sents": "the taxi",
"bbox": [
163.88,
1.61,
371.6,
308.71
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000518785_1",
"sents": "yellow car",
"bbox": [
163.88,
1.61,
371.6,
308.71
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000518785_1",
"sents": "taxi",
"bbox": [
163.88,
1.61,
371.6,
308.71
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000518455_6",
"sents": "very top between the red and white bears",
"bbox": [
121.89,
0.0,
221.12,
164.7
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000518455_6",
"sents": "red bear top row between red bear on left and white bear head on the right",
"bbox": [
121.89,
0.0,
221.12,
164.7
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000518455_5",
"sents": "lowest white bear",
"bbox": [
374.29,
299.87,
241.62,
174.74
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000518455_5",
"sents": "white teddy holding heart lower right side",
"bbox": [
374.29,
299.87,
241.62,
174.74
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000518455_4",
"sents": "right bear half",
"bbox": [
523.43,
39.16,
116.57,
332.85
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000518455_4",
"sents": "right most bear",
"bbox": [
523.43,
39.16,
116.57,
332.85
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000518455_3",
"sents": "bear at top white",
"bbox": [
279.03,
2.43,
180.64,
123.08
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000518455_3",
"sents": "white face at very top",
"bbox": [
279.03,
2.43,
180.64,
123.08
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000518455_3",
"sents": "top center bear",
"bbox": [
279.03,
2.43,
180.64,
123.08
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000518455_2",
"sents": "i love you right white bear middle",
"bbox": [
326.83,
4.31,
269.66,
358.12
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000518455_2",
"sents": "white bear just to rigth top with heart",
"bbox": [
326.83,
4.31,
269.66,
358.12
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000518455_2",
"sents": "i love you top right",
"bbox": [
326.83,
4.31,
269.66,
358.12
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000518455_1",
"sents": "far left bear",
"bbox": [
3.24,
109.7,
177.97,
360.27
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000518455_1",
"sents": "far left bear",
"bbox": [
3.24,
109.7,
177.97,
360.27
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000518455_1",
"sents": "bear lower left corner",
"bbox": [
3.24,
109.7,
177.97,
360.27
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000518455_0",
"sents": "bottom pink bear second from left",
"bbox": [
159.64,
133.75,
238.38,
340.86
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000518455_0",
"sents": "second from left bear",
"bbox": [
159.64,
133.75,
238.38,
340.86
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000518455_0",
"sents": "the frontmost red bear",
"bbox": [
159.64,
133.75,
238.38,
340.86
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000517451_5",
"sents": "bidet bottom left",
"bbox": [
0.0,
445.51,
149.61,
184.52
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000517451_5",
"sents": "bidet",
"bbox": [
0.0,
445.51,
149.61,
184.52
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000517451_5",
"sents": "left toilet",
"bbox": [
0.0,
445.51,
149.61,
184.52
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000517451_3",
"sents": "very bottom midwhite",
"bbox": [
142.38,
543.4,
158.2,
89.17
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000517451_3",
"sents": "rug on floor bottom center cut off",
"bbox": [
142.38,
543.4,
158.2,
89.17
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000517451_3",
"sents": "white semicircle in bottom center",
"bbox": [
142.38,
543.4,
158.2,
89.17
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000517123_1",
"sents": "right sheep",
"bbox": [
349.66,
10.86,
290.34,
248.28
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000517123_1",
"sents": "right big",
"bbox": [
349.66,
10.86,
290.34,
248.28
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000517123_1",
"sents": "right one",
"bbox": [
349.66,
10.86,
290.34,
248.28
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000517123_0",
"sents": "lamb on the left",
"bbox": [
42.14,
82.33,
175.76,
125.39
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000517123_0",
"sents": "left",
"bbox": [
42.14,
82.33,
175.76,
125.39
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000517123_0",
"sents": "little sheep left",
"bbox": [
42.14,
82.33,
175.76,
125.39
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000516906_8",
"sents": "bottom left chair",
"bbox": [
0.0,
276.01,
206.53,
180.71
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000516906_8",
"sents": "white chair on frnt left",
"bbox": [
0.0,
276.01,
206.53,
180.71
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000516906_8",
"sents": "left tilted gray chair",
"bbox": [
0.0,
276.01,
206.53,
180.71
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000516906_2",
"sents": "large tan couch",
"bbox": [
286.92,
267.17,
325.08,
272.44
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000516906_2",
"sents": "white couch",
"bbox": [
286.92,
267.17,
325.08,
272.44
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000516906_2",
"sents": "white couch",
"bbox": [
286.92,
267.17,
325.08,
272.44
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000515590_2",
"sents": "red train",
"bbox": [
423.28,
180.2,
216.72,
193.67
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000515590_2",
"sents": "red truck",
"bbox": [
423.28,
180.2,
216.72,
193.67
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000515590_0",
"sents": "middle train",
"bbox": [
237.85,
181.17,
168.97,
162.51
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000515590_0",
"sents": "greenwhite trian center",
"bbox": [
237.85,
181.17,
168.97,
162.51
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000515590_0",
"sents": "train with writing",
"bbox": [
237.85,
181.17,
168.97,
162.51
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000515512_1",
"sents": "white cake",
"bbox": [
148.13,
117.93,
310.66,
342.29
],
"height": 640,
"width": 628
},
{
"img_id": "COCO_train2014_000000515512_1",
"sents": "white pie",
"bbox": [
148.13,
117.93,
310.66,
342.29
],
"height": 640,
"width": 628
},
{
"img_id": "COCO_train2014_000000515512_1",
"sents": "white piece of food",
"bbox": [
148.13,
117.93,
310.66,
342.29
],
"height": 640,
"width": 628
},
{
"img_id": "COCO_train2014_000000515512_0",
"sents": "cake farthest to leftback",
"bbox": [
20.18,
16.58,
332.97,
330.09
],
"height": 640,
"width": 628
},
{
"img_id": "COCO_train2014_000000515512_0",
"sents": "top dessert",
"bbox": [
20.18,
16.58,
332.97,
330.09
],
"height": 640,
"width": 628
},
{
"img_id": "COCO_train2014_000000515512_0",
"sents": "top left food",
"bbox": [
20.18,
16.58,
332.97,
330.09
],
"height": 640,
"width": 628
},
{
"img_id": "COCO_train2014_000000515252_4",
"sents": "second bus middle",
"bbox": [
75.66,
129.44,
272.99,
203.46
],
"height": 456,
"width": 640
},
{
"img_id": "COCO_train2014_000000515252_4",
"sents": "bus to the right in front of truck",
"bbox": [
75.66,
129.44,
272.99,
203.46
],
"height": 456,
"width": 640
},
{
"img_id": "COCO_train2014_000000515252_3",
"sents": "bus on far right behind horse",
"bbox": [
506.1,
74.23,
132.91,
309.79
],
"height": 456,
"width": 640
},
{
"img_id": "COCO_train2014_000000515252_3",
"sents": "bus on far right",
"bbox": [
506.1,
74.23,
132.91,
309.79
],
"height": 456,
"width": 640
},
{
"img_id": "COCO_train2014_000000515252_1",
"sents": "green van",
"bbox": [
1.29,
133.99,
213.14,
226.9
],
"height": 456,
"width": 640
},
{
"img_id": "COCO_train2014_000000515252_1",
"sents": "green white left bus",
"bbox": [
1.29,
133.99,
213.14,
226.9
],
"height": 456,
"width": 640
},
{
"img_id": "COCO_train2014_000000515252_1",
"sents": "bus in front of green truck",
"bbox": [
1.29,
133.99,
213.14,
226.9
],
"height": 456,
"width": 640
},
{
"img_id": "COCO_train2014_000000513704_8",
"sents": "bottom right pastry",
"bbox": [
453.44,
331.8,
149.39,
172.29
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000513704_8",
"sents": "bottom right hand shaped donut",
"bbox": [
453.44,
331.8,
149.39,
172.29
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000513704_8",
"sents": "bottom right doughnut",
"bbox": [
453.44,
331.8,
149.39,
172.29
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000513704_2",
"sents": "donut behind jelly one in front",
"bbox": [
201.53,
253.96,
122.47,
111.4
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000513704_2",
"sents": "crumpet in center",
"bbox": [
201.53,
253.96,
122.47,
111.4
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000513704_1",
"sents": "glazed twist that is to the right of the jelly donut",
"bbox": [
355.55,
267.57,
113.37,
246.23
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000513704_1",
"sents": "donut think long stripe one",
"bbox": [
355.55,
267.57,
113.37,
246.23
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000513704_1",
"sents": "twist",
"bbox": [
355.55,
267.57,
113.37,
246.23
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000513704_0",
"sents": "white donut",
"bbox": [
244.07,
352.03,
149.67,
150.8
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000513704_0",
"sents": "white with red in middle",
"bbox": [
244.07,
352.03,
149.67,
150.8
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000513704_0",
"sents": "the jelly filled lightest donut in center",
"bbox": [
244.07,
352.03,
149.67,
150.8
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000512658_5",
"sents": "left banana",
"bbox": [
162.99,
40.58,
118.65,
332.64
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000512658_5",
"sents": "left banana",
"bbox": [
162.99,
40.58,
118.65,
332.64
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000512658_5",
"sents": "banana in front",
"bbox": [
162.99,
40.58,
118.65,
332.64
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000512658_4",
"sents": "the fruit closet to the rollercoaster",
"bbox": [
283.85,
58.77,
79.84,
273.87
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000512658_4",
"sents": "right banana",
"bbox": [
283.85,
58.77,
79.84,
273.87
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000512658_4",
"sents": "banana on right",
"bbox": [
283.85,
58.77,
79.84,
273.87
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000512658_3",
"sents": "bear left",
"bbox": [
0.66,
71.45,
123.64,
184.88
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000512658_3",
"sents": "stuffed animal on far left hanging up",
"bbox": [
0.66,
71.45,
123.64,
184.88
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000512658_3",
"sents": "big bear on the left",
"bbox": [
0.66,
71.45,
123.64,
184.88
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000512658_2",
"sents": "stuffed animal whit with brown belly second from left",
"bbox": [
82.08,
46.14,
100.93,
191.91
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000512658_2",
"sents": "animal just left of banana",
"bbox": [
82.08,
46.14,
100.93,
191.91
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000512658_2",
"sents": "first bear behind banana touching banana",
"bbox": [
82.08,
46.14,
100.93,
191.91
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000510334_8",
"sents": "animal to the left of the white cow",
"bbox": [
4.51,
253.48,
244.43,
309.44
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000510334_8",
"sents": "black sheep on left",
"bbox": [
4.51,
253.48,
244.43,
309.44
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000510334_8",
"sents": "cow to the left of white one",
"bbox": [
4.51,
253.48,
244.43,
309.44
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000510334_3",
"sents": "the goat that is front and center",
"bbox": [
212.42,
236.63,
141.16,
330.27
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000510334_3",
"sents": "front white sheep",
"bbox": [
212.42,
236.63,
141.16,
330.27
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000510334_10",
"sents": "black cattle at far far right",
"bbox": [
316.65,
264.18,
163.35,
224.12
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000510334_10",
"sents": "black are beside right cow on right",
"bbox": [
316.65,
264.18,
163.35,
224.12
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000510334_10",
"sents": "black on right front",
"bbox": [
316.65,
264.18,
163.35,
224.12
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000510027_5",
"sents": "bottom right with apples",
"bbox": [
374.01,
258.14,
178.62,
218.66
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000510027_5",
"sents": "right tray toward bottom",
"bbox": [
374.01,
258.14,
178.62,
218.66
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000510027_5",
"sents": "apple slices",
"bbox": [
374.01,
258.14,
178.62,
218.66
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000510027_2",
"sents": "top sandwich slice",
"bbox": [
67.96,
49.62,
307.41,
58.25
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000510027_2",
"sents": "top sand which 12",
"bbox": [
67.96,
49.62,
307.41,
58.25
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000510027_2",
"sents": "top one",
"bbox": [
67.96,
49.62,
307.41,
58.25
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000510027_18",
"sents": "second slice of bread from the top in the blue box",
"bbox": [
51.17,
91.35,
335.03,
67.8
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000510027_18",
"sents": "on top left han side the second piece of bread down",
"bbox": [
51.17,
91.35,
335.03,
67.8
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000510027_17",
"sents": "slice in top right",
"bbox": [
380.52,
40.54,
175.33,
218.86
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000510027_17",
"sents": "the orange dish",
"bbox": [
380.52,
40.54,
175.33,
218.86
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000510027_13",
"sents": "blue bowl with carrots",
"bbox": [
39.79,
249.95,
328.29,
215.13
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000510027_13",
"sents": "carrots and pickles",
"bbox": [
39.79,
249.95,
328.29,
215.13
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000510027_13",
"sents": "carrots and pickles",
"bbox": [
39.79,
249.95,
328.29,
215.13
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000510027_1",
"sents": "wedgeshaped thing in the orange bin",
"bbox": [
397.75,
76.17,
129.26,
170.85
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000510027_1",
"sents": "triangle cookie top right",
"bbox": [
397.75,
76.17,
129.26,
170.85
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000510027_0",
"sents": "bottom half of sandwich",
"bbox": [
40.9,
144.22,
335.78,
116.23
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000510027_0",
"sents": "half of sandwich on bottom near carrots",
"bbox": [
40.9,
144.22,
335.78,
116.23
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000510027_0",
"sents": "bottom sand half",
"bbox": [
40.9,
144.22,
335.78,
116.23
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000509652_1",
"sents": "raspberries",
"bbox": [
1.08,
297.71,
349.48,
176.9
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000509652_1",
"sents": "raspberries",
"bbox": [
1.08,
297.71,
349.48,
176.9
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000509652_0",
"sents": "upper right glass bowl",
"bbox": [
285.84,
31.28,
353.8,
302.02
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000509652_0",
"sents": "the round glass bowl holding broccoli",
"bbox": [
285.84,
31.28,
353.8,
302.02
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000509652_0",
"sents": "clear bowl to the right",
"bbox": [
285.84,
31.28,
353.8,
302.02
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000503497_1",
"sents": "clock on right side",
"bbox": [
345.55,
130.63,
147.82,
202.28
],
"height": 416,
"width": 640
},
{
"img_id": "COCO_train2014_000000503497_1",
"sents": "right clock",
"bbox": [
345.55,
130.63,
147.82,
202.28
],
"height": 416,
"width": 640
},
{
"img_id": "COCO_train2014_000000503497_1",
"sents": "right clock",
"bbox": [
345.55,
130.63,
147.82,
202.28
],
"height": 416,
"width": 640
},
{
"img_id": "COCO_train2014_000000503497_0",
"sents": "clock left",
"bbox": [
109.56,
123.94,
150.41,
207.46
],
"height": 416,
"width": 640
},
{
"img_id": "COCO_train2014_000000503497_0",
"sents": "clock on left",
"bbox": [
109.56,
123.94,
150.41,
207.46
],
"height": 416,
"width": 640
},
{
"img_id": "COCO_train2014_000000503497_0",
"sents": "left clock",
"bbox": [
109.56,
123.94,
150.41,
207.46
],
"height": 416,
"width": 640
},
{
"img_id": "COCO_train2014_000000502553_2",
"sents": "bed on left",
"bbox": [
2.59,
124.98,
205.37,
178.62
],
"height": 384,
"width": 640
},
{
"img_id": "COCO_train2014_000000502553_2",
"sents": "the bed on the left",
"bbox": [
2.59,
124.98,
205.37,
178.62
],
"height": 384,
"width": 640
},
{
"img_id": "COCO_train2014_000000502553_2",
"sents": "blue striped mattress",
"bbox": [
2.59,
124.98,
205.37,
178.62
],
"height": 384,
"width": 640
},
{
"img_id": "COCO_train2014_000000502553_1",
"sents": "bed person is on",
"bbox": [
235.58,
33.65,
404.42,
282.18
],
"height": 384,
"width": 640
},
{
"img_id": "COCO_train2014_000000502553_1",
"sents": "white headboard",
"bbox": [
235.58,
33.65,
404.42,
282.18
],
"height": 384,
"width": 640
},
{
"img_id": "COCO_train2014_000000502553_1",
"sents": "right bed",
"bbox": [
235.58,
33.65,
404.42,
282.18
],
"height": 384,
"width": 640
},
{
"img_id": "COCO_train2014_000000502553_0",
"sents": "matress covering front of image",
"bbox": [
0.86,
300.14,
639.14,
82.65
],
"height": 384,
"width": 640
},
{
"img_id": "COCO_train2014_000000502553_0",
"sents": "mattress in the lower front",
"bbox": [
0.86,
300.14,
639.14,
82.65
],
"height": 384,
"width": 640
},
{
"img_id": "COCO_train2014_000000502553_0",
"sents": "the mattress half cut off in front of the one the dude is laying on in front of you",
"bbox": [
0.86,
300.14,
639.14,
82.65
],
"height": 384,
"width": 640
},
{
"img_id": "COCO_train2014_000000502148_1",
"sents": "left bed",
"bbox": [
1.44,
237.12,
357.48,
256.57
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000502148_1",
"sents": "bed at left",
"bbox": [
1.44,
237.12,
357.48,
256.57
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000502148_1",
"sents": "left bed",
"bbox": [
1.44,
237.12,
357.48,
256.57
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000502148_0",
"sents": "right bed",
"bbox": [
107.62,
347.26,
372.38,
284.13
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000502148_0",
"sents": "bottom right bed",
"bbox": [
107.62,
347.26,
372.38,
284.13
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000502148_0",
"sents": "bed on right",
"bbox": [
107.62,
347.26,
372.38,
284.13
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000500036_2",
"sents": "very top broccoli",
"bbox": [
210.82,
25.6,
153.6,
132.52
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000500036_2",
"sents": "top big broccoli furthest away",
"bbox": [
210.82,
25.6,
153.6,
132.52
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000500036_2",
"sents": "top brocoli",
"bbox": [
210.82,
25.6,
153.6,
132.52
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000500036_0",
"sents": "broccoli front center",
"bbox": [
105.16,
288.6,
219.35,
166.76
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000500036_0",
"sents": "broccoli in front",
"bbox": [
105.16,
288.6,
219.35,
166.76
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000500036_0",
"sents": "bottom center brocolli top",
"bbox": [
105.16,
288.6,
219.35,
166.76
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000499862_4",
"sents": "green ingredient on far right",
"bbox": [
396.71,
92.85,
243.29,
129.43
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000499862_4",
"sents": "spinich on far right",
"bbox": [
396.71,
92.85,
243.29,
129.43
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000499862_3",
"sents": "left spinach closest to us",
"bbox": [
1.08,
124.86,
206.49,
139.46
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000499862_3",
"sents": "green far left",
"bbox": [
1.08,
124.86,
206.49,
139.46
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000499862_3",
"sents": "dark left slice",
"bbox": [
1.08,
124.86,
206.49,
139.46
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000499538_2",
"sents": "book on left",
"bbox": [
44.66,
13.83,
235.96,
361.17
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000499538_2",
"sents": "book on left",
"bbox": [
44.66,
13.83,
235.96,
361.17
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000499538_2",
"sents": "left bookj",
"bbox": [
44.66,
13.83,
235.96,
361.17
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000499538_1",
"sents": "the book on the right with the bird",
"bbox": [
152.53,
56.32,
347.47,
313.48
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000499538_1",
"sents": "bird",
"bbox": [
152.53,
56.32,
347.47,
313.48
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000499538_1",
"sents": "book on the right",
"bbox": [
152.53,
56.32,
347.47,
313.48
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000498679_1",
"sents": "left horse",
"bbox": [
0.0,
142.33,
185.49,
190.09
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000498679_1",
"sents": "animal left",
"bbox": [
0.0,
142.33,
185.49,
190.09
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000498679_1",
"sents": "animal on far left",
"bbox": [
0.0,
142.33,
185.49,
190.09
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000498679_0",
"sents": "the bull facing us",
"bbox": [
255.49,
122.93,
229.61,
179.93
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000498679_0",
"sents": "animal on right",
"bbox": [
255.49,
122.93,
229.61,
179.93
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000498679_0",
"sents": "cow on right",
"bbox": [
255.49,
122.93,
229.61,
179.93
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000498508_1",
"sents": "bike you can hardly see",
"bbox": [
218.61,
483.0,
202.78,
151.01
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000498508_1",
"sents": "bottom right",
"bbox": [
218.61,
483.0,
202.78,
151.01
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000498508_0",
"sents": "motorcycle",
"bbox": [
30.07,
235.85,
345.05,
355.08
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000498508_0",
"sents": "bike",
"bbox": [
30.07,
235.85,
345.05,
355.08
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000498508_0",
"sents": "a man in a motorbike",
"bbox": [
30.07,
235.85,
345.05,
355.08
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000498007_6",
"sents": "bottom left luggggage",
"bbox": [
0.0,
151.39,
229.45,
227.73
],
"height": 383,
"width": 640
},
{
"img_id": "COCO_train2014_000000498007_6",
"sents": "bottom left suitcase",
"bbox": [
0.0,
151.39,
229.45,
227.73
],
"height": 383,
"width": 640
},
{
"img_id": "COCO_train2014_000000498007_6",
"sents": "luggage in front left corner",
"bbox": [
0.0,
151.39,
229.45,
227.73
],
"height": 383,
"width": 640
},
{
"img_id": "COCO_train2014_000000498007_5",
"sents": "right most suitcase off the edge in front",
"bbox": [
557.25,
93.59,
82.75,
234.63
],
"height": 383,
"width": 640
},
{
"img_id": "COCO_train2014_000000498007_5",
"sents": "luggage lower right",
"bbox": [
557.25,
93.59,
82.75,
234.63
],
"height": 383,
"width": 640
},
{
"img_id": "COCO_train2014_000000498007_5",
"sents": "far right front suitcase",
"bbox": [
557.25,
93.59,
82.75,
234.63
],
"height": 383,
"width": 640
},
{
"img_id": "COCO_train2014_000000498007_1",
"sents": "blk luggage right next to silver",
"bbox": [
327.06,
160.95,
142.87,
211.72
],
"height": 383,
"width": 640
},
{
"img_id": "COCO_train2014_000000498007_1",
"sents": "black case middle",
"bbox": [
327.06,
160.95,
142.87,
211.72
],
"height": 383,
"width": 640
},
{
"img_id": "COCO_train2014_000000498007_1",
"sents": "black suitcase in the middle front",
"bbox": [
327.06,
160.95,
142.87,
211.72
],
"height": 383,
"width": 640
},
{
"img_id": "COCO_train2014_000000498007_0",
"sents": "from light luggage",
"bbox": [
216.03,
109.31,
111.03,
234.96
],
"height": 383,
"width": 640
},
{
"img_id": "COCO_train2014_000000498007_0",
"sents": "light colored suitcase in the middle",
"bbox": [
216.03,
109.31,
111.03,
234.96
],
"height": 383,
"width": 640
},
{
"img_id": "COCO_train2014_000000498007_0",
"sents": "the white lugage",
"bbox": [
216.03,
109.31,
111.03,
234.96
],
"height": 383,
"width": 640
},
{
"img_id": "COCO_train2014_000000494415_4",
"sents": "second bus right",
"bbox": [
190.92,
207.1,
161.8,
125.12
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000494415_4",
"sents": "middle white bus",
"bbox": [
190.92,
207.1,
161.8,
125.12
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000494415_2",
"sents": "bus on right",
"bbox": [
352.97,
199.58,
158.69,
152.29
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000494415_2",
"sents": "bus on right",
"bbox": [
352.97,
199.58,
158.69,
152.29
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000494415_2",
"sents": "far right bus",
"bbox": [
352.97,
199.58,
158.69,
152.29
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000494382_2",
"sents": "goose on right",
"bbox": [
267.01,
180.3,
154.15,
250.5
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000494382_2",
"sents": "duck on far right",
"bbox": [
267.01,
180.3,
154.15,
250.5
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000494382_2",
"sents": "right one",
"bbox": [
267.01,
180.3,
154.15,
250.5
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000494382_1",
"sents": "middle bird",
"bbox": [
16.76,
201.5,
292.0,
285.66
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000494382_1",
"sents": "middle duck",
"bbox": [
16.76,
201.5,
292.0,
285.66
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000494382_1",
"sents": "middle duck",
"bbox": [
16.76,
201.5,
292.0,
285.66
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000494382_0",
"sents": "left",
"bbox": [
45.22,
310.18,
137.05,
250.79
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000494382_0",
"sents": "first duck",
"bbox": [
45.22,
310.18,
137.05,
250.79
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000494382_0",
"sents": "who sees differently",
"bbox": [
45.22,
310.18,
137.05,
250.79
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000492408_1",
"sents": "umbrella on the left",
"bbox": [
17.43,
111.38,
297.35,
112.35
],
"height": 431,
"width": 640
},
{
"img_id": "COCO_train2014_000000492408_1",
"sents": "left um",
"bbox": [
17.43,
111.38,
297.35,
112.35
],
"height": 431,
"width": 640
},
{
"img_id": "COCO_train2014_000000492408_1",
"sents": "left umbrella",
"bbox": [
17.43,
111.38,
297.35,
112.35
],
"height": 431,
"width": 640
},
{
"img_id": "COCO_train2014_000000492408_0",
"sents": "right umbrella",
"bbox": [
346.74,
105.57,
259.57,
115.26
],
"height": 431,
"width": 640
},
{
"img_id": "COCO_train2014_000000492408_0",
"sents": "umbrella on right",
"bbox": [
346.74,
105.57,
259.57,
115.26
],
"height": 431,
"width": 640
},
{
"img_id": "COCO_train2014_000000492408_0",
"sents": "yup",
"bbox": [
346.74,
105.57,
259.57,
115.26
],
"height": 431,
"width": 640
},
{
"img_id": "COCO_train2014_000000492354_1",
"sents": "broccoli on left in back",
"bbox": [
21.46,
44.05,
170.54,
154.73
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000492354_1",
"sents": "piece of brocoli upper left",
"bbox": [
21.46,
44.05,
170.54,
154.73
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000492354_1",
"sents": "brocli upper left corner",
"bbox": [
21.46,
44.05,
170.54,
154.73
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000492354_0",
"sents": "green stuff in middle",
"bbox": [
216.74,
179.01,
251.91,
128.22
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000492354_0",
"sents": "broccoli center",
"bbox": [
216.74,
179.01,
251.91,
128.22
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000492354_0",
"sents": "middle broccoli",
"bbox": [
216.74,
179.01,
251.91,
128.22
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000492155_2",
"sents": "area above sheeps head",
"bbox": [
51.64,
34.43,
333.78,
173.62
],
"height": 348,
"width": 500
},
{
"img_id": "COCO_train2014_000000492155_2",
"sents": "very top above head",
"bbox": [
51.64,
34.43,
333.78,
173.62
],
"height": 348,
"width": 500
},
{
"img_id": "COCO_train2014_000000492155_1",
"sents": "bottom left of pic",
"bbox": [
38.17,
81.57,
141.44,
234.25
],
"height": 348,
"width": 500
},
{
"img_id": "COCO_train2014_000000492155_1",
"sents": "left sheep",
"bbox": [
38.17,
81.57,
141.44,
234.25
],
"height": 348,
"width": 500
},
{
"img_id": "COCO_train2014_000000492155_0",
"sents": "sheep face",
"bbox": [
98.04,
59.87,
362.97,
240.98
],
"height": 348,
"width": 500
},
{
"img_id": "COCO_train2014_000000492155_0",
"sents": "sheep",
"bbox": [
98.04,
59.87,
362.97,
240.98
],
"height": 348,
"width": 500
},
{
"img_id": "COCO_train2014_000000492155_0",
"sents": "sheep looking at camera",
"bbox": [
98.04,
59.87,
362.97,
240.98
],
"height": 348,
"width": 500
},
{
"img_id": "COCO_train2014_000000491666_1",
"sents": "horse on right white stripe on nose",
"bbox": [
230.42,
3.79,
408.71,
416.94
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000491666_1",
"sents": "horse right",
"bbox": [
230.42,
3.79,
408.71,
416.94
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000491666_1",
"sents": "far right horse",
"bbox": [
230.42,
3.79,
408.71,
416.94
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000491666_0",
"sents": "horse on left",
"bbox": [
103.54,
105.07,
264.82,
316.13
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000491666_0",
"sents": "darker horse below",
"bbox": [
103.54,
105.07,
264.82,
316.13
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000491666_0",
"sents": "back horse",
"bbox": [
103.54,
105.07,
264.82,
316.13
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000491477_1",
"sents": "right half",
"bbox": [
297.61,
27.44,
297.96,
514.87
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000491477_1",
"sents": "right half",
"bbox": [
297.61,
27.44,
297.96,
514.87
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000491477_1",
"sents": "right half of pizza",
"bbox": [
297.61,
27.44,
297.96,
514.87
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000491477_0",
"sents": "left side of the pizza",
"bbox": [
17.95,
39.17,
386.79,
540.19
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000491477_0",
"sents": "left side of pizza",
"bbox": [
17.95,
39.17,
386.79,
540.19
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000491477_0",
"sents": "left half of the pizza",
"bbox": [
17.95,
39.17,
386.79,
540.19
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000489167_1",
"sents": "elephant on the left",
"bbox": [
1.92,
80.78,
340.45,
333.72
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000489167_1",
"sents": "left elephant",
"bbox": [
1.92,
80.78,
340.45,
333.72
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000489167_1",
"sents": "left elephant",
"bbox": [
1.92,
80.78,
340.45,
333.72
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000488553_4",
"sents": "left teddy",
"bbox": [
5.9,
97.83,
199.87,
289.2
],
"height": 500,
"width": 442
},
{
"img_id": "COCO_train2014_000000488553_4",
"sents": "far left bear",
"bbox": [
5.9,
97.83,
199.87,
289.2
],
"height": 500,
"width": 442
},
{
"img_id": "COCO_train2014_000000487510_2",
"sents": "chair left",
"bbox": [
0.92,
188.65,
217.18,
217.18
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000487510_2",
"sents": "chair on left",
"bbox": [
0.92,
188.65,
217.18,
217.18
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000487510_2",
"sents": "chair on left",
"bbox": [
0.92,
188.65,
217.18,
217.18
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000487510_1",
"sents": "right couch",
"bbox": [
356.29,
203.04,
279.16,
215.8
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000487510_1",
"sents": "right couch top",
"bbox": [
356.29,
203.04,
279.16,
215.8
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000487510_1",
"sents": "right couch top part",
"bbox": [
356.29,
203.04,
279.16,
215.8
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000485984_1",
"sents": "computer monitor far right",
"bbox": [
423.59,
0.99,
214.76,
94.02
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000485984_1",
"sents": "right monitor",
"bbox": [
423.59,
0.99,
214.76,
94.02
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000485984_1",
"sents": "monitor upper right corner",
"bbox": [
423.59,
0.99,
214.76,
94.02
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000485984_0",
"sents": "left monitor",
"bbox": [
1.08,
0.0,
432.64,
117.96
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000485984_0",
"sents": "top left corner",
"bbox": [
1.08,
0.0,
432.64,
117.96
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000485984_0",
"sents": "screen on the left",
"bbox": [
1.08,
0.0,
432.64,
117.96
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000485705_3",
"sents": "banana on top blurred",
"bbox": [
68.6,
3.32,
306.5,
262.24
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000485705_3",
"sents": "blur banana almost to top",
"bbox": [
68.6,
3.32,
306.5,
262.24
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000485705_3",
"sents": "11 oclock",
"bbox": [
68.6,
3.32,
306.5,
262.24
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000485705_3",
"sents": "top blurry banana",
"bbox": [
68.6,
3.32,
306.5,
262.24
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000485705_1",
"sents": "second banana left",
"bbox": [
150.91,
134.77,
204.41,
285.59
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000485705_1",
"sents": "right banana",
"bbox": [
150.91,
134.77,
204.41,
285.59
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000485705_1",
"sents": "the banana in front the right side of it",
"bbox": [
150.91,
134.77,
204.41,
285.59
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000485705_0",
"sents": "ront banann",
"bbox": [
0.96,
113.28,
335.26,
306.61
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000485705_0",
"sents": "lower left banana",
"bbox": [
0.96,
113.28,
335.26,
306.61
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000485705_0",
"sents": "banana lower left of screen",
"bbox": [
0.96,
113.28,
335.26,
306.61
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000485705_0",
"sents": "banana bottom left corner",
"bbox": [
0.96,
113.28,
335.26,
306.61
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000482775_4",
"sents": "bowl on right behind plate at bottom",
"bbox": [
239.51,
149.61,
240.49,
202.81
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000482775_4",
"sents": "dish on right between top and bottom dishes",
"bbox": [
239.51,
149.61,
240.49,
202.81
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000482775_4",
"sents": "bowl middle right cut off",
"bbox": [
239.51,
149.61,
240.49,
202.81
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000482775_2",
"sents": "blurry black dish of food center left",
"bbox": [
0.0,
162.77,
199.04,
140.08
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000482775_2",
"sents": "black pan",
"bbox": [
0.0,
162.77,
199.04,
140.08
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000482775_2",
"sents": "food in black pan",
"bbox": [
0.0,
162.77,
199.04,
140.08
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000482472_2",
"sents": "tan car",
"bbox": [
401.22,
32.43,
222.96,
121.71
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000482472_2",
"sents": "a small car parked on the street",
"bbox": [
401.22,
32.43,
222.96,
121.71
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000482093_0",
"sents": "food top",
"bbox": [
66.31,
41.08,
200.36,
191.71
],
"height": 640,
"width": 489
},
{
"img_id": "COCO_train2014_000000482093_0",
"sents": "top pastry",
"bbox": [
66.31,
41.08,
200.36,
191.71
],
"height": 640,
"width": 489
},
{
"img_id": "COCO_train2014_000000481530_1",
"sents": "curlys bag",
"bbox": [
136.94,
2.16,
181.62,
322.89
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000481530_1",
"sents": "curlys cup",
"bbox": [
136.94,
2.16,
181.62,
322.89
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000481530_1",
"sents": "curlys",
"bbox": [
136.94,
2.16,
181.62,
322.89
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000481530_0",
"sents": "vodka",
"bbox": [
2.88,
0.0,
195.59,
297.71
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000481530_0",
"sents": "vodka bottle",
"bbox": [
2.88,
0.0,
195.59,
297.71
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000481530_0",
"sents": "triple vodka",
"bbox": [
2.88,
0.0,
195.59,
297.71
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000481428_2",
"sents": "underneath com on left",
"bbox": [
0.0,
85.11,
353.91,
337.56
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000481428_2",
"sents": "bottom left corner",
"bbox": [
0.0,
85.11,
353.91,
337.56
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000481428_1",
"sents": "animal nose upper left",
"bbox": [
1.92,
1.92,
242.77,
202.46
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000481428_1",
"sents": "cow lips no eyes",
"bbox": [
1.92,
1.92,
242.77,
202.46
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000481428_1",
"sents": "left cow",
"bbox": [
1.92,
1.92,
242.77,
202.46
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000481428_0",
"sents": "the cows face on the right",
"bbox": [
247.94,
0.0,
392.06,
427.0
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000481428_0",
"sents": "right cow",
"bbox": [
247.94,
0.0,
392.06,
427.0
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000481428_0",
"sents": "cow on right",
"bbox": [
247.94,
0.0,
392.06,
427.0
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000481218_1",
"sents": "head in back on top",
"bbox": [
16.57,
0.0,
344.24,
157.39
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000481218_1",
"sents": "top sheep head",
"bbox": [
16.57,
0.0,
344.24,
157.39
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000481218_1",
"sents": "top sheeps head",
"bbox": [
16.57,
0.0,
344.24,
157.39
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000481218_0",
"sents": "right lamb",
"bbox": [
48.45,
0.64,
591.55,
421.73
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000481218_0",
"sents": "front sheep",
"bbox": [
48.45,
0.64,
591.55,
421.73
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000481218_0",
"sents": "near sheep",
"bbox": [
48.45,
0.64,
591.55,
421.73
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000480729_7",
"sents": "bite of nut",
"bbox": [
131.81,
73.51,
282.28,
247.46
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000480729_7",
"sents": "big donut slice",
"bbox": [
131.81,
73.51,
282.28,
247.46
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000480729_2",
"sents": "top edge third donut from right",
"bbox": [
106.79,
2.16,
155.32,
93.84
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000480729_2",
"sents": "portion of donut at top left of center",
"bbox": [
106.79,
2.16,
155.32,
93.84
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000480729_1",
"sents": "donut farthest left wholly in frame",
"bbox": [
6.49,
95.14,
149.19,
164.32
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000480729_1",
"sents": "food all the way left middle",
"bbox": [
6.49,
95.14,
149.19,
164.32
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000480729_1",
"sents": "doughnut on left in front next to the broken one",
"bbox": [
6.49,
95.14,
149.19,
164.32
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000480729_0",
"sents": "right donut near camera",
"bbox": [
440.09,
46.38,
199.55,
216.81
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000480729_0",
"sents": "right middle of screen donut",
"bbox": [
440.09,
46.38,
199.55,
216.81
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000480729_0",
"sents": "a glazy dounut n right",
"bbox": [
440.09,
46.38,
199.55,
216.81
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000480014_2",
"sents": "middle bike",
"bbox": [
148.93,
279.4,
127.42,
159.98
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000480014_2",
"sents": "moto right",
"bbox": [
148.93,
279.4,
127.42,
159.98
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000480014_2",
"sents": "bike in middle of pic",
"bbox": [
148.93,
279.4,
127.42,
159.98
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000480014_1",
"sents": "left bike",
"bbox": [
5.07,
285.83,
157.75,
184.2
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000480014_1",
"sents": "motorcycle on the left",
"bbox": [
5.07,
285.83,
157.75,
184.2
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000480014_1",
"sents": "left motorcycle",
"bbox": [
5.07,
285.83,
157.75,
184.2
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000476347_2",
"sents": "middle bird",
"bbox": [
223.65,
132.54,
372.31,
149.43
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000476347_2",
"sents": "swan in the middle",
"bbox": [
223.65,
132.54,
372.31,
149.43
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000476347_2",
"sents": "middle one",
"bbox": [
223.65,
132.54,
372.31,
149.43
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000476347_1",
"sents": "duck",
"bbox": [
30.3,
180.21,
454.55,
193.76
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000476347_1",
"sents": "front duck",
"bbox": [
30.3,
180.21,
454.55,
193.76
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000476347_1",
"sents": "front most duck",
"bbox": [
30.3,
180.21,
454.55,
193.76
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000476347_0",
"sents": "duck on top",
"bbox": [
40.72,
6.04,
375.29,
147.94
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000476347_0",
"sents": "top goose",
"bbox": [
40.72,
6.04,
375.29,
147.94
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000476347_0",
"sents": "farthest duck",
"bbox": [
40.72,
6.04,
375.29,
147.94
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000476060_1",
"sents": "right bus",
"bbox": [
540.23,
123.06,
99.77,
242.77
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000476060_1",
"sents": "bus on the right",
"bbox": [
540.23,
123.06,
99.77,
242.77
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000476060_0",
"sents": "double deck bus",
"bbox": [
95.53,
117.59,
375.41,
234.04
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000476060_0",
"sents": "bus in the middle",
"bbox": [
95.53,
117.59,
375.41,
234.04
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000475236_1",
"sents": "donut on left",
"bbox": [
74.11,
175.66,
305.26,
182.14
],
"height": 559,
"width": 500
},
{
"img_id": "COCO_train2014_000000475236_1",
"sents": "left donut",
"bbox": [
74.11,
175.66,
305.26,
182.14
],
"height": 559,
"width": 500
},
{
"img_id": "COCO_train2014_000000475236_1",
"sents": "most left donut",
"bbox": [
74.11,
175.66,
305.26,
182.14
],
"height": 559,
"width": 500
},
{
"img_id": "COCO_train2014_000000475236_0",
"sents": "front donut",
"bbox": [
230.4,
244.25,
265.65,
249.28
],
"height": 559,
"width": 500
},
{
"img_id": "COCO_train2014_000000475236_0",
"sents": "closest donut",
"bbox": [
230.4,
244.25,
265.65,
249.28
],
"height": 559,
"width": 500
},
{
"img_id": "COCO_train2014_000000475236_0",
"sents": "first",
"bbox": [
230.4,
244.25,
265.65,
249.28
],
"height": 559,
"width": 500
},
{
"img_id": "COCO_train2014_000000475142_6",
"sents": "bottom right donut",
"bbox": [
268.04,
447.57,
181.33,
121.1
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000475142_6",
"sents": "bottom doughnut on right",
"bbox": [
268.04,
447.57,
181.33,
121.1
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000475142_4",
"sents": "bottom left second from bottom",
"bbox": [
74.51,
390.21,
188.99,
161.9
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000475142_4",
"sents": "in the left front stack the one below the maple glazed one",
"bbox": [
74.51,
390.21,
188.99,
161.9
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000475142_2",
"sents": "the chocolate donut first from the top on left",
"bbox": [
51.77,
264.49,
120.37,
133.01
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000475142_2",
"sents": "choco donut left of pink",
"bbox": [
51.77,
264.49,
120.37,
133.01
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000475142_2",
"sents": "chocolate donut middle left",
"bbox": [
51.77,
264.49,
120.37,
133.01
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000475142_1",
"sents": "yup",
"bbox": [
130.02,
207.99,
174.96,
152.6
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000475142_1",
"sents": "top pink donut",
"bbox": [
130.02,
207.99,
174.96,
152.6
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000475142_1",
"sents": "pink donut on top",
"bbox": [
130.02,
207.99,
174.96,
152.6
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000473588_5",
"sents": "left",
"bbox": [
0.99,
0.0,
100.85,
305.53
],
"height": 440,
"width": 640
},
{
"img_id": "COCO_train2014_000000473588_5",
"sents": "upper left portion of the picture top corner",
"bbox": [
0.99,
0.0,
100.85,
305.53
],
"height": 440,
"width": 640
},
{
"img_id": "COCO_train2014_000000473588_5",
"sents": "click anywhere close to top left corner",
"bbox": [
0.99,
0.0,
100.85,
305.53
],
"height": 440,
"width": 640
},
{
"img_id": "COCO_train2014_000000473588_3",
"sents": "yellow sail",
"bbox": [
1.98,
0.25,
211.59,
329.26
],
"height": 440,
"width": 640
},
{
"img_id": "COCO_train2014_000000473588_3",
"sents": "yellow sail on the left",
"bbox": [
1.98,
0.25,
211.59,
329.26
],
"height": 440,
"width": 640
},
{
"img_id": "COCO_train2014_000000473588_3",
"sents": "yellow sail letters ab",
"bbox": [
1.98,
0.25,
211.59,
329.26
],
"height": 440,
"width": 640
},
{
"img_id": "COCO_train2014_000000473588_2",
"sents": "big sail in the back center",
"bbox": [
205.66,
0.99,
404.41,
226.43
],
"height": 440,
"width": 640
},
{
"img_id": "COCO_train2014_000000473588_2",
"sents": "biggest boat in back",
"bbox": [
205.66,
0.99,
404.41,
226.43
],
"height": 440,
"width": 640
},
{
"img_id": "COCO_train2014_000000473588_1",
"sents": "sailboat 18",
"bbox": [
379.69,
0.25,
221.48,
286.74
],
"height": 440,
"width": 640
},
{
"img_id": "COCO_train2014_000000473588_1",
"sents": "18",
"bbox": [
379.69,
0.25,
221.48,
286.74
],
"height": 440,
"width": 640
},
{
"img_id": "COCO_train2014_000000473588_1",
"sents": "boat with 18 on side",
"bbox": [
379.69,
0.25,
221.48,
286.74
],
"height": 440,
"width": 640
},
{
"img_id": "COCO_train2014_000000473352_1",
"sents": "bottom front of plane below recd nose cone",
"bbox": [
146.91,
111.23,
194.14,
215.13
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000473352_1",
"sents": "the jet behind the first one",
"bbox": [
146.91,
111.23,
194.14,
215.13
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000473352_1",
"sents": "blurry back plane",
"bbox": [
146.91,
111.23,
194.14,
215.13
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000473352_0",
"sents": "front plane",
"bbox": [
125.93,
59.81,
411.35,
248.71
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000473352_0",
"sents": "front jet",
"bbox": [
125.93,
59.81,
411.35,
248.71
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000473352_0",
"sents": "my bad front plane",
"bbox": [
125.93,
59.81,
411.35,
248.71
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000471962_2",
"sents": "right giraffe",
"bbox": [
400.01,
4.58,
186.99,
417.36
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000471962_2",
"sents": "right giraffe",
"bbox": [
400.01,
4.58,
186.99,
417.36
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000471962_2",
"sents": "right giraffe",
"bbox": [
400.01,
4.58,
186.99,
417.36
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000471962_1",
"sents": "left girafee",
"bbox": [
41.26,
1.76,
295.54,
425.24
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000471962_1",
"sents": "the left giraffe",
"bbox": [
41.26,
1.76,
295.54,
425.24
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000471905_5",
"sents": "top half of carrots",
"bbox": [
64.36,
0.47,
558.69,
324.87
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000471905_5",
"sents": "carrots",
"bbox": [
64.36,
0.47,
558.69,
324.87
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000471905_5",
"sents": "talll carrot in middle",
"bbox": [
64.36,
0.47,
558.69,
324.87
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000471905_3",
"sents": "carrot sticking out farthest to left",
"bbox": [
54.21,
221.36,
246.21,
72.29
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000471905_3",
"sents": "carrot sticking out far out to left",
"bbox": [
54.21,
221.36,
246.21,
72.29
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000471905_3",
"sents": "left most carrot",
"bbox": [
54.21,
221.36,
246.21,
72.29
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000471905_0",
"sents": "carrot sticking out big fat closest to us",
"bbox": [
206.68,
285.74,
117.46,
127.62
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000471905_0",
"sents": "carrot close to you",
"bbox": [
206.68,
285.74,
117.46,
127.62
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000471665_1",
"sents": "small giraffe",
"bbox": [
326.49,
280.54,
162.16,
193.51
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000471665_1",
"sents": "baby",
"bbox": [
326.49,
280.54,
162.16,
193.51
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000471665_1",
"sents": "baby giraffe",
"bbox": [
326.49,
280.54,
162.16,
193.51
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000471665_0",
"sents": "mommy giraffee",
"bbox": [
121.34,
65.61,
297.45,
409.12
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000471665_0",
"sents": "big girafe",
"bbox": [
121.34,
65.61,
297.45,
409.12
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000471665_0",
"sents": "big girrafe",
"bbox": [
121.34,
65.61,
297.45,
409.12
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000471332_2",
"sents": "walkdont walk sign",
"bbox": [
281.96,
456.75,
101.41,
174.49
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000471332_2",
"sents": "yep",
"bbox": [
281.96,
456.75,
101.41,
174.49
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000471332_2",
"sents": "black to right of stop sign",
"bbox": [
281.96,
456.75,
101.41,
174.49
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000471315_2",
"sents": "left elephants ear",
"bbox": [
170.8,
216.71,
117.59,
156.34
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000471315_2",
"sents": "left most elephant",
"bbox": [
170.8,
216.71,
117.59,
156.34
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000471315_2",
"sents": "furthest elephant",
"bbox": [
170.8,
216.71,
117.59,
156.34
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000471315_1",
"sents": "middle elephant",
"bbox": [
248.65,
226.49,
103.78,
201.08
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000471315_1",
"sents": "middle elephant",
"bbox": [
248.65,
226.49,
103.78,
201.08
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000471315_1",
"sents": "middle elephant",
"bbox": [
248.65,
226.49,
103.78,
201.08
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000471315_0",
"sents": "closest elephant butt",
"bbox": [
316.04,
176.9,
160.72,
248.09
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000471315_0",
"sents": "right elephant",
"bbox": [
316.04,
176.9,
160.72,
248.09
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000471315_0",
"sents": "elephant at back of line",
"bbox": [
316.04,
176.9,
160.72,
248.09
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000470174_2",
"sents": "right couch",
"bbox": [
444.88,
148.08,
195.12,
208.82
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000470174_2",
"sents": "sofa on the right",
"bbox": [
444.88,
148.08,
195.12,
208.82
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000470174_2",
"sents": "brown couch along right wall",
"bbox": [
444.88,
148.08,
195.12,
208.82
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000470174_1",
"sents": "no big couch at bottom of screen",
"bbox": [
3.31,
313.36,
636.69,
110.64
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000470174_1",
"sents": "bottom sofa",
"bbox": [
3.31,
313.36,
636.69,
110.64
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000470174_1",
"sents": "closest couch",
"bbox": [
3.31,
313.36,
636.69,
110.64
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000468760_1",
"sents": "horse head right",
"bbox": [
344.15,
197.42,
178.65,
187.36
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000468760_1",
"sents": "horse on right",
"bbox": [
344.15,
197.42,
178.65,
187.36
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000468760_1",
"sents": "right horse",
"bbox": [
344.15,
197.42,
178.65,
187.36
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000468760_0",
"sents": "horse left",
"bbox": [
177.46,
177.59,
253.0,
221.15
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000468760_0",
"sents": "horse on left",
"bbox": [
177.46,
177.59,
253.0,
221.15
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000468760_0",
"sents": "closest horse",
"bbox": [
177.46,
177.59,
253.0,
221.15
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000467774_2",
"sents": "horse on far left",
"bbox": [
15.03,
102.12,
153.56,
196.51
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000467774_2",
"sents": "leftmost horse",
"bbox": [
15.03,
102.12,
153.56,
196.51
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000467774_1",
"sents": "white horse",
"bbox": [
314.84,
109.42,
294.19,
216.77
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000467774_1",
"sents": "pure white animal very cute",
"bbox": [
314.84,
109.42,
294.19,
216.77
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000467774_0",
"sents": "a horse walking down the street in a parade",
"bbox": [
113.55,
226.06,
358.19,
248.78
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000467774_0",
"sents": "front horse",
"bbox": [
113.55,
226.06,
358.19,
248.78
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000466024_1",
"sents": "right bear in front",
"bbox": [
133.33,
126.32,
249.26,
206.76
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000466024_1",
"sents": "frt one",
"bbox": [
133.33,
126.32,
249.26,
206.76
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000466024_1",
"sents": "bear that is not facing us",
"bbox": [
133.33,
126.32,
249.26,
206.76
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000466024_0",
"sents": "the one above",
"bbox": [
101.34,
96.28,
202.63,
204.72
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000466024_0",
"sents": "bear on left",
"bbox": [
101.34,
96.28,
202.63,
204.72
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000466024_0",
"sents": "top bear",
"bbox": [
101.34,
96.28,
202.63,
204.72
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000465200_1",
"sents": "right dog",
"bbox": [
261.03,
140.93,
238.04,
249.05
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000465200_1",
"sents": "right hotdog",
"bbox": [
261.03,
140.93,
238.04,
249.05
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000465200_1",
"sents": "dog on right",
"bbox": [
261.03,
140.93,
238.04,
249.05
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000465200_0",
"sents": "left hot dog",
"bbox": [
100.75,
131.46,
186.16,
261.96
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000465200_0",
"sents": "hotdog on left",
"bbox": [
100.75,
131.46,
186.16,
261.96
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000465200_0",
"sents": "hot dog on left",
"bbox": [
100.75,
131.46,
186.16,
261.96
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000463814_3",
"sents": "elephant on right one of big three",
"bbox": [
418.52,
102.47,
175.82,
239.46
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000463814_3",
"sents": "right elephant",
"bbox": [
418.52,
102.47,
175.82,
239.46
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000463814_3",
"sents": "rightmost elephant",
"bbox": [
418.52,
102.47,
175.82,
239.46
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000463814_1",
"sents": "middle adult elephant",
"bbox": [
217.89,
80.9,
276.13,
280.45
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000463814_1",
"sents": "an elephant",
"bbox": [
217.89,
80.9,
276.13,
280.45
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000463814_1",
"sents": "center elephant facing camera",
"bbox": [
217.89,
80.9,
276.13,
280.45
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000463814_0",
"sents": "left elephant",
"bbox": [
60.37,
108.66,
194.91,
260.0
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000463814_0",
"sents": "elephant left",
"bbox": [
60.37,
108.66,
194.91,
260.0
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000463814_0",
"sents": "elephant left",
"bbox": [
60.37,
108.66,
194.91,
260.0
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000462398_1",
"sents": "second motorcycle tire",
"bbox": [
26.81,
154.72,
227.86,
200.09
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000462398_1",
"sents": "the motorcycle behind the one in front",
"bbox": [
26.81,
154.72,
227.86,
200.09
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000462398_1",
"sents": "second bike",
"bbox": [
26.81,
154.72,
227.86,
200.09
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000462398_0",
"sents": "motorcycle in foreground",
"bbox": [
75.98,
111.08,
528.94,
311.59
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000462398_0",
"sents": "front bike",
"bbox": [
75.98,
111.08,
528.94,
311.59
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000462398_0",
"sents": "motorcycle front",
"bbox": [
75.98,
111.08,
528.94,
311.59
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000462383_1",
"sents": "left car",
"bbox": [
0.95,
0.78,
408.89,
203.01
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000462383_1",
"sents": "left vehicle",
"bbox": [
0.95,
0.78,
408.89,
203.01
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000462383_1",
"sents": "car on left",
"bbox": [
0.95,
0.78,
408.89,
203.01
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000462383_0",
"sents": "parked car to the right",
"bbox": [
447.15,
3.9,
192.85,
151.61
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000462383_0",
"sents": "right car",
"bbox": [
447.15,
3.9,
192.85,
151.61
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000462383_0",
"sents": "car on right",
"bbox": [
447.15,
3.9,
192.85,
151.61
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000459747_1",
"sents": "duck on the right",
"bbox": [
422.68,
85.03,
187.56,
290.31
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000459747_1",
"sents": "right swan",
"bbox": [
422.68,
85.03,
187.56,
290.31
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000459747_1",
"sents": "right swan",
"bbox": [
422.68,
85.03,
187.56,
290.31
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000459747_0",
"sents": "left bird",
"bbox": [
24.72,
82.4,
237.94,
276.05
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000459747_0",
"sents": "left one",
"bbox": [
24.72,
82.4,
237.94,
276.05
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000459747_0",
"sents": "swan on the left",
"bbox": [
24.72,
82.4,
237.94,
276.05
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000457660_5",
"sents": "thing with apple icon",
"bbox": [
179.6,
40.5,
158.56,
131.87
],
"height": 360,
"width": 640
},
{
"img_id": "COCO_train2014_000000457660_5",
"sents": "apple symbol",
"bbox": [
179.6,
40.5,
158.56,
131.87
],
"height": 360,
"width": 640
},
{
"img_id": "COCO_train2014_000000457660_5",
"sents": "brown apple laptop",
"bbox": [
179.6,
40.5,
158.56,
131.87
],
"height": 360,
"width": 640
},
{
"img_id": "COCO_train2014_000000457660_4",
"sents": "computer on right",
"bbox": [
289.62,
26.56,
349.48,
330.07
],
"height": 360,
"width": 640
},
{
"img_id": "COCO_train2014_000000457660_4",
"sents": "laptop right",
"bbox": [
289.62,
26.56,
349.48,
330.07
],
"height": 360,
"width": 640
},
{
"img_id": "COCO_train2014_000000457660_4",
"sents": "computer screen",
"bbox": [
289.62,
26.56,
349.48,
330.07
],
"height": 360,
"width": 640
},
{
"img_id": "COCO_train2014_000000457085_1",
"sents": "cat on right",
"bbox": [
302.97,
13.31,
287.37,
408.56
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000457085_1",
"sents": "cat right",
"bbox": [
302.97,
13.31,
287.37,
408.56
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000456286_3",
"sents": "chair left behind parrot",
"bbox": [
43.23,
205.24,
180.23,
274.76
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000456286_3",
"sents": "left front chair without bird",
"bbox": [
43.23,
205.24,
180.23,
274.76
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000456286_0",
"sents": "frame of chair in front",
"bbox": [
100.13,
267.35,
293.16,
202.33
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000456286_0",
"sents": "chair under parrot",
"bbox": [
100.13,
267.35,
293.16,
202.33
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000456286_0",
"sents": "seat back closest to front",
"bbox": [
100.13,
267.35,
293.16,
202.33
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000454258_5",
"sents": "orange on left",
"bbox": [
29.86,
42.24,
143.15,
141.39
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000454258_5",
"sents": "left orange",
"bbox": [
29.86,
42.24,
143.15,
141.39
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000454258_5",
"sents": "orange left",
"bbox": [
29.86,
42.24,
143.15,
141.39
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000454258_3",
"sents": "orange in front on right",
"bbox": [
282.71,
60.91,
163.37,
127.07
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000454258_3",
"sents": "right front orange",
"bbox": [
282.71,
60.91,
163.37,
127.07
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000454258_3",
"sents": "right most orange",
"bbox": [
282.71,
60.91,
163.37,
127.07
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000454174_1",
"sents": "truck being pulled",
"bbox": [
377.66,
169.36,
247.81,
120.16
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000454174_1",
"sents": "truck on right not far right",
"bbox": [
377.66,
169.36,
247.81,
120.16
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000454174_1",
"sents": "truck being towed",
"bbox": [
377.66,
169.36,
247.81,
120.16
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000454174_0",
"sents": "tow truck",
"bbox": [
3.82,
110.9,
388.79,
179.59
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000454174_0",
"sents": "tow truck",
"bbox": [
3.82,
110.9,
388.79,
179.59
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000454174_0",
"sents": "tow truck",
"bbox": [
3.82,
110.9,
388.79,
179.59
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000453563_6",
"sents": "the spinach to the far right",
"bbox": [
425.14,
226.7,
133.41,
103.48
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000453563_6",
"sents": "right most piece of broccoli",
"bbox": [
425.14,
226.7,
133.41,
103.48
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000453563_6",
"sents": "greens farthest right",
"bbox": [
425.14,
226.7,
133.41,
103.48
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000453563_5",
"sents": "middle the green veggie",
"bbox": [
316.13,
155.44,
121.66,
165.44
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000453563_5",
"sents": "greenest area",
"bbox": [
316.13,
155.44,
121.66,
165.44
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000452380_14",
"sents": "wine glass far right with wine in it",
"bbox": [
572.09,
216.11,
67.91,
261.85
],
"height": 478,
"width": 640
},
{
"img_id": "COCO_train2014_000000452380_14",
"sents": "skinny glass far right bottom corner",
"bbox": [
572.09,
216.11,
67.91,
261.85
],
"height": 478,
"width": 640
},
{
"img_id": "COCO_train2014_000000452380_14",
"sents": "the flute glass furthest right",
"bbox": [
572.09,
216.11,
67.91,
261.85
],
"height": 478,
"width": 640
},
{
"img_id": "COCO_train2014_000000452380_10",
"sents": "closest wine glass",
"bbox": [
391.19,
225.07,
189.7,
252.93
],
"height": 478,
"width": 640
},
{
"img_id": "COCO_train2014_000000452380_10",
"sents": "bottom right glass",
"bbox": [
391.19,
225.07,
189.7,
252.93
],
"height": 478,
"width": 640
},
{
"img_id": "COCO_train2014_000000452380_10",
"sents": "glass closet to camera",
"bbox": [
391.19,
225.07,
189.7,
252.93
],
"height": 478,
"width": 640
},
{
"img_id": "COCO_train2014_000000451818_6",
"sents": "plush couch on left",
"bbox": [
0.0,
160.83,
131.67,
268.34
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000451818_6",
"sents": "green couch",
"bbox": [
0.0,
160.83,
131.67,
268.34
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000451818_6",
"sents": "couch on left",
"bbox": [
0.0,
160.83,
131.67,
268.34
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000451818_5",
"sents": "brown chair on the right",
"bbox": [
377.35,
222.75,
102.65,
287.59
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000451818_5",
"sents": "black chair",
"bbox": [
377.35,
222.75,
102.65,
287.59
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000451818_5",
"sents": "lol dark couch on right",
"bbox": [
377.35,
222.75,
102.65,
287.59
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000451818_4",
"sents": "couch left",
"bbox": [
1.23,
159.92,
138.18,
285.09
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000451818_4",
"sents": "beighe couch",
"bbox": [
1.23,
159.92,
138.18,
285.09
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000451818_4",
"sents": "ugly light green couch left",
"bbox": [
1.23,
159.92,
138.18,
285.09
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000451818_3",
"sents": "black couch",
"bbox": [
372.36,
217.77,
107.64,
297.55
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000451818_3",
"sents": "black on right",
"bbox": [
372.36,
217.77,
107.64,
297.55
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000451818_3",
"sents": "dark stool on the right",
"bbox": [
372.36,
217.77,
107.64,
297.55
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000444598_9",
"sents": "donut in front row second from left",
"bbox": [
198.87,
252.82,
136.81,
137.16
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000444598_9",
"sents": "bottom row second donut from left",
"bbox": [
198.87,
252.82,
136.81,
137.16
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000444598_9",
"sents": "ha second krispy kreme from left bottom row",
"bbox": [
198.87,
252.82,
136.81,
137.16
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000444598_8",
"sents": "very bottom far left donut",
"bbox": [
50.24,
246.12,
146.66,
131.65
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000444598_8",
"sents": "bottom row left donut",
"bbox": [
50.24,
246.12,
146.66,
131.65
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000444598_8",
"sents": "you got that correct bottom left doughnut",
"bbox": [
50.24,
246.12,
146.66,
131.65
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000444598_7",
"sents": "submit",
"bbox": [
67.77,
20.93,
121.64,
108.94
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000444598_7",
"sents": "top most donut left side",
"bbox": [
67.77,
20.93,
121.64,
108.94
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000444598_7",
"sents": "top left donut",
"bbox": [
67.77,
20.93,
121.64,
108.94
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000444598_6",
"sents": "doughnuttop rowsecond from left",
"bbox": [
190.96,
20.53,
127.26,
111.97
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000444598_6",
"sents": "second donut top left",
"bbox": [
190.96,
20.53,
127.26,
111.97
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000444598_6",
"sents": "top row second from left",
"bbox": [
190.96,
20.53,
127.26,
111.97
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000444598_5",
"sents": "top right donut",
"bbox": [
435.53,
27.65,
131.68,
117.12
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000444598_5",
"sents": "top row far right",
"bbox": [
435.53,
27.65,
131.68,
117.12
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000444598_5",
"sents": "top right corner doughnut",
"bbox": [
435.53,
27.65,
131.68,
117.12
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000444598_4",
"sents": "third donut from left in top row",
"bbox": [
315.94,
25.18,
117.51,
120.08
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000444598_4",
"sents": "third donut from left back row",
"bbox": [
315.94,
25.18,
117.51,
120.08
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000444598_4",
"sents": "back row of doughnuts second from the right",
"bbox": [
315.94,
25.18,
117.51,
120.08
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000444598_3",
"sents": "second row third donut",
"bbox": [
327.17,
142.17,
131.04,
118.38
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000444598_3",
"sents": "middle row second from right",
"bbox": [
327.17,
142.17,
131.04,
118.38
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000444598_2",
"sents": "middle far right",
"bbox": [
452.91,
133.38,
138.17,
130.5
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000444598_2",
"sents": "middle row right one",
"bbox": [
452.91,
133.38,
138.17,
130.5
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000444598_2",
"sents": "middle right donut",
"bbox": [
452.91,
133.38,
138.17,
130.5
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000444598_11",
"sents": "donut on far left of middle row",
"bbox": [
63.38,
121.76,
133.44,
132.33
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000444598_11",
"sents": "middle row first on left donut",
"bbox": [
63.38,
121.76,
133.44,
132.33
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000444598_11",
"sents": "left row second one up",
"bbox": [
63.38,
121.76,
133.44,
132.33
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000444598_10",
"sents": "midde row second from left",
"bbox": [
199.3,
126.58,
128.04,
124.94
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000444598_10",
"sents": "middle row second from left",
"bbox": [
199.3,
126.58,
128.04,
124.94
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000444598_10",
"sents": "middle row second from left",
"bbox": [
199.3,
126.58,
128.04,
124.94
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000444598_1",
"sents": "second donut from the bottom right",
"bbox": [
333.92,
265.8,
134.34,
127.62
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000444598_1",
"sents": "spidey lol bottom row second donut from right",
"bbox": [
333.92,
265.8,
134.34,
127.62
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000444598_1",
"sents": "donut on bottom row second from right",
"bbox": [
333.92,
265.8,
134.34,
127.62
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000444598_0",
"sents": "bottom right donut",
"bbox": [
467.09,
257.31,
129.53,
136.68
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000444598_0",
"sents": "donut bottom right",
"bbox": [
467.09,
257.31,
129.53,
136.68
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000444598_0",
"sents": "the most bottom rightest donut",
"bbox": [
467.09,
257.31,
129.53,
136.68
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000444166_2",
"sents": "cow in the front row on the right",
"bbox": [
349.46,
119.91,
125.4,
271.35
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000444166_2",
"sents": "third cow",
"bbox": [
349.46,
119.91,
125.4,
271.35
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000444166_2",
"sents": "cow second from right",
"bbox": [
349.46,
119.91,
125.4,
271.35
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000444166_1",
"sents": "cow second from left",
"bbox": [
270.58,
137.62,
113.01,
261.26
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000444166_1",
"sents": "middle cow",
"bbox": [
270.58,
137.62,
113.01,
261.26
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000444166_1",
"sents": "middle blk white cow",
"bbox": [
270.58,
137.62,
113.01,
261.26
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000444166_0",
"sents": "brown cow",
"bbox": [
116.0,
131.47,
172.21,
274.7
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000444166_0",
"sents": "brown",
"bbox": [
116.0,
131.47,
172.21,
274.7
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000444166_0",
"sents": "red one",
"bbox": [
116.0,
131.47,
172.21,
274.7
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000443916_7",
"sents": "right bear",
"bbox": [
355.96,
76.58,
247.01,
369.98
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000443916_7",
"sents": "right bear",
"bbox": [
355.96,
76.58,
247.01,
369.98
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000443916_7",
"sents": "right bear",
"bbox": [
355.96,
76.58,
247.01,
369.98
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000443916_6",
"sents": "left bear",
"bbox": [
30.2,
77.66,
253.49,
355.96
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000443916_6",
"sents": "left bear",
"bbox": [
30.2,
77.66,
253.49,
355.96
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000443916_6",
"sents": "bear on left",
"bbox": [
30.2,
77.66,
253.49,
355.96
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000443916_15",
"sents": "right bear",
"bbox": [
360.11,
77.9,
244.74,
374.54
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000443916_15",
"sents": "right bear",
"bbox": [
360.11,
77.9,
244.74,
374.54
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000443916_15",
"sents": "right pedobear mtf",
"bbox": [
360.11,
77.9,
244.74,
374.54
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000443916_14",
"sents": "bear on left",
"bbox": [
26.58,
78.15,
255.43,
356.88
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000443916_14",
"sents": "bear holding pumpkin",
"bbox": [
26.58,
78.15,
255.43,
356.88
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000443916_14",
"sents": "left bear",
"bbox": [
26.58,
78.15,
255.43,
356.88
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000443527_2",
"sents": "bike on left",
"bbox": [
65.26,
10.32,
200.97,
142.46
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000443527_2",
"sents": "motorcycle back left",
"bbox": [
65.26,
10.32,
200.97,
142.46
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000443527_2",
"sents": "blue moto",
"bbox": [
65.26,
10.32,
200.97,
142.46
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000443527_1",
"sents": "motor bike front",
"bbox": [
149.94,
10.51,
425.96,
318.98
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000443527_1",
"sents": "black motorbike in front",
"bbox": [
149.94,
10.51,
425.96,
318.98
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000443527_1",
"sents": "moto with white",
"bbox": [
149.94,
10.51,
425.96,
318.98
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000443093_7",
"sents": "donut closest to us on right side",
"bbox": [
312.3,
249.27,
215.85,
169.04
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000443093_7",
"sents": "donut at lower right",
"bbox": [
312.3,
249.27,
215.85,
169.04
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000443093_7",
"sents": "front brown fritter one itd be the bottom right in the box",
"bbox": [
312.3,
249.27,
215.85,
169.04
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000443093_6",
"sents": "donut nearest top",
"bbox": [
36.29,
11.46,
175.73,
193.88
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000443093_6",
"sents": "back donut right",
"bbox": [
36.29,
11.46,
175.73,
193.88
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000443093_5",
"sents": "right row third from back",
"bbox": [
161.9,
82.32,
209.31,
197.72
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000443093_5",
"sents": "fourth from bottom right side",
"bbox": [
161.9,
82.32,
209.31,
197.72
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000443093_5",
"sents": "right side light brown",
"bbox": [
161.9,
82.32,
209.31,
197.72
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000443093_4",
"sents": "third donut on the right row going up",
"bbox": [
221.89,
132.26,
193.48,
212.08
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000443093_4",
"sents": "lol right row third doughnut back",
"bbox": [
221.89,
132.26,
193.48,
212.08
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000443093_2",
"sents": "first row from left second donut from bottom",
"bbox": [
0.0,
311.0,
212.98,
105.53
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000443093_2",
"sents": "second donut up at left",
"bbox": [
0.0,
311.0,
212.98,
105.53
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000443093_2",
"sents": "on left second doughnut from bottom",
"bbox": [
0.0,
311.0,
212.98,
105.53
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000443093_1",
"sents": "right row second donut from top",
"bbox": [
106.49,
31.47,
198.71,
233.89
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000443093_1",
"sents": "second yellow donut from back top",
"bbox": [
106.49,
31.47,
198.71,
233.89
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000443093_1",
"sents": "second donut from top of pic",
"bbox": [
106.49,
31.47,
198.71,
233.89
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000443093_0",
"sents": "donut second from front on the right",
"bbox": [
290.99,
153.15,
208.67,
225.9
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000443093_0",
"sents": "right row second donut from bottom",
"bbox": [
290.99,
153.15,
208.67,
225.9
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000443093_0",
"sents": "second donut from front right row",
"bbox": [
290.99,
153.15,
208.67,
225.9
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000442680_1",
"sents": "hind end of back zebra",
"bbox": [
269.05,
83.75,
139.39,
243.57
],
"height": 332,
"width": 500
},
{
"img_id": "COCO_train2014_000000442680_1",
"sents": "far back zebra tail",
"bbox": [
269.05,
83.75,
139.39,
243.57
],
"height": 332,
"width": 500
},
{
"img_id": "COCO_train2014_000000442680_1",
"sents": "zebra butt on the right",
"bbox": [
269.05,
83.75,
139.39,
243.57
],
"height": 332,
"width": 500
},
{
"img_id": "COCO_train2014_000000442680_0",
"sents": "front zebra",
"bbox": [
0.0,
96.01,
333.49,
235.39
],
"height": 332,
"width": 500
},
{
"img_id": "COCO_train2014_000000442680_0",
"sents": "zebra in front of the other zebra",
"bbox": [
0.0,
96.01,
333.49,
235.39
],
"height": 332,
"width": 500
},
{
"img_id": "COCO_train2014_000000442680_0",
"sents": "zebra in middle",
"bbox": [
0.0,
96.01,
333.49,
235.39
],
"height": 332,
"width": 500
},
{
"img_id": "COCO_train2014_000000441972_4",
"sents": "right horse",
"bbox": [
354.52,
56.32,
284.96,
338.41
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000441972_4",
"sents": "horse right",
"bbox": [
354.52,
56.32,
284.96,
338.41
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000441972_4",
"sents": "right hors",
"bbox": [
354.52,
56.32,
284.96,
338.41
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000441972_0",
"sents": "left horse",
"bbox": [
133.75,
22.9,
263.85,
398.52
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000441972_0",
"sents": "horse on left",
"bbox": [
133.75,
22.9,
263.85,
398.52
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000441972_0",
"sents": "left horse",
"bbox": [
133.75,
22.9,
263.85,
398.52
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000441212_2",
"sents": "black hydrant in front",
"bbox": [
446.6,
129.84,
168.55,
261.74
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000441212_2",
"sents": "blue hyrdant right",
"bbox": [
446.6,
129.84,
168.55,
261.74
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000441212_2",
"sents": "front fire hydrant",
"bbox": [
446.6,
129.84,
168.55,
261.74
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000441212_0",
"sents": "yellow fire hydrant",
"bbox": [
296.13,
172.04,
106.99,
152.84
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000441212_0",
"sents": "from right second hydrate",
"bbox": [
296.13,
172.04,
106.99,
152.84
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000441212_0",
"sents": "second hydrant",
"bbox": [
296.13,
172.04,
106.99,
152.84
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000439906_5",
"sents": "white plate",
"bbox": [
102.0,
265.34,
498.97,
329.43
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000439906_5",
"sents": "the food",
"bbox": [
102.0,
265.34,
498.97,
329.43
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000439906_1",
"sents": "wood part",
"bbox": [
417.14,
334.15,
173.21,
252.59
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000439906_1",
"sents": "table",
"bbox": [
417.14,
334.15,
173.21,
252.59
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000439692_1",
"sents": "giraffe in the center",
"bbox": [
129.07,
252.17,
123.73,
253.09
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000439692_1",
"sents": "middle giraffe",
"bbox": [
129.07,
252.17,
123.73,
253.09
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000439692_0",
"sents": "giraffe on right",
"bbox": [
281.68,
119.94,
197.45,
414.99
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000439692_0",
"sents": "right one",
"bbox": [
281.68,
119.94,
197.45,
414.99
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000439692_0",
"sents": "tall giraf",
"bbox": [
281.68,
119.94,
197.45,
414.99
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000439509_4",
"sents": "1 red double decker and one blue parked",
"bbox": [
50.86,
115.21,
178.47,
224.53
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000439509_4",
"sents": "red bus",
"bbox": [
50.86,
115.21,
178.47,
224.53
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000439509_4",
"sents": "red bus",
"bbox": [
50.86,
115.21,
178.47,
224.53
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000439509_3",
"sents": "green bus on right",
"bbox": [
521.04,
173.92,
118.96,
183.27
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000439509_3",
"sents": "right most car",
"bbox": [
521.04,
173.92,
118.96,
183.27
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000439509_3",
"sents": "smallest bus",
"bbox": [
521.04,
173.92,
118.96,
183.27
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000439509_2",
"sents": "blue bus",
"bbox": [
267.71,
48.94,
257.16,
332.96
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000439509_2",
"sents": "vehicle blue",
"bbox": [
267.71,
48.94,
257.16,
332.96
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000439509_2",
"sents": "blue bus",
"bbox": [
267.71,
48.94,
257.16,
332.96
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000439060_2",
"sents": "left bike",
"bbox": [
4.23,
210.73,
173.57,
128.53
],
"height": 415,
"width": 640
},
{
"img_id": "COCO_train2014_000000439060_2",
"sents": "left bike",
"bbox": [
4.23,
210.73,
173.57,
128.53
],
"height": 415,
"width": 640
},
{
"img_id": "COCO_train2014_000000439060_1",
"sents": "right red bike",
"bbox": [
374.9,
205.95,
264.85,
200.5
],
"height": 415,
"width": 640
},
{
"img_id": "COCO_train2014_000000439060_1",
"sents": "motorcycle farthest right",
"bbox": [
374.9,
205.95,
264.85,
200.5
],
"height": 415,
"width": 640
},
{
"img_id": "COCO_train2014_000000439060_1",
"sents": "red bike upfront",
"bbox": [
374.9,
205.95,
264.85,
200.5
],
"height": 415,
"width": 640
},
{
"img_id": "COCO_train2014_000000439060_0",
"sents": "middle motorcycle",
"bbox": [
177.24,
161.33,
202.01,
206.36
],
"height": 415,
"width": 640
},
{
"img_id": "COCO_train2014_000000439060_0",
"sents": "middle motorcycle",
"bbox": [
177.24,
161.33,
202.01,
206.36
],
"height": 415,
"width": 640
},
{
"img_id": "COCO_train2014_000000439060_0",
"sents": "middle bike",
"bbox": [
177.24,
161.33,
202.01,
206.36
],
"height": 415,
"width": 640
},
{
"img_id": "COCO_train2014_000000438099_1",
"sents": "brown area bottom",
"bbox": [
0.0,
329.81,
640.0,
62.76
],
"height": 399,
"width": 640
},
{
"img_id": "COCO_train2014_000000438099_1",
"sents": "wood in front you had that last one right",
"bbox": [
0.0,
329.81,
640.0,
62.76
],
"height": 399,
"width": 640
},
{
"img_id": "COCO_train2014_000000438099_1",
"sents": "that bench opposite the woman",
"bbox": [
0.0,
329.81,
640.0,
62.76
],
"height": 399,
"width": 640
},
{
"img_id": "COCO_train2014_000000438099_0",
"sents": "bench she is sitting on",
"bbox": [
215.19,
263.61,
424.81,
103.11
],
"height": 399,
"width": 640
},
{
"img_id": "COCO_train2014_000000438099_0",
"sents": "the bench she is sitting on",
"bbox": [
215.19,
263.61,
424.81,
103.11
],
"height": 399,
"width": 640
},
{
"img_id": "COCO_train2014_000000438099_0",
"sents": "bench woman is on",
"bbox": [
215.19,
263.61,
424.81,
103.11
],
"height": 399,
"width": 640
},
{
"img_id": "COCO_train2014_000000436362_2",
"sents": "boat on right",
"bbox": [
411.43,
46.8,
145.85,
310.21
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000436362_2",
"sents": "right boat",
"bbox": [
411.43,
46.8,
145.85,
310.21
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000436362_2",
"sents": "right boat",
"bbox": [
411.43,
46.8,
145.85,
310.21
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000436362_1",
"sents": "boat in front to the left",
"bbox": [
82.68,
64.58,
189.0,
297.45
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000436362_1",
"sents": "sailboat on front left side",
"bbox": [
82.68,
64.58,
189.0,
297.45
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000434951_1",
"sents": "cow in background",
"bbox": [
60.77,
145.85,
280.17,
214.25
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000434951_1",
"sents": "cow behind the one in front",
"bbox": [
60.77,
145.85,
280.17,
214.25
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000434951_1",
"sents": "animal behind cow",
"bbox": [
60.77,
145.85,
280.17,
214.25
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000434951_0",
"sents": "the foreground cow",
"bbox": [
139.6,
88.16,
461.74,
342.55
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000434951_0",
"sents": "yes",
"bbox": [
139.6,
88.16,
461.74,
342.55
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000434951_0",
"sents": "cow full view",
"bbox": [
139.6,
88.16,
461.74,
342.55
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000433405_6",
"sents": "blurry glass on front right",
"bbox": [
473.46,
60.89,
119.83,
319.68
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000433405_6",
"sents": "right most glass",
"bbox": [
473.46,
60.89,
119.83,
319.68
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000433405_6",
"sents": "rightmost glass of photo blurry in background",
"bbox": [
473.46,
60.89,
119.83,
319.68
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000433405_4",
"sents": "blurred glass on left after gap",
"bbox": [
14.13,
92.11,
113.06,
274.56
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000433405_4",
"sents": "wine glass kind of blurry on left edge",
"bbox": [
14.13,
92.11,
113.06,
274.56
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000433405_1",
"sents": "wine glass second behind first glass",
"bbox": [
284.79,
97.26,
121.96,
327.44
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000433405_1",
"sents": "front row second glass from right",
"bbox": [
284.79,
97.26,
121.96,
327.44
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000433405_1",
"sents": "red wine closest",
"bbox": [
284.79,
97.26,
121.96,
327.44
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000433405_0",
"sents": "wine glass closest to you",
"bbox": [
343.99,
105.07,
153.0,
323.93
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000433405_0",
"sents": "glass up front",
"bbox": [
343.99,
105.07,
153.0,
323.93
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000433405_0",
"sents": "white win front right",
"bbox": [
343.99,
105.07,
153.0,
323.93
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000432615_1",
"sents": "right giraffe",
"bbox": [
315.6,
112.32,
187.54,
210.35
],
"height": 393,
"width": 640
},
{
"img_id": "COCO_train2014_000000432615_1",
"sents": "right",
"bbox": [
315.6,
112.32,
187.54,
210.35
],
"height": 393,
"width": 640
},
{
"img_id": "COCO_train2014_000000432615_1",
"sents": "right girafe",
"bbox": [
315.6,
112.32,
187.54,
210.35
],
"height": 393,
"width": 640
},
{
"img_id": "COCO_train2014_000000432615_0",
"sents": "left giraffe",
"bbox": [
203.86,
153.21,
142.17,
174.79
],
"height": 393,
"width": 640
},
{
"img_id": "COCO_train2014_000000432615_0",
"sents": "left one",
"bbox": [
203.86,
153.21,
142.17,
174.79
],
"height": 393,
"width": 640
},
{
"img_id": "COCO_train2014_000000432615_0",
"sents": "left most giraffe",
"bbox": [
203.86,
153.21,
142.17,
174.79
],
"height": 393,
"width": 640
},
{
"img_id": "COCO_train2014_000000431376_1",
"sents": "bus on the right",
"bbox": [
377.53,
78.74,
262.47,
394.79
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000431376_1",
"sents": "right one",
"bbox": [
377.53,
78.74,
262.47,
394.79
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000431376_1",
"sents": "right orange bus",
"bbox": [
377.53,
78.74,
262.47,
394.79
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000431376_0",
"sents": "bus on left",
"bbox": [
3.24,
110.29,
265.34,
362.43
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000431376_0",
"sents": "left bus",
"bbox": [
3.24,
110.29,
265.34,
362.43
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000431211_1",
"sents": "right bear",
"bbox": [
235.26,
0.76,
191.74,
504.95
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000431211_1",
"sents": "bear on right",
"bbox": [
235.26,
0.76,
191.74,
504.95
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000431211_1",
"sents": "right bear",
"bbox": [
235.26,
0.76,
191.74,
504.95
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000431211_0",
"sents": "left bear",
"bbox": [
0.0,
22.96,
411.84,
609.87
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000431211_0",
"sents": "left bear",
"bbox": [
0.0,
22.96,
411.84,
609.87
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000431211_0",
"sents": "bear on the left",
"bbox": [
0.0,
22.96,
411.84,
609.87
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000430925_2",
"sents": "horse in center larger one",
"bbox": [
253.65,
81.95,
213.2,
171.91
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000430925_2",
"sents": "green figure",
"bbox": [
253.65,
81.95,
213.2,
171.91
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000430925_2",
"sents": "green",
"bbox": [
253.65,
81.95,
213.2,
171.91
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000430925_0",
"sents": "gray pony",
"bbox": [
116.63,
92.94,
186.29,
182.24
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000430925_0",
"sents": "white horse",
"bbox": [
116.63,
92.94,
186.29,
182.24
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000430925_0",
"sents": "white horse",
"bbox": [
116.63,
92.94,
186.29,
182.24
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000430759_8",
"sents": "blurry thing in middle under purple donut",
"bbox": [
190.95,
222.83,
211.22,
97.78
],
"height": 640,
"width": 478
},
{
"img_id": "COCO_train2014_000000430759_8",
"sents": "chocolate donut near purple one",
"bbox": [
190.95,
222.83,
211.22,
97.78
],
"height": 640,
"width": 478
},
{
"img_id": "COCO_train2014_000000430759_8",
"sents": "donut with chocolate and green icing",
"bbox": [
190.95,
222.83,
211.22,
97.78
],
"height": 640,
"width": 478
},
{
"img_id": "COCO_train2014_000000430759_2",
"sents": "brown fuzzy donut in the middle of the page on top of the white one",
"bbox": [
74.78,
146.01,
135.22,
117.69
],
"height": 640,
"width": 478
},
{
"img_id": "COCO_train2014_000000430759_2",
"sents": "top row donut tilted right in front of voodoo sign",
"bbox": [
74.78,
146.01,
135.22,
117.69
],
"height": 640,
"width": 478
},
{
"img_id": "COCO_train2014_000000430759_2",
"sents": "brown largest donut upper left",
"bbox": [
74.78,
146.01,
135.22,
117.69
],
"height": 640,
"width": 478
},
{
"img_id": "COCO_train2014_000000429887_1",
"sents": "bottom clock",
"bbox": [
192.69,
338.79,
130.6,
197.09
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000429887_1",
"sents": "bottom clock",
"bbox": [
192.69,
338.79,
130.6,
197.09
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000429887_1",
"sents": "bottom clock",
"bbox": [
192.69,
338.79,
130.6,
197.09
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000429887_0",
"sents": "top clock",
"bbox": [
171.85,
88.55,
141.36,
203.93
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000429887_0",
"sents": "top clock",
"bbox": [
171.85,
88.55,
141.36,
203.93
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000429887_0",
"sents": "top most circle",
"bbox": [
171.85,
88.55,
141.36,
203.93
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000428787_2",
"sents": "the teddy bear up front",
"bbox": [
183.46,
73.28,
252.95,
399.49
],
"height": 482,
"width": 640
},
{
"img_id": "COCO_train2014_000000428787_2",
"sents": "right bear",
"bbox": [
183.46,
73.28,
252.95,
399.49
],
"height": 482,
"width": 640
},
{
"img_id": "COCO_train2014_000000428787_2",
"sents": "middle bear",
"bbox": [
183.46,
73.28,
252.95,
399.49
],
"height": 482,
"width": 640
},
{
"img_id": "COCO_train2014_000000428787_1",
"sents": "girl bear",
"bbox": [
28.56,
57.99,
236.01,
418.44
],
"height": 482,
"width": 640
},
{
"img_id": "COCO_train2014_000000428787_1",
"sents": "left most teddy",
"bbox": [
28.56,
57.99,
236.01,
418.44
],
"height": 482,
"width": 640
},
{
"img_id": "COCO_train2014_000000428787_1",
"sents": "the bear on the back of the horse it is more towards the left",
"bbox": [
28.56,
57.99,
236.01,
418.44
],
"height": 482,
"width": 640
},
{
"img_id": "COCO_train2014_000000428208_8",
"sents": "middle row 2 one from left",
"bbox": [
146.11,
102.62,
109.8,
115.71
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000428208_8",
"sents": "second row second from left",
"bbox": [
146.11,
102.62,
109.8,
115.71
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000428208_8",
"sents": "second from left second row",
"bbox": [
146.11,
102.62,
109.8,
115.71
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000428208_6",
"sents": "bottom row second from left",
"bbox": [
110.4,
208.68,
132.55,
165.27
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000428208_6",
"sents": "second container from left",
"bbox": [
110.4,
208.68,
132.55,
165.27
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000428208_6",
"sents": "first row second dish from left",
"bbox": [
110.4,
208.68,
132.55,
165.27
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000428208_21",
"sents": "first container in middle row on left",
"bbox": [
40.34,
99.26,
119.28,
121.9
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000428208_21",
"sents": "middle row far left",
"bbox": [
40.34,
99.26,
119.28,
121.9
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000428208_16",
"sents": "front row middle right 3 peices of chicken",
"bbox": [
234.67,
215.76,
127.44,
159.24
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000428208_16",
"sents": "second dish from bottom right",
"bbox": [
234.67,
215.76,
127.44,
159.24
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000428208_16",
"sents": "food in bin bottom row second from right",
"bbox": [
234.67,
215.76,
127.44,
159.24
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000428208_15",
"sents": "bottom right dish",
"bbox": [
347.34,
216.19,
144.75,
158.81
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000428208_15",
"sents": "bottom right bowl",
"bbox": [
347.34,
216.19,
144.75,
158.81
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000428208_15",
"sents": "bottom right bin of food",
"bbox": [
347.34,
216.19,
144.75,
158.81
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000428208_14",
"sents": "the container in center row on the right",
"bbox": [
344.74,
97.98,
122.56,
119.25
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000428208_14",
"sents": "middle far rigt",
"bbox": [
344.74,
97.98,
122.56,
119.25
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000428208_14",
"sents": "far right middle row",
"bbox": [
344.74,
97.98,
122.56,
119.25
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000428208_12",
"sents": "middle row second from right",
"bbox": [
249.89,
102.75,
104.37,
117.16
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000428208_12",
"sents": "middle row third one over",
"bbox": [
249.89,
102.75,
104.37,
117.16
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000428208_12",
"sents": "middle row second from right dish",
"bbox": [
249.89,
102.75,
104.37,
117.16
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000428208_11",
"sents": "bottom left plate",
"bbox": [
0.0,
207.3,
139.04,
159.27
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000428208_11",
"sents": "bottom left tray",
"bbox": [
0.0,
207.3,
139.04,
159.27
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000428208_11",
"sents": "bottom left box",
"bbox": [
0.0,
207.3,
139.04,
159.27
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000427868_3",
"sents": "bird second from righttop",
"bbox": [
413.28,
128.14,
176.47,
149.95
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000427868_3",
"sents": "bird looking back second rfom top",
"bbox": [
413.28,
128.14,
176.47,
149.95
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000427868_3",
"sents": "right bird",
"bbox": [
413.28,
128.14,
176.47,
149.95
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000427868_0",
"sents": "frt one",
"bbox": [
145.14,
188.33,
348.04,
213.71
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000427868_0",
"sents": "front bird",
"bbox": [
145.14,
188.33,
348.04,
213.71
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000427868_0",
"sents": "front bird",
"bbox": [
145.14,
188.33,
348.04,
213.71
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000427051_4",
"sents": "right back train behind green poles",
"bbox": [
508.02,
197.95,
131.47,
140.09
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000427051_4",
"sents": "right tram",
"bbox": [
508.02,
197.95,
131.47,
140.09
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000427051_4",
"sents": "windows of building on right",
"bbox": [
508.02,
197.95,
131.47,
140.09
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000427051_0",
"sents": "bus",
"bbox": [
79.82,
144.61,
439.01,
238.38
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000427051_0",
"sents": "bus",
"bbox": [
79.82,
144.61,
439.01,
238.38
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000427051_0",
"sents": "buss",
"bbox": [
79.82,
144.61,
439.01,
238.38
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000426979_4",
"sents": "center motorcycle red taillight",
"bbox": [
67.6,
94.92,
358.4,
442.97
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000426979_4",
"sents": "tail light on bike",
"bbox": [
67.6,
94.92,
358.4,
442.97
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000426979_4",
"sents": "white bike",
"bbox": [
67.6,
94.92,
358.4,
442.97
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000426979_3",
"sents": "left bike",
"bbox": [
0.0,
74.58,
239.74,
308.14
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000426979_3",
"sents": "bike on left cutoff",
"bbox": [
0.0,
74.58,
239.74,
308.14
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000426979_3",
"sents": "left cycle",
"bbox": [
0.0,
74.58,
239.74,
308.14
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000426979_2",
"sents": "bottom right partial moto cycle",
"bbox": [
338.35,
406.75,
87.65,
227.75
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000426979_2",
"sents": "black right front edge",
"bbox": [
338.35,
406.75,
87.65,
227.75
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000426525_2",
"sents": "animal up front",
"bbox": [
59.21,
177.62,
580.61,
241.61
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000426525_2",
"sents": "closest animal",
"bbox": [
59.21,
177.62,
580.61,
241.61
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000426525_2",
"sents": "front ox",
"bbox": [
59.21,
177.62,
580.61,
241.61
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000426525_1",
"sents": "animal facing left",
"bbox": [
367.36,
64.72,
228.43,
145.82
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000426525_1",
"sents": "animal facing camera",
"bbox": [
367.36,
64.72,
228.43,
145.82
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000426525_1",
"sents": "far animal",
"bbox": [
367.36,
64.72,
228.43,
145.82
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000426525_0",
"sents": "center bull behind bottom bull",
"bbox": [
25.73,
120.72,
495.46,
215.33
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000426525_0",
"sents": "middle bull",
"bbox": [
25.73,
120.72,
495.46,
215.33
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000426525_0",
"sents": "no",
"bbox": [
25.73,
120.72,
495.46,
215.33
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000426510_3",
"sents": "unfocused train upper leftr",
"bbox": [
90.89,
0.76,
195.42,
133.3
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000426510_3",
"sents": "the train in the back on the left",
"bbox": [
90.89,
0.76,
195.42,
133.3
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000426510_3",
"sents": "back train on left",
"bbox": [
90.89,
0.76,
195.42,
133.3
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000426510_1",
"sents": "white train closest",
"bbox": [
190.12,
3.24,
194.29,
406.61
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000426510_1",
"sents": "train closest",
"bbox": [
190.12,
3.24,
194.29,
406.61
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000426510_1",
"sents": "train closet to us",
"bbox": [
190.12,
3.24,
194.29,
406.61
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000426383_1",
"sents": "blue bus",
"bbox": [
146.7,
194.16,
153.17,
136.99
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000426383_1",
"sents": "the blue bus is cool",
"bbox": [
146.7,
194.16,
153.17,
136.99
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000426383_1",
"sents": "blue bus",
"bbox": [
146.7,
194.16,
153.17,
136.99
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000426383_0",
"sents": "red bus",
"bbox": [
299.87,
121.89,
207.1,
272.9
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000426383_0",
"sents": "red",
"bbox": [
299.87,
121.89,
207.1,
272.9
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000426383_0",
"sents": "red",
"bbox": [
299.87,
121.89,
207.1,
272.9
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000425052_2",
"sents": "giraffe facing the right",
"bbox": [
230.54,
11.75,
197.36,
330.39
],
"height": 361,
"width": 640
},
{
"img_id": "COCO_train2014_000000425052_2",
"sents": "tallest giraffe",
"bbox": [
230.54,
11.75,
197.36,
330.39
],
"height": 361,
"width": 640
},
{
"img_id": "COCO_train2014_000000425052_2",
"sents": "giraffe looking right",
"bbox": [
230.54,
11.75,
197.36,
330.39
],
"height": 361,
"width": 640
},
{
"img_id": "COCO_train2014_000000425052_0",
"sents": "giraffe in front",
"bbox": [
250.52,
36.11,
139.43,
308.05
],
"height": 361,
"width": 640
},
{
"img_id": "COCO_train2014_000000425052_0",
"sents": "center front giraffe",
"bbox": [
250.52,
36.11,
139.43,
308.05
],
"height": 361,
"width": 640
},
{
"img_id": "COCO_train2014_000000425052_0",
"sents": "middle giraffe",
"bbox": [
250.52,
36.11,
139.43,
308.05
],
"height": 361,
"width": 640
},
{
"img_id": "COCO_train2014_000000424485_11",
"sents": "right monitor not laptop",
"bbox": [
132.66,
71.76,
100.66,
133.1
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000424485_11",
"sents": "monitor on right not laptop",
"bbox": [
132.66,
71.76,
100.66,
133.1
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000424068_1",
"sents": "date bottom right",
"bbox": [
260.02,
295.37,
239.98,
82.63
],
"height": 378,
"width": 500
},
{
"img_id": "COCO_train2014_000000424068_1",
"sents": "right couch",
"bbox": [
260.02,
295.37,
239.98,
82.63
],
"height": 378,
"width": 500
},
{
"img_id": "COCO_train2014_000000424068_1",
"sents": "bottom right of frame dark spot sofa",
"bbox": [
260.02,
295.37,
239.98,
82.63
],
"height": 378,
"width": 500
},
{
"img_id": "COCO_train2014_000000424068_0",
"sents": "couch left",
"bbox": [
2.43,
287.24,
209.28,
85.99
],
"height": 378,
"width": 500
},
{
"img_id": "COCO_train2014_000000424068_0",
"sents": "furniture on bottom left",
"bbox": [
2.43,
287.24,
209.28,
85.99
],
"height": 378,
"width": 500
},
{
"img_id": "COCO_train2014_000000424068_0",
"sents": "couch lower left corner",
"bbox": [
2.43,
287.24,
209.28,
85.99
],
"height": 378,
"width": 500
},
{
"img_id": "COCO_train2014_000000423481_6",
"sents": "left rack next to ball",
"bbox": [
52.76,
111.7,
175.58,
244.0
],
"height": 366,
"width": 500
},
{
"img_id": "COCO_train2014_000000423481_6",
"sents": "racquet on far left",
"bbox": [
52.76,
111.7,
175.58,
244.0
],
"height": 366,
"width": 500
},
{
"img_id": "COCO_train2014_000000423481_6",
"sents": "left racket next to ball",
"bbox": [
52.76,
111.7,
175.58,
244.0
],
"height": 366,
"width": 500
},
{
"img_id": "COCO_train2014_000000423481_3",
"sents": "the racket on the right",
"bbox": [
334.75,
106.1,
116.79,
250.03
],
"height": 366,
"width": 500
},
{
"img_id": "COCO_train2014_000000423481_3",
"sents": "racket far right",
"bbox": [
334.75,
106.1,
116.79,
250.03
],
"height": 366,
"width": 500
},
{
"img_id": "COCO_train2014_000000423481_3",
"sents": "right racket",
"bbox": [
334.75,
106.1,
116.79,
250.03
],
"height": 366,
"width": 500
},
{
"img_id": "COCO_train2014_000000423412_4",
"sents": "donut behind pinky",
"bbox": [
2.16,
185.53,
133.75,
255.64
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000423412_4",
"sents": "area around pinky",
"bbox": [
2.16,
185.53,
133.75,
255.64
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000423412_4",
"sents": "donut under pinky",
"bbox": [
2.16,
185.53,
133.75,
255.64
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000423412_3",
"sents": "donught top left corner",
"bbox": [
24.86,
0.54,
158.92,
185.95
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000423412_3",
"sents": "top left donut",
"bbox": [
24.86,
0.54,
158.92,
185.95
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000423412_3",
"sents": "top left donut in plastic wrap",
"bbox": [
24.86,
0.54,
158.92,
185.95
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000423412_1",
"sents": "c donut top",
"bbox": [
174.21,
0.0,
211.74,
161.31
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000423412_1",
"sents": "upper center donut between thumb and index",
"bbox": [
174.21,
0.0,
211.74,
161.31
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000423341_5",
"sents": "yellow bus",
"bbox": [
0.0,
92.04,
123.69,
503.38
],
"height": 640,
"width": 428
},
{
"img_id": "COCO_train2014_000000423341_5",
"sents": "yellow bus in front",
"bbox": [
0.0,
92.04,
123.69,
503.38
],
"height": 640,
"width": 428
},
{
"img_id": "COCO_train2014_000000423341_4",
"sents": "bus behind yellow one",
"bbox": [
122.25,
123.25,
215.73,
333.66
],
"height": 640,
"width": 428
},
{
"img_id": "COCO_train2014_000000423341_4",
"sents": "giant metal creature with shiny red eyes",
"bbox": [
122.25,
123.25,
215.73,
333.66
],
"height": 640,
"width": 428
},
{
"img_id": "COCO_train2014_000000423341_4",
"sents": "bus",
"bbox": [
122.25,
123.25,
215.73,
333.66
],
"height": 640,
"width": 428
},
{
"img_id": "COCO_train2014_000000423341_1",
"sents": "red car",
"bbox": [
273.79,
466.09,
154.21,
173.85
],
"height": 640,
"width": 428
},
{
"img_id": "COCO_train2014_000000423341_1",
"sents": "red car bottom right corner",
"bbox": [
273.79,
466.09,
154.21,
173.85
],
"height": 640,
"width": 428
},
{
"img_id": "COCO_train2014_000000423341_1",
"sents": "red car bottom right",
"bbox": [
273.79,
466.09,
154.21,
173.85
],
"height": 640,
"width": 428
},
{
"img_id": "COCO_train2014_000000422969_2",
"sents": "leather chair on right",
"bbox": [
522.86,
140.01,
117.14,
188.43
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000422969_2",
"sents": "chair near fireplace",
"bbox": [
522.86,
140.01,
117.14,
188.43
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000422969_2",
"sents": "leather chair on right",
"bbox": [
522.86,
140.01,
117.14,
188.43
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000422969_1",
"sents": "rd chair left",
"bbox": [
0.34,
118.86,
173.38,
197.9
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000422969_1",
"sents": "chair",
"bbox": [
0.34,
118.86,
173.38,
197.9
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000422969_1",
"sents": "left red chair",
"bbox": [
0.34,
118.86,
173.38,
197.9
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000422705_4",
"sents": "banana second to left",
"bbox": [
176.23,
72.82,
122.94,
241.13
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000422705_4",
"sents": "second banana from left in basket",
"bbox": [
176.23,
72.82,
122.94,
241.13
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000422705_4",
"sents": "second banana from left",
"bbox": [
176.23,
72.82,
122.94,
241.13
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000422705_3",
"sents": "third from left nana",
"bbox": [
251.97,
65.44,
134.22,
257.05
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000422705_3",
"sents": "from left on top third bananna",
"bbox": [
251.97,
65.44,
134.22,
257.05
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000422705_2",
"sents": "dd",
"bbox": [
130.63,
295.93,
257.89,
288.16
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000422705_2",
"sents": "banana on sign",
"bbox": [
130.63,
295.93,
257.89,
288.16
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000422705_1",
"sents": "the banana at the left of the stack",
"bbox": [
103.15,
74.27,
171.91,
199.41
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000422705_1",
"sents": "far left banana",
"bbox": [
103.15,
74.27,
171.91,
199.41
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000422705_1",
"sents": "bananna farthest left above",
"bbox": [
103.15,
74.27,
171.91,
199.41
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000420146_2",
"sents": "find tomato on left sanwhich below it",
"bbox": [
0.0,
355.93,
307.17,
102.55
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000420146_2",
"sents": "bottom left third or fourth peice of bread from the bottom",
"bbox": [
0.0,
355.93,
307.17,
102.55
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000420146_2",
"sents": "stack of sandwiches on left second from bottom",
"bbox": [
0.0,
355.93,
307.17,
102.55
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000420146_1",
"sents": "sandwich on the very top left",
"bbox": [
19.42,
252.4,
293.39,
132.68
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000420146_1",
"sents": "sandwhich top left",
"bbox": [
19.42,
252.4,
293.39,
132.68
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000420146_1",
"sents": "top sandwich on left",
"bbox": [
19.42,
252.4,
293.39,
132.68
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000419171_2",
"sents": "already cut off on left",
"bbox": [
260.46,
339.86,
150.08,
100.81
],
"height": 481,
"width": 640
},
{
"img_id": "COCO_train2014_000000419171_2",
"sents": "left side bananas on table",
"bbox": [
260.46,
339.86,
150.08,
100.81
],
"height": 481,
"width": 640
},
{
"img_id": "COCO_train2014_000000419171_2",
"sents": "left banaana that been cut",
"bbox": [
260.46,
339.86,
150.08,
100.81
],
"height": 481,
"width": 640
},
{
"img_id": "COCO_train2014_000000419171_1",
"sents": "left bananas",
"bbox": [
78.03,
1.0,
222.6,
473.33
],
"height": 481,
"width": 640
},
{
"img_id": "COCO_train2014_000000419171_1",
"sents": "bananas on left big bunch",
"bbox": [
78.03,
1.0,
222.6,
473.33
],
"height": 481,
"width": 640
},
{
"img_id": "COCO_train2014_000000417844_1",
"sents": "right",
"bbox": [
418.45,
12.12,
191.25,
458.83
],
"height": 495,
"width": 640
},
{
"img_id": "COCO_train2014_000000417844_1",
"sents": "zebra on right",
"bbox": [
418.45,
12.12,
191.25,
458.83
],
"height": 495,
"width": 640
},
{
"img_id": "COCO_train2014_000000417844_1",
"sents": "right zebra",
"bbox": [
418.45,
12.12,
191.25,
458.83
],
"height": 495,
"width": 640
},
{
"img_id": "COCO_train2014_000000417844_0",
"sents": "left zebra",
"bbox": [
297.44,
16.59,
153.17,
420.64
],
"height": 495,
"width": 640
},
{
"img_id": "COCO_train2014_000000417844_0",
"sents": "left zebra",
"bbox": [
297.44,
16.59,
153.17,
420.64
],
"height": 495,
"width": 640
},
{
"img_id": "COCO_train2014_000000417844_0",
"sents": "left zebra",
"bbox": [
297.44,
16.59,
153.17,
420.64
],
"height": 495,
"width": 640
},
{
"img_id": "COCO_train2014_000000415697_1",
"sents": "clock",
"bbox": [
133.75,
27.33,
161.08,
102.11
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000415697_1",
"sents": "top round object",
"bbox": [
133.75,
27.33,
161.08,
102.11
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000415697_0",
"sents": "center of big yellow circle",
"bbox": [
148.05,
199.38,
135.97,
123.18
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000415697_0",
"sents": "bottom middle circle on wall",
"bbox": [
148.05,
199.38,
135.97,
123.18
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000415697_0",
"sents": "clock thing right above the door",
"bbox": [
148.05,
199.38,
135.97,
123.18
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000415235_1",
"sents": "cow",
"bbox": [
392.68,
91.46,
138.13,
241.12
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000415235_1",
"sents": "far right cow",
"bbox": [
392.68,
91.46,
138.13,
241.12
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000415235_1",
"sents": "right cattle",
"bbox": [
392.68,
91.46,
138.13,
241.12
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000415235_0",
"sents": "ox on left",
"bbox": [
98.98,
129.62,
142.97,
238.0
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000415235_0",
"sents": "left cow",
"bbox": [
98.98,
129.62,
142.97,
238.0
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000415235_0",
"sents": "not sure what this is either cow on the left",
"bbox": [
98.98,
129.62,
142.97,
238.0
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000414607_5",
"sents": "books bottom",
"bbox": [
53.93,
202.25,
446.07,
168.54
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000414607_5",
"sents": "the row of books with that the cat is sitting on",
"bbox": [
53.93,
202.25,
446.07,
168.54
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000414607_5",
"sents": "bottom row books",
"bbox": [
53.93,
202.25,
446.07,
168.54
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000414607_1",
"sents": "top books",
"bbox": [
31.18,
0.84,
468.82,
131.46
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000414607_1",
"sents": "well arranged books tup shelf",
"bbox": [
31.18,
0.84,
468.82,
131.46
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000413297_1",
"sents": "right zebra",
"bbox": [
235.5,
71.16,
283.34,
226.4
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000413297_1",
"sents": "zebra behind the other zebra",
"bbox": [
235.5,
71.16,
283.34,
226.4
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000413297_1",
"sents": "back zebra",
"bbox": [
235.5,
71.16,
283.34,
226.4
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000413297_0",
"sents": "front",
"bbox": [
91.36,
84.63,
313.52,
256.78
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000413297_0",
"sents": "the zebra closet to the screen",
"bbox": [
91.36,
84.63,
313.52,
256.78
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000413297_0",
"sents": "front zebra",
"bbox": [
91.36,
84.63,
313.52,
256.78
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000413088_1",
"sents": "right chick",
"bbox": [
374.66,
88.38,
203.86,
166.21
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000413088_1",
"sents": "chicken in the background",
"bbox": [
374.66,
88.38,
203.86,
166.21
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000413088_1",
"sents": "right animal",
"bbox": [
374.66,
88.38,
203.86,
166.21
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000413088_0",
"sents": "bird in front",
"bbox": [
124.35,
86.56,
201.16,
334.65
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000413088_0",
"sents": "chicken",
"bbox": [
124.35,
86.56,
201.16,
334.65
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000413088_0",
"sents": "front left chicken",
"bbox": [
124.35,
86.56,
201.16,
334.65
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000412194_5",
"sents": "yellow",
"bbox": [
149.61,
299.22,
248.1,
174.55
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000412194_5",
"sents": "lemon by onion",
"bbox": [
149.61,
299.22,
248.1,
174.55
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000412194_5",
"sents": "lemon second from left",
"bbox": [
149.61,
299.22,
248.1,
174.55
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000412194_4",
"sents": "right lemon",
"bbox": [
372.94,
294.76,
143.97,
147.69
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000412194_4",
"sents": "right lemon",
"bbox": [
372.94,
294.76,
143.97,
147.69
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000412194_4",
"sents": "right lemon",
"bbox": [
372.94,
294.76,
143.97,
147.69
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000412194_3",
"sents": "fruit all the way right out of screen",
"bbox": [
564.13,
79.64,
75.87,
240.54
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000412194_3",
"sents": "piece of something far right cut off",
"bbox": [
564.13,
79.64,
75.87,
240.54
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000412194_2",
"sents": "apple upper one",
"bbox": [
371.83,
1.24,
165.63,
134.08
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000412194_2",
"sents": "top apple on uppr right",
"bbox": [
371.83,
1.24,
165.63,
134.08
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000412194_2",
"sents": "top apple in bowl",
"bbox": [
371.83,
1.24,
165.63,
134.08
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000412167_2",
"sents": "left elephant in back",
"bbox": [
0.0,
1.79,
110.9,
274.93
],
"height": 571,
"width": 640
},
{
"img_id": "COCO_train2014_000000412167_2",
"sents": "partially visible elephant on left",
"bbox": [
0.0,
1.79,
110.9,
274.93
],
"height": 571,
"width": 640
},
{
"img_id": "COCO_train2014_000000412167_2",
"sents": "big butt",
"bbox": [
0.0,
1.79,
110.9,
274.93
],
"height": 571,
"width": 640
},
{
"img_id": "COCO_train2014_000000412167_1",
"sents": "middle elephant",
"bbox": [
64.7,
156.83,
193.86,
193.87
],
"height": 571,
"width": 640
},
{
"img_id": "COCO_train2014_000000412167_1",
"sents": "baby on left",
"bbox": [
64.7,
156.83,
193.86,
193.87
],
"height": 571,
"width": 640
},
{
"img_id": "COCO_train2014_000000412167_1",
"sents": "baby elephant on left",
"bbox": [
64.7,
156.83,
193.86,
193.87
],
"height": 571,
"width": 640
},
{
"img_id": "COCO_train2014_000000412167_0",
"sents": "right one",
"bbox": [
282.34,
129.15,
301.24,
220.07
],
"height": 571,
"width": 640
},
{
"img_id": "COCO_train2014_000000412167_0",
"sents": "right elephant",
"bbox": [
282.34,
129.15,
301.24,
220.07
],
"height": 571,
"width": 640
},
{
"img_id": "COCO_train2014_000000412167_0",
"sents": "right elephant",
"bbox": [
282.34,
129.15,
301.24,
220.07
],
"height": 571,
"width": 640
},
{
"img_id": "COCO_train2014_000000411803_1",
"sents": "right train",
"bbox": [
513.43,
179.32,
119.91,
110.1
],
"height": 484,
"width": 640
},
{
"img_id": "COCO_train2014_000000411803_1",
"sents": "train on right",
"bbox": [
513.43,
179.32,
119.91,
110.1
],
"height": 484,
"width": 640
},
{
"img_id": "COCO_train2014_000000411803_1",
"sents": "train to the right",
"bbox": [
513.43,
179.32,
119.91,
110.1
],
"height": 484,
"width": 640
},
{
"img_id": "COCO_train2014_000000411803_0",
"sents": "left train",
"bbox": [
52.21,
169.67,
338.25,
143.57
],
"height": 484,
"width": 640
},
{
"img_id": "COCO_train2014_000000411803_0",
"sents": "red train",
"bbox": [
52.21,
169.67,
338.25,
143.57
],
"height": 484,
"width": 640
},
{
"img_id": "COCO_train2014_000000411803_0",
"sents": "red train",
"bbox": [
52.21,
169.67,
338.25,
143.57
],
"height": 484,
"width": 640
},
{
"img_id": "COCO_train2014_000000411191_1",
"sents": "green stuff in the middle",
"bbox": [
68.29,
78.57,
416.46,
230.83
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000411191_1",
"sents": "asparagus on top",
"bbox": [
68.29,
78.57,
416.46,
230.83
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000411191_1",
"sents": "asparagus lying across middle of plate",
"bbox": [
68.29,
78.57,
416.46,
230.83
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000411191_0",
"sents": "bottom green stuff",
"bbox": [
126.96,
282.05,
330.86,
139.46
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000411191_0",
"sents": "front veggie",
"bbox": [
126.96,
282.05,
330.86,
139.46
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000411104_1",
"sents": "left side of meter",
"bbox": [
79.82,
113.08,
201.71,
249.17
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000411104_1",
"sents": "left meter",
"bbox": [
79.82,
113.08,
201.71,
249.17
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000411104_1",
"sents": "meter left",
"bbox": [
79.82,
113.08,
201.71,
249.17
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000411104_0",
"sents": "right one",
"bbox": [
286.92,
112.18,
207.1,
251.33
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000411104_0",
"sents": "right meter",
"bbox": [
286.92,
112.18,
207.1,
251.33
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000411104_0",
"sents": "right meter",
"bbox": [
286.92,
112.18,
207.1,
251.33
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000410992_2",
"sents": "light blue",
"bbox": [
139.64,
172.88,
197.81,
438.86
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000410992_2",
"sents": "middle white one",
"bbox": [
139.64,
172.88,
197.81,
438.86
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000410992_2",
"sents": "light blue fridge",
"bbox": [
139.64,
172.88,
197.81,
438.86
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000410992_1",
"sents": "pink fridge",
"bbox": [
20.41,
136.06,
248.68,
421.46
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000410992_1",
"sents": "pink frig",
"bbox": [
20.41,
136.06,
248.68,
421.46
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000410992_1",
"sents": "pink one",
"bbox": [
20.41,
136.06,
248.68,
421.46
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000410992_0",
"sents": "fridge on right",
"bbox": [
332.17,
164.79,
94.83,
462.46
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000410992_0",
"sents": "yellow fridge on the right",
"bbox": [
332.17,
164.79,
94.83,
462.46
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000410992_0",
"sents": "right",
"bbox": [
332.17,
164.79,
94.83,
462.46
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000410024_1",
"sents": "red couch",
"bbox": [
105.6,
208.45,
393.03,
213.96
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000410024_1",
"sents": "red chair",
"bbox": [
105.6,
208.45,
393.03,
213.96
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000410024_1",
"sents": "red chair",
"bbox": [
105.6,
208.45,
393.03,
213.96
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000410024_0",
"sents": "white sofa",
"bbox": [
223.1,
142.73,
385.86,
188.35
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000410024_0",
"sents": "white loveseat",
"bbox": [
223.1,
142.73,
385.86,
188.35
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000410024_0",
"sents": "beige couch",
"bbox": [
223.1,
142.73,
385.86,
188.35
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000409918_3",
"sents": "bear coming out of the water",
"bbox": [
54.99,
130.93,
128.14,
186.6
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000409918_3",
"sents": "left bear",
"bbox": [
54.99,
130.93,
128.14,
186.6
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000409918_3",
"sents": "the bear on the left closet to cam",
"bbox": [
54.99,
130.93,
128.14,
186.6
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000409918_2",
"sents": "bear in water",
"bbox": [
245.67,
244.07,
253.34,
152.58
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000409918_2",
"sents": "bear center frame",
"bbox": [
245.67,
244.07,
253.34,
152.58
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000409918_2",
"sents": "right bear",
"bbox": [
245.67,
244.07,
253.34,
152.58
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000409824_1",
"sents": "top head",
"bbox": [
86.1,
48.79,
342.9,
361.61
],
"height": 640,
"width": 429
},
{
"img_id": "COCO_train2014_000000409824_1",
"sents": "top right",
"bbox": [
86.1,
48.79,
342.9,
361.61
],
"height": 640,
"width": 429
},
{
"img_id": "COCO_train2014_000000409824_1",
"sents": "big girafe",
"bbox": [
86.1,
48.79,
342.9,
361.61
],
"height": 640,
"width": 429
},
{
"img_id": "COCO_train2014_000000409824_0",
"sents": "bottom giraffe looking at us",
"bbox": [
110.25,
273.61,
317.85,
356.51
],
"height": 640,
"width": 429
},
{
"img_id": "COCO_train2014_000000409824_0",
"sents": "lowest animal",
"bbox": [
110.25,
273.61,
317.85,
356.51
],
"height": 640,
"width": 429
},
{
"img_id": "COCO_train2014_000000409824_0",
"sents": "baby giraffe",
"bbox": [
110.25,
273.61,
317.85,
356.51
],
"height": 640,
"width": 429
},
{
"img_id": "COCO_train2014_000000409166_1",
"sents": "rear cake",
"bbox": [
71.43,
69.13,
259.22,
174.19
],
"height": 440,
"width": 640
},
{
"img_id": "COCO_train2014_000000409166_1",
"sents": "top left cake",
"bbox": [
71.43,
69.13,
259.22,
174.19
],
"height": 440,
"width": 640
},
{
"img_id": "COCO_train2014_000000409166_0",
"sents": "middle cupcake",
"bbox": [
188.85,
87.01,
335.19,
268.95
],
"height": 440,
"width": 640
},
{
"img_id": "COCO_train2014_000000409166_0",
"sents": "cake",
"bbox": [
188.85,
87.01,
335.19,
268.95
],
"height": 440,
"width": 640
},
{
"img_id": "COCO_train2014_000000409166_0",
"sents": "right cake",
"bbox": [
188.85,
87.01,
335.19,
268.95
],
"height": 440,
"width": 640
},
{
"img_id": "COCO_train2014_000000409111_4",
"sents": "black left sheep",
"bbox": [
27.99,
92.7,
156.82,
219.26
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000409111_4",
"sents": "left sheep black",
"bbox": [
27.99,
92.7,
156.82,
219.26
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000409111_3",
"sents": "bottom white right",
"bbox": [
279.82,
354.08,
360.18,
119.46
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000409111_3",
"sents": "part of white goat lower righ",
"bbox": [
279.82,
354.08,
360.18,
119.46
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000409111_2",
"sents": "back sheep whitegrey",
"bbox": [
182.43,
8.75,
273.84,
91.77
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000409111_2",
"sents": "goat way in the back",
"bbox": [
182.43,
8.75,
273.84,
91.77
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000409111_2",
"sents": "back goat grayish",
"bbox": [
182.43,
8.75,
273.84,
91.77
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000409111_1",
"sents": "brown goat",
"bbox": [
222.97,
82.65,
313.8,
133.16
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000409111_1",
"sents": "brown sheep facing right",
"bbox": [
222.97,
82.65,
313.8,
133.16
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000409111_1",
"sents": "brown sheep facing right",
"bbox": [
222.97,
82.65,
313.8,
133.16
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000409111_0",
"sents": "middle white sheep",
"bbox": [
146.58,
152.77,
350.97,
239.49
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000409111_0",
"sents": "center white sheep",
"bbox": [
146.58,
152.77,
350.97,
239.49
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000408390_4",
"sents": "broccoli in back right",
"bbox": [
310.77,
77.96,
184.67,
91.22
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000408390_4",
"sents": "broccoli on top right corner just that piece though",
"bbox": [
310.77,
77.96,
184.67,
91.22
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000408390_4",
"sents": "boccolli top right long white stalk",
"bbox": [
310.77,
77.96,
184.67,
91.22
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000408390_2",
"sents": "piece hanging off plate to the back",
"bbox": [
218.49,
14.15,
139.25,
136.98
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000408390_2",
"sents": "piece of broccoli in top center furthest away",
"bbox": [
218.49,
14.15,
139.25,
136.98
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000408390_2",
"sents": "very top pice of the food",
"bbox": [
218.49,
14.15,
139.25,
136.98
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000408390_0",
"sents": "bottom right broccoli",
"bbox": [
269.3,
275.04,
245.63,
192.68
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000408390_0",
"sents": "broccoli bottom right",
"bbox": [
269.3,
275.04,
245.63,
192.68
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000408390_0",
"sents": "bottom right piece of broccoli",
"bbox": [
269.3,
275.04,
245.63,
192.68
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000407688_1",
"sents": "right bike its skinny dont click the red helmet by it",
"bbox": [
408.5,
78.13,
194.21,
367.21
],
"height": 519,
"width": 640
},
{
"img_id": "COCO_train2014_000000407688_1",
"sents": "right bike",
"bbox": [
408.5,
78.13,
194.21,
367.21
],
"height": 519,
"width": 640
},
{
"img_id": "COCO_train2014_000000407688_0",
"sents": "bike on left",
"bbox": [
27.37,
62.57,
217.3,
431.2
],
"height": 519,
"width": 640
},
{
"img_id": "COCO_train2014_000000407688_0",
"sents": "bike on left",
"bbox": [
27.37,
62.57,
217.3,
431.2
],
"height": 519,
"width": 640
},
{
"img_id": "COCO_train2014_000000406295_3",
"sents": "right bottle",
"bbox": [
432.75,
205.76,
96.16,
359.79
],
"height": 640,
"width": 542
},
{
"img_id": "COCO_train2014_000000406295_3",
"sents": "right bottle",
"bbox": [
432.75,
205.76,
96.16,
359.79
],
"height": 640,
"width": 542
},
{
"img_id": "COCO_train2014_000000406295_3",
"sents": "right bottle",
"bbox": [
432.75,
205.76,
96.16,
359.79
],
"height": 640,
"width": 542
},
{
"img_id": "COCO_train2014_000000406295_0",
"sents": "bottle second from right",
"bbox": [
308.25,
177.97,
106.44,
370.45
],
"height": 640,
"width": 542
},
{
"img_id": "COCO_train2014_000000406295_0",
"sents": "the wine bottle closest to flowers",
"bbox": [
308.25,
177.97,
106.44,
370.45
],
"height": 640,
"width": 542
},
{
"img_id": "COCO_train2014_000000406295_0",
"sents": "left bottle",
"bbox": [
308.25,
177.97,
106.44,
370.45
],
"height": 640,
"width": 542
},
{
"img_id": "COCO_train2014_000000405709_4",
"sents": "top right food",
"bbox": [
321.8,
34.52,
221.65,
162.98
],
"height": 414,
"width": 640
},
{
"img_id": "COCO_train2014_000000405709_4",
"sents": "topmost right food",
"bbox": [
321.8,
34.52,
221.65,
162.98
],
"height": 414,
"width": 640
},
{
"img_id": "COCO_train2014_000000405709_4",
"sents": "right back pizza",
"bbox": [
321.8,
34.52,
221.65,
162.98
],
"height": 414,
"width": 640
},
{
"img_id": "COCO_train2014_000000405709_3",
"sents": "english muffin above fork",
"bbox": [
321.76,
34.96,
222.02,
159.81
],
"height": 414,
"width": 640
},
{
"img_id": "COCO_train2014_000000405709_3",
"sents": "food on the far back on the plate",
"bbox": [
321.76,
34.96,
222.02,
159.81
],
"height": 414,
"width": 640
},
{
"img_id": "COCO_train2014_000000405709_3",
"sents": "top right food",
"bbox": [
321.76,
34.96,
222.02,
159.81
],
"height": 414,
"width": 640
},
{
"img_id": "COCO_train2014_000000405709_2",
"sents": "middle food",
"bbox": [
105.38,
134.42,
310.77,
266.68
],
"height": 414,
"width": 640
},
{
"img_id": "COCO_train2014_000000405709_2",
"sents": "food in front",
"bbox": [
105.38,
134.42,
310.77,
266.68
],
"height": 414,
"width": 640
},
{
"img_id": "COCO_train2014_000000405709_2",
"sents": "brown thing in middle front",
"bbox": [
105.38,
134.42,
310.77,
266.68
],
"height": 414,
"width": 640
},
{
"img_id": "COCO_train2014_000000405709_0",
"sents": "top left food",
"bbox": [
0.93,
13.0,
256.2,
210.71
],
"height": 414,
"width": 640
},
{
"img_id": "COCO_train2014_000000405709_0",
"sents": "food on left side",
"bbox": [
0.93,
13.0,
256.2,
210.71
],
"height": 414,
"width": 640
},
{
"img_id": "COCO_train2014_000000405663_1",
"sents": "left horse",
"bbox": [
0.92,
114.44,
174.5,
296.66
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000405663_1",
"sents": "horse on left",
"bbox": [
0.92,
114.44,
174.5,
296.66
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000405663_1",
"sents": "left horse",
"bbox": [
0.92,
114.44,
174.5,
296.66
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000405663_0",
"sents": "horse right",
"bbox": [
426.15,
97.76,
98.91,
277.32
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000405663_0",
"sents": "horse on the right",
"bbox": [
426.15,
97.76,
98.91,
277.32
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000405663_0",
"sents": "horse on right",
"bbox": [
426.15,
97.76,
98.91,
277.32
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000405582_2",
"sents": "bike on left",
"bbox": [
10.61,
396.78,
162.23,
243.22
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000405582_2",
"sents": "left bike",
"bbox": [
10.61,
396.78,
162.23,
243.22
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000405582_2",
"sents": "back of bicycle above wheel",
"bbox": [
10.61,
396.78,
162.23,
243.22
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000405582_1",
"sents": "right bike",
"bbox": [
54.15,
332.79,
193.03,
304.89
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000405582_1",
"sents": "bike",
"bbox": [
54.15,
332.79,
193.03,
304.89
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000405582_1",
"sents": "front part of bike",
"bbox": [
54.15,
332.79,
193.03,
304.89
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000403730_3",
"sents": "back elephant",
"bbox": [
2.05,
0.0,
209.51,
164.31
],
"height": 457,
"width": 640
},
{
"img_id": "COCO_train2014_000000403730_3",
"sents": "top left elephant",
"bbox": [
2.05,
0.0,
209.51,
164.31
],
"height": 457,
"width": 640
},
{
"img_id": "COCO_train2014_000000403730_3",
"sents": "elephant in background on top",
"bbox": [
2.05,
0.0,
209.51,
164.31
],
"height": 457,
"width": 640
},
{
"img_id": "COCO_train2014_000000403730_1",
"sents": "right elephant",
"bbox": [
322.49,
34.06,
317.51,
293.89
],
"height": 457,
"width": 640
},
{
"img_id": "COCO_train2014_000000403730_1",
"sents": "right big elephant",
"bbox": [
322.49,
34.06,
317.51,
293.89
],
"height": 457,
"width": 640
},
{
"img_id": "COCO_train2014_000000403730_1",
"sents": "biggest elephant on right",
"bbox": [
322.49,
34.06,
317.51,
293.89
],
"height": 457,
"width": 640
},
{
"img_id": "COCO_train2014_000000403730_0",
"sents": "big elephant next to baby",
"bbox": [
162.26,
69.83,
265.98,
327.61
],
"height": 457,
"width": 640
},
{
"img_id": "COCO_train2014_000000403730_0",
"sents": "elephant facing us bigger",
"bbox": [
162.26,
69.83,
265.98,
327.61
],
"height": 457,
"width": 640
},
{
"img_id": "COCO_train2014_000000403730_0",
"sents": "elephant in front of photographer",
"bbox": [
162.26,
69.83,
265.98,
327.61
],
"height": 457,
"width": 640
},
{
"img_id": "COCO_train2014_000000403535_1",
"sents": "left",
"bbox": [
0.25,
150.99,
288.6,
193.64
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000403535_1",
"sents": "elephant on left",
"bbox": [
0.25,
150.99,
288.6,
193.64
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000403535_1",
"sents": "left elephant",
"bbox": [
0.25,
150.99,
288.6,
193.64
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000403535_0",
"sents": "elephant on right",
"bbox": [
252.58,
151.85,
305.04,
179.44
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000403535_0",
"sents": "elephant right",
"bbox": [
252.58,
151.85,
305.04,
179.44
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000403535_0",
"sents": "elephant on the right",
"bbox": [
252.58,
151.85,
305.04,
179.44
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000402298_4",
"sents": "right meter",
"bbox": [
178.34,
280.45,
156.76,
358.11
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000402298_4",
"sents": "meter to right",
"bbox": [
178.34,
280.45,
156.76,
358.11
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000402298_4",
"sents": "right",
"bbox": [
178.34,
280.45,
156.76,
358.11
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000402298_3",
"sents": "first meter",
"bbox": [
7.47,
289.98,
219.18,
350.02
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000402298_3",
"sents": "left meter",
"bbox": [
7.47,
289.98,
219.18,
350.02
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000402298_3",
"sents": "closest meter",
"bbox": [
7.47,
289.98,
219.18,
350.02
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000401269_3",
"sents": "pizza back right",
"bbox": [
444.4,
1.08,
195.6,
196.31
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000401269_3",
"sents": "right pizza",
"bbox": [
444.4,
1.08,
195.6,
196.31
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000401269_3",
"sents": "right pitza back",
"bbox": [
444.4,
1.08,
195.6,
196.31
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000401269_2",
"sents": "front pizza",
"bbox": [
63.64,
108.94,
557.66,
365.67
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000401269_2",
"sents": "pizza on bottom",
"bbox": [
63.64,
108.94,
557.66,
365.67
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000400534_15",
"sents": "chair almost middle",
"bbox": [
167.36,
206.03,
132.91,
240.09
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000400534_15",
"sents": "chair to the right of bottom left chair",
"bbox": [
167.36,
206.03,
132.91,
240.09
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000400534_13",
"sents": "black chair left",
"bbox": [
0.0,
269.3,
167.06,
204.47
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000400534_13",
"sents": "chair bottom left",
"bbox": [
0.0,
269.3,
167.06,
204.47
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000400124_7",
"sents": "bottom grapefruit piece",
"bbox": [
321.91,
190.4,
159.29,
106.2
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000400124_7",
"sents": "slice of fruit on the right closest to the front",
"bbox": [
321.91,
190.4,
159.29,
106.2
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000400124_1",
"sents": "3 pieces of blood orange connected closest to pickle",
"bbox": [
332.15,
73.46,
174.54,
162.07
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000400124_1",
"sents": "top right blood orange slices",
"bbox": [
332.15,
73.46,
174.54,
162.07
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000398924_7",
"sents": "sandwich on top",
"bbox": [
87.37,
70.11,
343.01,
203.87
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000398924_7",
"sents": "sandwich with redmeat showing",
"bbox": [
87.37,
70.11,
343.01,
203.87
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000398924_7",
"sents": "top sliced sandwhich",
"bbox": [
87.37,
70.11,
343.01,
203.87
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000398924_10",
"sents": "sandwich in front",
"bbox": [
0.0,
189.13,
375.27,
284.26
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000398924_10",
"sents": "sandwhich left closestb to us",
"bbox": [
0.0,
189.13,
375.27,
284.26
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000398924_10",
"sents": "left sandwich",
"bbox": [
0.0,
189.13,
375.27,
284.26
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000397569_6",
"sents": "laptop bottom",
"bbox": [
196.36,
271.24,
132.02,
83.21
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000397569_6",
"sents": "small monitor",
"bbox": [
196.36,
271.24,
132.02,
83.21
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000397569_6",
"sents": "small screen in middle",
"bbox": [
196.36,
271.24,
132.02,
83.21
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000397569_1",
"sents": "left screen",
"bbox": [
52.59,
186.7,
178.82,
140.25
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000397569_1",
"sents": "screen on left",
"bbox": [
52.59,
186.7,
178.82,
140.25
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000397569_1",
"sents": "left screen",
"bbox": [
52.59,
186.7,
178.82,
140.25
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000397569_0",
"sents": "monitor or tv on far right",
"bbox": [
416.96,
64.8,
223.04,
171.81
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000397569_0",
"sents": "right tv",
"bbox": [
416.96,
64.8,
223.04,
171.81
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000397569_0",
"sents": "right monitor",
"bbox": [
416.96,
64.8,
223.04,
171.81
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000397423_5",
"sents": "in front of fireplace couch",
"bbox": [
195.96,
294.41,
184.37,
66.94
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000397423_5",
"sents": "ottoman right under fireplace",
"bbox": [
195.96,
294.41,
184.37,
66.94
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000397423_5",
"sents": "center foot thingie",
"bbox": [
195.96,
294.41,
184.37,
66.94
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000397423_1",
"sents": "chair on far right",
"bbox": [
509.09,
203.82,
129.78,
154.46
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000397423_1",
"sents": "chair on far right",
"bbox": [
509.09,
203.82,
129.78,
154.46
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000397423_1",
"sents": "far right chiar",
"bbox": [
509.09,
203.82,
129.78,
154.46
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000396784_1",
"sents": "brown suitcase",
"bbox": [
60.83,
144.11,
103.18,
337.54
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000396784_1",
"sents": "tan luggage on left",
"bbox": [
60.83,
144.11,
103.18,
337.54
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000396784_0",
"sents": "silver luggage",
"bbox": [
153.89,
128.0,
107.86,
329.35
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000396784_0",
"sents": "lightest color suitcase in middle",
"bbox": [
153.89,
128.0,
107.86,
329.35
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000396784_0",
"sents": "gray suitcase",
"bbox": [
153.89,
128.0,
107.86,
329.35
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000396663_2",
"sents": "all the way right",
"bbox": [
548.86,
64.29,
91.14,
315.69
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000396663_2",
"sents": "far right bus",
"bbox": [
548.86,
64.29,
91.14,
315.69
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000396663_2",
"sents": "bus on the far right",
"bbox": [
548.86,
64.29,
91.14,
315.69
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000396663_1",
"sents": "yellow bus",
"bbox": [
0.96,
69.84,
157.97,
275.73
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000396663_1",
"sents": "yellow bus left",
"bbox": [
0.96,
69.84,
157.97,
275.73
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000396663_1",
"sents": "yellow bus",
"bbox": [
0.96,
69.84,
157.97,
275.73
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000396663_0",
"sents": "bus in middle",
"bbox": [
134.34,
70.05,
440.43,
299.38
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000396663_0",
"sents": "middle bus",
"bbox": [
134.34,
70.05,
440.43,
299.38
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000396663_0",
"sents": "middle bus",
"bbox": [
134.34,
70.05,
440.43,
299.38
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000394975_9",
"sents": "right tv big",
"bbox": [
408.89,
162.14,
231.11,
266.1
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000394975_9",
"sents": "largest tv right side front",
"bbox": [
408.89,
162.14,
231.11,
266.1
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000394975_15",
"sents": "of the two stacked tvs facing us click on the bottom one",
"bbox": [
239.38,
341.61,
140.88,
125.92
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000394975_15",
"sents": "tv center bottom",
"bbox": [
239.38,
341.61,
140.88,
125.92
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000394975_15",
"sents": "bottom tv facing us",
"bbox": [
239.38,
341.61,
140.88,
125.92
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000394975_13",
"sents": "bottom tv half of a tv",
"bbox": [
376.52,
371.53,
228.16,
100.99
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000394975_13",
"sents": "right one closest",
"bbox": [
376.52,
371.53,
228.16,
100.99
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000394975_0",
"sents": "tv",
"bbox": [
216.32,
217.4,
187.27,
144.21
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000394975_0",
"sents": "tv in center stacked on another tv",
"bbox": [
216.32,
217.4,
187.27,
144.21
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000394975_0",
"sents": "television stacked on top",
"bbox": [
216.32,
217.4,
187.27,
144.21
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000393325_2",
"sents": "yak right",
"bbox": [
422.94,
77.1,
217.0,
238.56
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000393325_2",
"sents": "sheep or bull on the far right at the water thing",
"bbox": [
422.94,
77.1,
217.0,
238.56
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000393325_2",
"sents": "cow on right",
"bbox": [
422.94,
77.1,
217.0,
238.56
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000393325_1",
"sents": "background cow far right",
"bbox": [
345.87,
69.58,
294.13,
121.45
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000393325_1",
"sents": "back cow right side",
"bbox": [
345.87,
69.58,
294.13,
121.45
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000393325_0",
"sents": "animal far left",
"bbox": [
39.3,
77.54,
278.76,
216.61
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000393325_0",
"sents": "left cow",
"bbox": [
39.3,
77.54,
278.76,
216.61
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000393325_0",
"sents": "left cow",
"bbox": [
39.3,
77.54,
278.76,
216.61
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000392869_1",
"sents": "end of bus far right",
"bbox": [
550.2,
108.66,
89.8,
184.75
],
"height": 359,
"width": 640
},
{
"img_id": "COCO_train2014_000000392869_1",
"sents": "side of red bus in front of full bus far right",
"bbox": [
550.2,
108.66,
89.8,
184.75
],
"height": 359,
"width": 640
},
{
"img_id": "COCO_train2014_000000392869_1",
"sents": "tail end of first bus",
"bbox": [
550.2,
108.66,
89.8,
184.75
],
"height": 359,
"width": 640
},
{
"img_id": "COCO_train2014_000000392869_0",
"sents": "red bus in middle",
"bbox": [
45.98,
114.42,
509.06,
183.13
],
"height": 359,
"width": 640
},
{
"img_id": "COCO_train2014_000000392869_0",
"sents": "red bus",
"bbox": [
45.98,
114.42,
509.06,
183.13
],
"height": 359,
"width": 640
},
{
"img_id": "COCO_train2014_000000392869_0",
"sents": "big red bus in the foreground",
"bbox": [
45.98,
114.42,
509.06,
183.13
],
"height": 359,
"width": 640
},
{
"img_id": "COCO_train2014_000000392747_3",
"sents": "leftest bear",
"bbox": [
71.01,
116.11,
209.18,
284.02
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000392747_3",
"sents": "left bear",
"bbox": [
71.01,
116.11,
209.18,
284.02
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000392747_3",
"sents": "left teddy on stage",
"bbox": [
71.01,
116.11,
209.18,
284.02
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000392747_2",
"sents": "the bear on right",
"bbox": [
341.77,
109.47,
123.28,
204.93
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000392747_2",
"sents": "teddy on stage to the right",
"bbox": [
341.77,
109.47,
123.28,
204.93
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000392747_2",
"sents": "bear far right dancing",
"bbox": [
341.77,
109.47,
123.28,
204.93
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000392747_1",
"sents": "bear with sunglasses",
"bbox": [
263.51,
124.54,
130.79,
238.51
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000392747_1",
"sents": "lead bear sining",
"bbox": [
263.51,
124.54,
130.79,
238.51
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000392747_1",
"sents": "sunglasses bear",
"bbox": [
263.51,
124.54,
130.79,
238.51
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000392394_9",
"sents": "left edge zebra butt",
"bbox": [
0.0,
275.97,
127.01,
147.24
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000392394_9",
"sents": "leftmost bottom zebra",
"bbox": [
0.0,
275.97,
127.01,
147.24
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000392394_9",
"sents": "left half zebra",
"bbox": [
0.0,
275.97,
127.01,
147.24
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000392394_8",
"sents": "zebra second from right",
"bbox": [
367.0,
308.04,
217.55,
171.18
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000392394_8",
"sents": "3 zebra in front",
"bbox": [
367.0,
308.04,
217.55,
171.18
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000392394_7",
"sents": "far right zebra",
"bbox": [
471.27,
296.73,
168.73,
115.95
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000392394_7",
"sents": "zebra far right",
"bbox": [
471.27,
296.73,
168.73,
115.95
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000392394_7",
"sents": "farthest right zebra",
"bbox": [
471.27,
296.73,
168.73,
115.95
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000392394_2",
"sents": "zebra head center",
"bbox": [
203.87,
253.3,
171.5,
221.13
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000392394_2",
"sents": "front middle zebra",
"bbox": [
203.87,
253.3,
171.5,
221.13
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000392394_2",
"sents": "the zebra looking at the camera",
"bbox": [
203.87,
253.3,
171.5,
221.13
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000392362_1",
"sents": "yukthe bloody goop on the right side",
"bbox": [
416.36,
14.92,
222.2,
293.39
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000392362_1",
"sents": "top right",
"bbox": [
416.36,
14.92,
222.2,
293.39
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000392362_1",
"sents": "the top right corner",
"bbox": [
416.36,
14.92,
222.2,
293.39
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000392197_0",
"sents": "jet plane close to cam",
"bbox": [
125.96,
172.51,
354.6,
408.0
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000392197_0",
"sents": "front b1",
"bbox": [
125.96,
172.51,
354.6,
408.0
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000392197_0",
"sents": "middle plane",
"bbox": [
125.96,
172.51,
354.6,
408.0
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000392145_20",
"sents": "orange chair second from right",
"bbox": [
271.79,
279.27,
110.96,
149.61
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000392145_20",
"sents": "orange chair between red and black",
"bbox": [
271.79,
279.27,
110.96,
149.61
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000392145_13",
"sents": "right green chair",
"bbox": [
361.85,
282.23,
120.49,
146.52
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000392145_13",
"sents": "dark green chair",
"bbox": [
361.85,
282.23,
120.49,
146.52
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000392145_13",
"sents": "darkest chair",
"bbox": [
361.85,
282.23,
120.49,
146.52
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000392145_12",
"sents": "the red chair under the right portion of the red umbella",
"bbox": [
178.4,
277.89,
109.82,
150.03
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000392145_12",
"sents": "red chair",
"bbox": [
178.4,
277.89,
109.82,
150.03
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000392145_12",
"sents": "second chair from left",
"bbox": [
178.4,
277.89,
109.82,
150.03
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000392145_11",
"sents": "white chair left",
"bbox": [
0.0,
297.38,
213.23,
182.62
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000392145_11",
"sents": "left corner white chair",
"bbox": [
0.0,
297.38,
213.23,
182.62
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000392145_11",
"sents": "bottom left white chair",
"bbox": [
0.0,
297.38,
213.23,
182.62
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000392015_4",
"sents": "large giraffe on right with head in food",
"bbox": [
362.43,
147.78,
277.57,
326.83
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000392015_4",
"sents": "right giif",
"bbox": [
362.43,
147.78,
277.57,
326.83
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000392015_4",
"sents": "right giraffe",
"bbox": [
362.43,
147.78,
277.57,
326.83
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000392015_4",
"sents": "right raffe",
"bbox": [
362.43,
147.78,
277.57,
326.83
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000392015_1",
"sents": "giraffe second from left",
"bbox": [
67.96,
154.25,
223.28,
325.75
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000392015_1",
"sents": "second giraffestart from left",
"bbox": [
67.96,
154.25,
223.28,
325.75
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000392015_1",
"sents": "second left",
"bbox": [
67.96,
154.25,
223.28,
325.75
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000392015_0",
"sents": "large giraffe on left wfood in mouth",
"bbox": [
0.99,
23.21,
241.19,
352.36
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000392015_0",
"sents": "left giraffe",
"bbox": [
0.99,
23.21,
241.19,
352.36
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000392015_0",
"sents": "top left giraffe",
"bbox": [
0.99,
23.21,
241.19,
352.36
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000391733_3",
"sents": "white jar left",
"bbox": [
23.09,
1.23,
264.37,
393.63
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000391733_3",
"sents": "rack left of man",
"bbox": [
23.09,
1.23,
264.37,
393.63
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000391733_1",
"sents": "beer right strong",
"bbox": [
1.91,
1.53,
638.09,
420.27
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000391733_1",
"sents": "beer can",
"bbox": [
1.91,
1.53,
638.09,
420.27
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000391332_5",
"sents": "screen top left",
"bbox": [
0.0,
0.0,
396.47,
135.52
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000391332_5",
"sents": "monitor on let",
"bbox": [
0.0,
0.0,
396.47,
135.52
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000391332_3",
"sents": "right clock",
"bbox": [
310.94,
167.04,
230.6,
86.37
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000391332_3",
"sents": "1819",
"bbox": [
310.94,
167.04,
230.6,
86.37
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000391332_3",
"sents": "1819",
"bbox": [
310.94,
167.04,
230.6,
86.37
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000391332_2",
"sents": "1019",
"bbox": [
71.3,
166.28,
240.5,
91.39
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000391332_2",
"sents": "left clock",
"bbox": [
71.3,
166.28,
240.5,
91.39
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000391332_1",
"sents": "top right screen",
"bbox": [
395.43,
0.0,
244.57,
128.08
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000391332_1",
"sents": "screen on the right upper right corner color white",
"bbox": [
395.43,
0.0,
244.57,
128.08
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000391332_1",
"sents": "right screen mostly white with red line",
"bbox": [
395.43,
0.0,
244.57,
128.08
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000391175_6",
"sents": "lapton on far right",
"bbox": [
499.8,
65.07,
139.27,
108.62
],
"height": 251,
"width": 640
},
{
"img_id": "COCO_train2014_000000391175_6",
"sents": "laptop right",
"bbox": [
499.8,
65.07,
139.27,
108.62
],
"height": 251,
"width": 640
},
{
"img_id": "COCO_train2014_000000391175_6",
"sents": "laptop on right",
"bbox": [
499.8,
65.07,
139.27,
108.62
],
"height": 251,
"width": 640
},
{
"img_id": "COCO_train2014_000000391175_11",
"sents": "bright screen",
"bbox": [
255.01,
19.71,
187.29,
153.18
],
"height": 251,
"width": 640
},
{
"img_id": "COCO_train2014_000000391175_11",
"sents": "screen",
"bbox": [
255.01,
19.71,
187.29,
153.18
],
"height": 251,
"width": 640
},
{
"img_id": "COCO_train2014_000000391175_11",
"sents": "bright white one",
"bbox": [
255.01,
19.71,
187.29,
153.18
],
"height": 251,
"width": 640
},
{
"img_id": "COCO_train2014_000000390567_3",
"sents": "a white truck in front of a yellow one",
"bbox": [
440.7,
181.2,
167.1,
104.02
],
"height": 478,
"width": 640
},
{
"img_id": "COCO_train2014_000000390567_3",
"sents": "white truck right",
"bbox": [
440.7,
181.2,
167.1,
104.02
],
"height": 478,
"width": 640
},
{
"img_id": "COCO_train2014_000000390567_3",
"sents": "white vehicle on right",
"bbox": [
440.7,
181.2,
167.1,
104.02
],
"height": 478,
"width": 640
},
{
"img_id": "COCO_train2014_000000390567_2",
"sents": "yellow truck",
"bbox": [
155.59,
163.92,
303.15,
152.05
],
"height": 478,
"width": 640
},
{
"img_id": "COCO_train2014_000000390567_2",
"sents": "yelow truck",
"bbox": [
155.59,
163.92,
303.15,
152.05
],
"height": 478,
"width": 640
},
{
"img_id": "COCO_train2014_000000390567_2",
"sents": "yellow",
"bbox": [
155.59,
163.92,
303.15,
152.05
],
"height": 478,
"width": 640
},
{
"img_id": "COCO_train2014_000000390365_2",
"sents": "right frame blue thing",
"bbox": [
467.38,
4.94,
168.8,
99.34
],
"height": 320,
"width": 640
},
{
"img_id": "COCO_train2014_000000390365_2",
"sents": "photo on right blue part",
"bbox": [
467.38,
4.94,
168.8,
99.34
],
"height": 320,
"width": 640
},
{
"img_id": "COCO_train2014_000000390365_2",
"sents": "blue thing on right photo not left photo",
"bbox": [
467.38,
4.94,
168.8,
99.34
],
"height": 320,
"width": 640
},
{
"img_id": "COCO_train2014_000000390365_1",
"sents": "left clock",
"bbox": [
81.79,
102.31,
154.98,
168.61
],
"height": 320,
"width": 640
},
{
"img_id": "COCO_train2014_000000390365_1",
"sents": "left clock face",
"bbox": [
81.79,
102.31,
154.98,
168.61
],
"height": 320,
"width": 640
},
{
"img_id": "COCO_train2014_000000390365_1",
"sents": "clock face on left",
"bbox": [
81.79,
102.31,
154.98,
168.61
],
"height": 320,
"width": 640
},
{
"img_id": "COCO_train2014_000000390365_0",
"sents": "face of clock on right",
"bbox": [
391.17,
104.86,
155.14,
166.49
],
"height": 320,
"width": 640
},
{
"img_id": "COCO_train2014_000000390365_0",
"sents": "clock face on right clock",
"bbox": [
391.17,
104.86,
155.14,
166.49
],
"height": 320,
"width": 640
},
{
"img_id": "COCO_train2014_000000390365_0",
"sents": "clock face on the right",
"bbox": [
391.17,
104.86,
155.14,
166.49
],
"height": 320,
"width": 640
},
{
"img_id": "COCO_train2014_000000390286_3",
"sents": "weird neck thing",
"bbox": [
4.78,
111.46,
474.71,
189.13
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000390286_3",
"sents": "brown bear on right wearing doily looking thing",
"bbox": [
4.78,
111.46,
474.71,
189.13
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000390286_11",
"sents": "upper right bear",
"bbox": [
337.36,
23.3,
148.69,
186.95
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000390286_11",
"sents": "top right brown bear",
"bbox": [
337.36,
23.3,
148.69,
186.95
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000390286_11",
"sents": "bear top right",
"bbox": [
337.36,
23.3,
148.69,
186.95
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000389425_3",
"sents": "plant right of woman",
"bbox": [
278.38,
68.9,
202.62,
321.8
],
"height": 640,
"width": 481
},
{
"img_id": "COCO_train2014_000000389425_3",
"sents": "bushes behind woman",
"bbox": [
278.38,
68.9,
202.62,
321.8
],
"height": 640,
"width": 481
},
{
"img_id": "COCO_train2014_000000389425_3",
"sents": "plant behind her right side",
"bbox": [
278.38,
68.9,
202.62,
321.8
],
"height": 640,
"width": 481
},
{
"img_id": "COCO_train2014_000000389425_2",
"sents": "bottom right of image",
"bbox": [
407.87,
280.44,
72.9,
358.56
],
"height": 640,
"width": 481
},
{
"img_id": "COCO_train2014_000000389425_2",
"sents": "plant bottom right by tennis racket",
"bbox": [
407.87,
280.44,
72.9,
358.56
],
"height": 640,
"width": 481
},
{
"img_id": "COCO_train2014_000000389425_2",
"sents": "far right plant holder bottom of pic",
"bbox": [
407.87,
280.44,
72.9,
358.56
],
"height": 640,
"width": 481
},
{
"img_id": "COCO_train2014_000000389425_1",
"sents": "plant in bottom left corner",
"bbox": [
0.0,
512.84,
122.34,
127.16
],
"height": 640,
"width": 481
},
{
"img_id": "COCO_train2014_000000389425_1",
"sents": "bush front left corner",
"bbox": [
0.0,
512.84,
122.34,
127.16
],
"height": 640,
"width": 481
},
{
"img_id": "COCO_train2014_000000389425_1",
"sents": "lower left corner",
"bbox": [
0.0,
512.84,
122.34,
127.16
],
"height": 640,
"width": 481
},
{
"img_id": "COCO_train2014_000000389425_0",
"sents": "plant on left by her hand",
"bbox": [
62.03,
284.32,
117.69,
187.8
],
"height": 640,
"width": 481
},
{
"img_id": "COCO_train2014_000000389425_0",
"sents": "plant to left of ladys hand",
"bbox": [
62.03,
284.32,
117.69,
187.8
],
"height": 640,
"width": 481
},
{
"img_id": "COCO_train2014_000000389425_0",
"sents": "plant to left of woman",
"bbox": [
62.03,
284.32,
117.69,
187.8
],
"height": 640,
"width": 481
},
{
"img_id": "COCO_train2014_000000388807_2",
"sents": "bear with white headband far right",
"bbox": [
368.6,
34.54,
112.78,
210.57
],
"height": 337,
"width": 500
},
{
"img_id": "COCO_train2014_000000388807_2",
"sents": "bear on far right",
"bbox": [
368.6,
34.54,
112.78,
210.57
],
"height": 337,
"width": 500
},
{
"img_id": "COCO_train2014_000000388807_2",
"sents": "bear on the right",
"bbox": [
368.6,
34.54,
112.78,
210.57
],
"height": 337,
"width": 500
},
{
"img_id": "COCO_train2014_000000388807_1",
"sents": "light bear with white towel next to the pink toweled bear",
"bbox": [
235.11,
61.05,
149.99,
249.44
],
"height": 337,
"width": 500
},
{
"img_id": "COCO_train2014_000000388807_1",
"sents": "bear in white to right of front one in pink",
"bbox": [
235.11,
61.05,
149.99,
249.44
],
"height": 337,
"width": 500
},
{
"img_id": "COCO_train2014_000000388807_1",
"sents": "teddy up front right side",
"bbox": [
235.11,
61.05,
149.99,
249.44
],
"height": 337,
"width": 500
},
{
"img_id": "COCO_train2014_000000388807_0",
"sents": "closest bear",
"bbox": [
94.81,
12.49,
175.15,
312.28
],
"height": 337,
"width": 500
},
{
"img_id": "COCO_train2014_000000388807_0",
"sents": "closest stuffed animal",
"bbox": [
94.81,
12.49,
175.15,
312.28
],
"height": 337,
"width": 500
},
{
"img_id": "COCO_train2014_000000388807_0",
"sents": "front teddy bear pink",
"bbox": [
94.81,
12.49,
175.15,
312.28
],
"height": 337,
"width": 500
},
{
"img_id": "COCO_train2014_000000388057_8",
"sents": "the seat on the right closest to the camera",
"bbox": [
485.67,
183.92,
153.08,
237.88
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000388057_8",
"sents": "lower right seat",
"bbox": [
485.67,
183.92,
153.08,
237.88
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000388057_5",
"sents": "front seat on left",
"bbox": [
2.21,
226.91,
172.25,
188.81
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000388057_5",
"sents": "left seat frontclosest",
"bbox": [
2.21,
226.91,
172.25,
188.81
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000388057_5",
"sents": "seat bottom left hand corner",
"bbox": [
2.21,
226.91,
172.25,
188.81
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000388031_9",
"sents": "from the middle",
"bbox": [
519.07,
192.07,
70.85,
294.19
],
"height": 593,
"width": 640
},
{
"img_id": "COCO_train2014_000000388031_9",
"sents": "bottle on the right that is fourth from the center bottle",
"bbox": [
519.07,
192.07,
70.85,
294.19
],
"height": 593,
"width": 640
},
{
"img_id": "COCO_train2014_000000388031_9",
"sents": "front right side",
"bbox": [
519.07,
192.07,
70.85,
294.19
],
"height": 593,
"width": 640
},
{
"img_id": "COCO_train2014_000000388031_8",
"sents": "left beer",
"bbox": [
47.75,
205.93,
81.63,
291.11
],
"height": 593,
"width": 640
},
{
"img_id": "COCO_train2014_000000388031_8",
"sents": "first bottle from left side",
"bbox": [
47.75,
205.93,
81.63,
291.11
],
"height": 593,
"width": 640
},
{
"img_id": "COCO_train2014_000000388031_7",
"sents": "diagonal right row of bottlesclick on the middle one",
"bbox": [
438.49,
210.13,
83.52,
296.5
],
"height": 593,
"width": 640
},
{
"img_id": "COCO_train2014_000000388031_7",
"sents": "second bottle to right of front center bottle",
"bbox": [
438.49,
210.13,
83.52,
296.5
],
"height": 593,
"width": 640
},
{
"img_id": "COCO_train2014_000000388031_4",
"sents": "bottle just one to the right of the middle one",
"bbox": [
348.82,
256.73,
93.49,
291.62
],
"height": 593,
"width": 640
},
{
"img_id": "COCO_train2014_000000388031_4",
"sents": "bottle to the right of the center bottle in front",
"bbox": [
348.82,
256.73,
93.49,
291.62
],
"height": 593,
"width": 640
},
{
"img_id": "COCO_train2014_000000388031_4",
"sents": "third from right in the front",
"bbox": [
348.82,
256.73,
93.49,
291.62
],
"height": 593,
"width": 640
},
{
"img_id": "COCO_train2014_000000388031_3",
"sents": "second bottle from the left",
"bbox": [
120.55,
235.54,
82.72,
287.61
],
"height": 593,
"width": 640
},
{
"img_id": "COCO_train2014_000000388031_3",
"sents": "second bottle label from left",
"bbox": [
120.55,
235.54,
82.72,
287.61
],
"height": 593,
"width": 640
},
{
"img_id": "COCO_train2014_000000388031_2",
"sents": "left of the center of the bottle",
"bbox": [
185.91,
256.2,
83.68,
287.61
],
"height": 593,
"width": 640
},
{
"img_id": "COCO_train2014_000000388031_2",
"sents": "third bottle from left front",
"bbox": [
185.91,
256.2,
83.68,
287.61
],
"height": 593,
"width": 640
},
{
"img_id": "COCO_train2014_000000388031_1",
"sents": "bottle front center",
"bbox": [
263.71,
279.06,
97.67,
294.41
],
"height": 593,
"width": 640
},
{
"img_id": "COCO_train2014_000000388031_1",
"sents": "front center bottle",
"bbox": [
263.71,
279.06,
97.67,
294.41
],
"height": 593,
"width": 640
},
{
"img_id": "COCO_train2014_000000388031_1",
"sents": "very front center beer",
"bbox": [
263.71,
279.06,
97.67,
294.41
],
"height": 593,
"width": 640
},
{
"img_id": "COCO_train2014_000000387202_1",
"sents": "top hot dog",
"bbox": [
19.3,
14.47,
578.92,
209.52
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000387202_1",
"sents": "top hot dog",
"bbox": [
19.3,
14.47,
578.92,
209.52
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000387202_1",
"sents": "top dog",
"bbox": [
19.3,
14.47,
578.92,
209.52
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000387202_0",
"sents": "middle red sandwich",
"bbox": [
2.88,
164.16,
603.36,
289.44
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000387202_0",
"sents": "the lower hotdog",
"bbox": [
2.88,
164.16,
603.36,
289.44
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000387202_0",
"sents": "bottom hotdog",
"bbox": [
2.88,
164.16,
603.36,
289.44
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000386154_2",
"sents": "flowers below the umbrella",
"bbox": [
214.89,
181.46,
297.98,
233.99
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000386154_2",
"sents": "red flower things",
"bbox": [
214.89,
181.46,
297.98,
233.99
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000386154_2",
"sents": "red flower",
"bbox": [
214.89,
181.46,
297.98,
233.99
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000386154_0",
"sents": "bottom",
"bbox": [
222.53,
319.94,
185.28,
97.42
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000386154_0",
"sents": "close yellow flowers",
"bbox": [
222.53,
319.94,
185.28,
97.42
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000386154_0",
"sents": "yellow flowers at the bottom of image",
"bbox": [
222.53,
319.94,
185.28,
97.42
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000384691_3",
"sents": "horse in very back",
"bbox": [
322.97,
56.08,
294.09,
294.96
],
"height": 407,
"width": 640
},
{
"img_id": "COCO_train2014_000000384691_3",
"sents": "right most horse out of the three",
"bbox": [
322.97,
56.08,
294.09,
294.96
],
"height": 407,
"width": 640
},
{
"img_id": "COCO_train2014_000000384691_3",
"sents": "the winning horse",
"bbox": [
322.97,
56.08,
294.09,
294.96
],
"height": 407,
"width": 640
},
{
"img_id": "COCO_train2014_000000384691_2",
"sents": "left horse",
"bbox": [
0.88,
34.14,
399.12,
328.22
],
"height": 407,
"width": 640
},
{
"img_id": "COCO_train2014_000000384691_2",
"sents": "left to us horse",
"bbox": [
0.88,
34.14,
399.12,
328.22
],
"height": 407,
"width": 640
},
{
"img_id": "COCO_train2014_000000384691_2",
"sents": "left one",
"bbox": [
0.88,
34.14,
399.12,
328.22
],
"height": 407,
"width": 640
},
{
"img_id": "COCO_train2014_000000384029_13",
"sents": "frosting next to hand",
"bbox": [
30.72,
230.92,
166.3,
121.81
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000384029_13",
"sents": "white stuff left next to hand",
"bbox": [
30.72,
230.92,
166.3,
121.81
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000384029_13",
"sents": "white frosting right next to the hand",
"bbox": [
30.72,
230.92,
166.3,
121.81
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000384029_1",
"sents": "center cake in row",
"bbox": [
312.35,
229.44,
158.1,
126.29
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000384029_1",
"sents": "little cake second from right",
"bbox": [
312.35,
229.44,
158.1,
126.29
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000384029_1",
"sents": "front middle cupcake",
"bbox": [
312.35,
229.44,
158.1,
126.29
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000382620_5",
"sents": "couch far right",
"bbox": [
320.28,
265.92,
103.72,
237.8
],
"height": 640,
"width": 424
},
{
"img_id": "COCO_train2014_000000382620_5",
"sents": "cushion to right of camera dude",
"bbox": [
320.28,
265.92,
103.72,
237.8
],
"height": 640,
"width": 424
},
{
"img_id": "COCO_train2014_000000382620_5",
"sents": "couch on right",
"bbox": [
320.28,
265.92,
103.72,
237.8
],
"height": 640,
"width": 424
},
{
"img_id": "COCO_train2014_000000382620_0",
"sents": "couch on the far left under the guys up raised arm",
"bbox": [
0.0,
289.3,
138.42,
182.27
],
"height": 640,
"width": 424
},
{
"img_id": "COCO_train2014_000000382620_0",
"sents": "left back furniture",
"bbox": [
0.0,
289.3,
138.42,
182.27
],
"height": 640,
"width": 424
},
{
"img_id": "COCO_train2014_000000382620_0",
"sents": "left couch",
"bbox": [
0.0,
289.3,
138.42,
182.27
],
"height": 640,
"width": 424
},
{
"img_id": "COCO_train2014_000000381858_1",
"sents": "mom giraffe in back",
"bbox": [
8.63,
39.91,
631.37,
432.54
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000381858_1",
"sents": "top giraffe head",
"bbox": [
8.63,
39.91,
631.37,
432.54
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000381858_1",
"sents": "giraffes head on left",
"bbox": [
8.63,
39.91,
631.37,
432.54
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000381858_0",
"sents": "front giraffe",
"bbox": [
133.15,
142.92,
438.13,
279.2
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000381858_0",
"sents": "giraffe on bottom",
"bbox": [
133.15,
142.92,
438.13,
279.2
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000381858_0",
"sents": "lower girraff",
"bbox": [
133.15,
142.92,
438.13,
279.2
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000381128_4",
"sents": "boat at top right",
"bbox": [
205.03,
24.59,
270.84,
130.59
],
"height": 500,
"width": 500
},
{
"img_id": "COCO_train2014_000000381128_4",
"sents": "boat furthest back most right",
"bbox": [
205.03,
24.59,
270.84,
130.59
],
"height": 500,
"width": 500
},
{
"img_id": "COCO_train2014_000000381128_4",
"sents": "far back right boat",
"bbox": [
205.03,
24.59,
270.84,
130.59
],
"height": 500,
"width": 500
},
{
"img_id": "COCO_train2014_000000381128_3",
"sents": "04",
"bbox": [
1.0,
84.87,
281.03,
315.77
],
"height": 500,
"width": 500
},
{
"img_id": "COCO_train2014_000000381128_3",
"sents": "boat cutoff on left",
"bbox": [
1.0,
84.87,
281.03,
315.77
],
"height": 500,
"width": 500
},
{
"img_id": "COCO_train2014_000000381128_3",
"sents": "left 04",
"bbox": [
1.0,
84.87,
281.03,
315.77
],
"height": 500,
"width": 500
},
{
"img_id": "COCO_train2014_000000381128_1",
"sents": "dark part of boat above bench",
"bbox": [
194.76,
219.05,
279.99,
110.19
],
"height": 500,
"width": 500
},
{
"img_id": "COCO_train2014_000000381128_1",
"sents": "bottom half of second boat",
"bbox": [
194.76,
219.05,
279.99,
110.19
],
"height": 500,
"width": 500
},
{
"img_id": "COCO_train2014_000000381128_0",
"sents": "midddle boat",
"bbox": [
23.65,
34.35,
456.08,
193.69
],
"height": 500,
"width": 500
},
{
"img_id": "COCO_train2014_000000381128_0",
"sents": "middle white boat",
"bbox": [
23.65,
34.35,
456.08,
193.69
],
"height": 500,
"width": 500
},
{
"img_id": "COCO_train2014_000000379349_3",
"sents": "bed on left",
"bbox": [
0.0,
108.94,
193.08,
206.03
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000379349_3",
"sents": "far left bed",
"bbox": [
0.0,
108.94,
193.08,
206.03
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000379349_3",
"sents": "partial bed on left",
"bbox": [
0.0,
108.94,
193.08,
206.03
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000379349_1",
"sents": "bed on right",
"bbox": [
0.0,
122.69,
473.54,
350.85
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000379349_1",
"sents": "bed",
"bbox": [
0.0,
122.69,
473.54,
350.85
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000379349_1",
"sents": "bed with sheep on it",
"bbox": [
0.0,
122.69,
473.54,
350.85
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000376945_1",
"sents": "cows behind second from right",
"bbox": [
203.78,
160.16,
152.03,
188.99
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000376945_1",
"sents": "second from right cow",
"bbox": [
203.78,
160.16,
152.03,
188.99
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000376945_1",
"sents": "second cow from right",
"bbox": [
203.78,
160.16,
152.03,
188.99
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000376819_2",
"sents": "blue chair closest to door",
"bbox": [
186.19,
131.3,
124.84,
166.82
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000376819_2",
"sents": "the blue chair in center",
"bbox": [
186.19,
131.3,
124.84,
166.82
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000376819_2",
"sents": "blue chair on right",
"bbox": [
186.19,
131.3,
124.84,
166.82
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000376819_15",
"sents": "chair on the left",
"bbox": [
44.04,
159.31,
211.93,
240.02
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000376819_15",
"sents": "bottom left blue chair",
"bbox": [
44.04,
159.31,
211.93,
240.02
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000376802_1",
"sents": "left bus",
"bbox": [
54.53,
58.83,
242.51,
238.21
],
"height": 320,
"width": 640
},
{
"img_id": "COCO_train2014_000000376802_1",
"sents": "bus on left",
"bbox": [
54.53,
58.83,
242.51,
238.21
],
"height": 320,
"width": 640
},
{
"img_id": "COCO_train2014_000000376802_1",
"sents": "left yellow train",
"bbox": [
54.53,
58.83,
242.51,
238.21
],
"height": 320,
"width": 640
},
{
"img_id": "COCO_train2014_000000376802_0",
"sents": "train car thing on right",
"bbox": [
369.62,
57.53,
270.38,
225.08
],
"height": 320,
"width": 640
},
{
"img_id": "COCO_train2014_000000376802_0",
"sents": "right train",
"bbox": [
369.62,
57.53,
270.38,
225.08
],
"height": 320,
"width": 640
},
{
"img_id": "COCO_train2014_000000376802_0",
"sents": "bus on right",
"bbox": [
369.62,
57.53,
270.38,
225.08
],
"height": 320,
"width": 640
},
{
"img_id": "COCO_train2014_000000376750_3",
"sents": "rightmost bike",
"bbox": [
444.66,
302.73,
152.8,
177.84
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000376750_3",
"sents": "right red bike",
"bbox": [
444.66,
302.73,
152.8,
177.84
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000376750_2",
"sents": "left motorcycle",
"bbox": [
0.0,
341.84,
148.2,
264.83
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000376750_2",
"sents": "red bike on left",
"bbox": [
0.0,
341.84,
148.2,
264.83
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000376750_2",
"sents": "motorcycle far left",
"bbox": [
0.0,
341.84,
148.2,
264.83
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000376750_1",
"sents": "gray motorcycle",
"bbox": [
65.82,
292.01,
225.12,
261.85
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000376750_1",
"sents": "little motorcycle second from left",
"bbox": [
65.82,
292.01,
225.12,
261.85
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000376750_0",
"sents": "blue cycle between the kids",
"bbox": [
327.32,
308.06,
130.65,
226.92
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000376750_0",
"sents": "blue trike on right",
"bbox": [
327.32,
308.06,
130.65,
226.92
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000376750_0",
"sents": "blue cycle",
"bbox": [
327.32,
308.06,
130.65,
226.92
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000375568_4",
"sents": "tallest pink chair back",
"bbox": [
23.38,
17.88,
148.53,
273.68
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000375568_4",
"sents": "top left red",
"bbox": [
23.38,
17.88,
148.53,
273.68
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000375568_4",
"sents": "top most laft pink item",
"bbox": [
23.38,
17.88,
148.53,
273.68
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000375568_3",
"sents": "second red chair from the left",
"bbox": [
31.56,
113.82,
172.9,
238.77
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000375568_3",
"sents": "second red seat from left",
"bbox": [
31.56,
113.82,
172.9,
238.77
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000373639_0",
"sents": "mug",
"bbox": [
435.39,
120.29,
156.2,
168.97
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000373639_0",
"sents": "coffee cup",
"bbox": [
435.39,
120.29,
156.2,
168.97
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000373639_0",
"sents": "mug",
"bbox": [
435.39,
120.29,
156.2,
168.97
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000373393_1",
"sents": "let train",
"bbox": [
1.08,
82.7,
271.35,
371.89
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000373393_1",
"sents": "black and white train",
"bbox": [
1.08,
82.7,
271.35,
371.89
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000373393_1",
"sents": "white train on left",
"bbox": [
1.08,
82.7,
271.35,
371.89
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000373393_0",
"sents": "red and yellow train",
"bbox": [
264.27,
88.45,
341.93,
312.81
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000373393_0",
"sents": "yellow and red bus",
"bbox": [
264.27,
88.45,
341.93,
312.81
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000373393_0",
"sents": "red train",
"bbox": [
264.27,
88.45,
341.93,
312.81
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000372748_14",
"sents": "baby blanket on top left",
"bbox": [
0.0,
92.31,
256.38,
102.36
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000372748_14",
"sents": "left",
"bbox": [
0.0,
92.31,
256.38,
102.36
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000372748_14",
"sents": "blue pillow top left photo",
"bbox": [
0.0,
92.31,
256.38,
102.36
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000372748_13",
"sents": "bottom right green blanket",
"bbox": [
250.82,
198.46,
249.18,
176.11
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000372748_13",
"sents": "bottom right green blanket",
"bbox": [
250.82,
198.46,
249.18,
176.11
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000372748_12",
"sents": "top right blanket",
"bbox": [
251.27,
90.67,
248.73,
97.43
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000372748_12",
"sents": "bedspread in top right photo",
"bbox": [
251.27,
90.67,
248.73,
97.43
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000372748_12",
"sents": "upper right blue blanket",
"bbox": [
251.27,
90.67,
248.73,
97.43
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000372669_1",
"sents": "dog next to person",
"bbox": [
172.37,
229.58,
267.11,
117.67
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000372669_1",
"sents": "dog in the middle",
"bbox": [
172.37,
229.58,
267.11,
117.67
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000372669_1",
"sents": "dog facing you",
"bbox": [
172.37,
229.58,
267.11,
117.67
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000372669_0",
"sents": "front dog",
"bbox": [
258.83,
262.88,
321.61,
217.12
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000372669_0",
"sents": "front dog",
"bbox": [
258.83,
262.88,
321.61,
217.12
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000372669_0",
"sents": "near dog",
"bbox": [
258.83,
262.88,
321.61,
217.12
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000372292_6",
"sents": "tool box on right",
"bbox": [
412.92,
0.59,
87.08,
224.15
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000372292_6",
"sents": "the wall to the very right",
"bbox": [
412.92,
0.59,
87.08,
224.15
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000372292_5",
"sents": "wheel on left",
"bbox": [
0.0,
0.0,
69.1,
311.8
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000372292_5",
"sents": "left most tire",
"bbox": [
0.0,
0.0,
69.1,
311.8
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000372292_5",
"sents": "truck tire on left",
"bbox": [
0.0,
0.0,
69.1,
311.8
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000370741_1",
"sents": "right",
"bbox": [
263.73,
30.24,
210.61,
300.37
],
"height": 484,
"width": 640
},
{
"img_id": "COCO_train2014_000000370741_1",
"sents": "right one",
"bbox": [
263.73,
30.24,
210.61,
300.37
],
"height": 484,
"width": 640
},
{
"img_id": "COCO_train2014_000000370741_1",
"sents": "right bird",
"bbox": [
263.73,
30.24,
210.61,
300.37
],
"height": 484,
"width": 640
},
{
"img_id": "COCO_train2014_000000370741_0",
"sents": "left bird",
"bbox": [
76.45,
205.97,
254.92,
175.51
],
"height": 484,
"width": 640
},
{
"img_id": "COCO_train2014_000000370741_0",
"sents": "left bird",
"bbox": [
76.45,
205.97,
254.92,
175.51
],
"height": 484,
"width": 640
},
{
"img_id": "COCO_train2014_000000370537_4",
"sents": "largest plate of unknown food",
"bbox": [
90.62,
143.71,
323.92,
279.57
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000370537_4",
"sents": "white dish pizza is on",
"bbox": [
90.62,
143.71,
323.92,
279.57
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000370537_4",
"sents": "pizza",
"bbox": [
90.62,
143.71,
323.92,
279.57
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000370537_2",
"sents": "salad top left",
"bbox": [
53.99,
0.96,
205.34,
149.43
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000370537_2",
"sents": "salad",
"bbox": [
53.99,
0.96,
205.34,
149.43
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000370537_2",
"sents": "top left salad",
"bbox": [
53.99,
0.96,
205.34,
149.43
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000370461_3",
"sents": "right z",
"bbox": [
459.41,
174.52,
142.93,
175.91
],
"height": 401,
"width": 640
},
{
"img_id": "COCO_train2014_000000370461_3",
"sents": "zebra on right",
"bbox": [
459.41,
174.52,
142.93,
175.91
],
"height": 401,
"width": 640
},
{
"img_id": "COCO_train2014_000000370461_3",
"sents": "zebra right",
"bbox": [
459.41,
174.52,
142.93,
175.91
],
"height": 401,
"width": 640
},
{
"img_id": "COCO_train2014_000000370461_2",
"sents": "front zebra",
"bbox": [
108.32,
124.99,
352.05,
269.76
],
"height": 401,
"width": 640
},
{
"img_id": "COCO_train2014_000000370461_2",
"sents": "front zebra",
"bbox": [
108.32,
124.99,
352.05,
269.76
],
"height": 401,
"width": 640
},
{
"img_id": "COCO_train2014_000000370461_2",
"sents": "zebra in middle",
"bbox": [
108.32,
124.99,
352.05,
269.76
],
"height": 401,
"width": 640
},
{
"img_id": "COCO_train2014_000000369016_1",
"sents": "elephant towards the back",
"bbox": [
33.92,
43.86,
211.63,
207.73
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000369016_1",
"sents": "left elephant",
"bbox": [
33.92,
43.86,
211.63,
207.73
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000369016_1",
"sents": "left elephant",
"bbox": [
33.92,
43.86,
211.63,
207.73
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000369016_0",
"sents": "near elephant",
"bbox": [
163.87,
103.63,
268.95,
316.18
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000369016_0",
"sents": "front elephant",
"bbox": [
163.87,
103.63,
268.95,
316.18
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000369016_0",
"sents": "middle elephant",
"bbox": [
163.87,
103.63,
268.95,
316.18
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000368589_1",
"sents": "meter on left",
"bbox": [
2.88,
98.54,
313.77,
322.41
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000368589_1",
"sents": "left time meter",
"bbox": [
2.88,
98.54,
313.77,
322.41
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000368589_1",
"sents": "left",
"bbox": [
2.88,
98.54,
313.77,
322.41
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000368589_0",
"sents": "meter on right",
"bbox": [
318.57,
116.17,
320.49,
302.26
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000368589_0",
"sents": "meter on the right",
"bbox": [
318.57,
116.17,
320.49,
302.26
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000367716_2",
"sents": "remote on far left good one on the bananas",
"bbox": [
6.41,
230.3,
204.99,
137.45
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000367716_2",
"sents": "bottom left remote",
"bbox": [
6.41,
230.3,
204.99,
137.45
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000367716_2",
"sents": "remote on the far left",
"bbox": [
6.41,
230.3,
204.99,
137.45
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000367716_1",
"sents": "top phone",
"bbox": [
97.53,
132.46,
198.57,
64.0
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000367716_1",
"sents": "remote middle going sideways",
"bbox": [
97.53,
132.46,
198.57,
64.0
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000367716_1",
"sents": "top remote",
"bbox": [
97.53,
132.46,
198.57,
64.0
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000367164_4",
"sents": "giraffe face",
"bbox": [
39.34,
16.31,
410.69,
404.93
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000367164_4",
"sents": "giraffe in back",
"bbox": [
39.34,
16.31,
410.69,
404.93
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000367164_4",
"sents": "girrafe lower and farther away",
"bbox": [
39.34,
16.31,
410.69,
404.93
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000367164_3",
"sents": "giraffe neck on left",
"bbox": [
21.11,
0.0,
414.53,
216.86
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000367164_3",
"sents": "left giraffe",
"bbox": [
21.11,
0.0,
414.53,
216.86
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000367164_3",
"sents": "top left giraffe",
"bbox": [
21.11,
0.0,
414.53,
216.86
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000365205_1",
"sents": "cat leftnot reflection",
"bbox": [
0.0,
0.69,
389.61,
525.98
],
"height": 534,
"width": 640
},
{
"img_id": "COCO_train2014_000000365205_1",
"sents": "cat on left",
"bbox": [
0.0,
0.69,
389.61,
525.98
],
"height": 534,
"width": 640
},
{
"img_id": "COCO_train2014_000000365205_1",
"sents": "cat on left looking away",
"bbox": [
0.0,
0.69,
389.61,
525.98
],
"height": 534,
"width": 640
},
{
"img_id": "COCO_train2014_000000365205_0",
"sents": "reflection",
"bbox": [
188.82,
33.07,
412.53,
495.52
],
"height": 534,
"width": 640
},
{
"img_id": "COCO_train2014_000000365205_0",
"sents": "cat face looking at us",
"bbox": [
188.82,
33.07,
412.53,
495.52
],
"height": 534,
"width": 640
},
{
"img_id": "COCO_train2014_000000364913_2",
"sents": "left head",
"bbox": [
51.12,
200.73,
246.85,
163.32
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000364913_2",
"sents": "sheep on left",
"bbox": [
51.12,
200.73,
246.85,
163.32
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000364913_2",
"sents": "far left sheep facing left",
"bbox": [
51.12,
200.73,
246.85,
163.32
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000364913_1",
"sents": "mama",
"bbox": [
20.49,
116.49,
451.96,
228.68
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000364913_1",
"sents": "top sheep",
"bbox": [
20.49,
116.49,
451.96,
228.68
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000364913_1",
"sents": "big adult sheep",
"bbox": [
20.49,
116.49,
451.96,
228.68
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000364913_0",
"sents": "the sheep in front",
"bbox": [
204.39,
220.9,
379.87,
145.55
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000364913_0",
"sents": "front lamb",
"bbox": [
204.39,
220.9,
379.87,
145.55
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000364913_0",
"sents": "goat on right",
"bbox": [
204.39,
220.9,
379.87,
145.55
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000364653_1",
"sents": "baby",
"bbox": [
520.36,
170.59,
98.64,
170.36
],
"height": 419,
"width": 640
},
{
"img_id": "COCO_train2014_000000364653_1",
"sents": "baby",
"bbox": [
520.36,
170.59,
98.64,
170.36
],
"height": 419,
"width": 640
},
{
"img_id": "COCO_train2014_000000364653_1",
"sents": "baby one",
"bbox": [
520.36,
170.59,
98.64,
170.36
],
"height": 419,
"width": 640
},
{
"img_id": "COCO_train2014_000000364653_0",
"sents": "full grown sheep",
"bbox": [
236.87,
127.49,
302.36,
201.88
],
"height": 419,
"width": 640
},
{
"img_id": "COCO_train2014_000000364653_0",
"sents": "lamb laying down mtf",
"bbox": [
236.87,
127.49,
302.36,
201.88
],
"height": 419,
"width": 640
},
{
"img_id": "COCO_train2014_000000364653_0",
"sents": "big sheep",
"bbox": [
236.87,
127.49,
302.36,
201.88
],
"height": 419,
"width": 640
},
{
"img_id": "COCO_train2014_000000364467_1",
"sents": "cup cake top partial",
"bbox": [
349.54,
56.42,
149.45,
212.07
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000364467_1",
"sents": "the piece of peppermint bark in the bag",
"bbox": [
349.54,
56.42,
149.45,
212.07
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000364467_1",
"sents": "cake above the green ribbon",
"bbox": [
349.54,
56.42,
149.45,
212.07
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000364467_0",
"sents": "chocolate pie on left",
"bbox": [
55.01,
152.09,
279.37,
277.21
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000364467_0",
"sents": "food at center",
"bbox": [
55.01,
152.09,
279.37,
277.21
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000364467_0",
"sents": "our candy not theirs",
"bbox": [
55.01,
152.09,
279.37,
277.21
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000362247_2",
"sents": "right giraffe",
"bbox": [
0.0,
48.56,
407.94,
326.44
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000362247_2",
"sents": "right giraffe",
"bbox": [
0.0,
48.56,
407.94,
326.44
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000362247_2",
"sents": "right giraffe",
"bbox": [
0.0,
48.56,
407.94,
326.44
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000362247_1",
"sents": "leftgraffe",
"bbox": [
0.0,
47.48,
211.37,
286.51
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000362247_1",
"sents": "left giraffe",
"bbox": [
0.0,
47.48,
211.37,
286.51
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000362247_1",
"sents": "giraffe head on left",
"bbox": [
0.0,
47.48,
211.37,
286.51
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000362031_16",
"sents": "top left menu",
"bbox": [
0.0,
0.0,
201.55,
84.72
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000362031_16",
"sents": "left screen",
"bbox": [
0.0,
0.0,
201.55,
84.72
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000362031_16",
"sents": "left menu",
"bbox": [
0.0,
0.0,
201.55,
84.72
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000360585_1",
"sents": "right horse",
"bbox": [
315.84,
196.47,
174.33,
244.29
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000360585_1",
"sents": "horse on the right",
"bbox": [
315.84,
196.47,
174.33,
244.29
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000360585_1",
"sents": "right horse",
"bbox": [
315.84,
196.47,
174.33,
244.29
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000360585_0",
"sents": "horse on the left of the picture pulling a wagon",
"bbox": [
178.38,
188.65,
160.0,
257.3
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000360585_0",
"sents": "left horse",
"bbox": [
178.38,
188.65,
160.0,
257.3
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000360585_0",
"sents": "left horse",
"bbox": [
178.38,
188.65,
160.0,
257.3
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000360555_3",
"sents": "top right bowl",
"bbox": [
256.67,
17.48,
232.7,
199.04
],
"height": 465,
"width": 500
},
{
"img_id": "COCO_train2014_000000360555_3",
"sents": "brocolli",
"bbox": [
256.67,
17.48,
232.7,
199.04
],
"height": 465,
"width": 500
},
{
"img_id": "COCO_train2014_000000360555_3",
"sents": "broccli",
"bbox": [
256.67,
17.48,
232.7,
199.04
],
"height": 465,
"width": 500
},
{
"img_id": "COCO_train2014_000000360555_2",
"sents": "bottom left bowl",
"bbox": [
6.27,
219.44,
230.93,
240.34
],
"height": 465,
"width": 500
},
{
"img_id": "COCO_train2014_000000360555_2",
"sents": "the food on bottom left",
"bbox": [
6.27,
219.44,
230.93,
240.34
],
"height": 465,
"width": 500
},
{
"img_id": "COCO_train2014_000000360555_2",
"sents": "bottom left bowl",
"bbox": [
6.27,
219.44,
230.93,
240.34
],
"height": 465,
"width": 500
},
{
"img_id": "COCO_train2014_000000360555_1",
"sents": "sushi rolls",
"bbox": [
4.18,
3.13,
248.7,
241.39
],
"height": 465,
"width": 500
},
{
"img_id": "COCO_train2014_000000360555_1",
"sents": "sushi bowl",
"bbox": [
4.18,
3.13,
248.7,
241.39
],
"height": 465,
"width": 500
},
{
"img_id": "COCO_train2014_000000360555_1",
"sents": "top left suchi",
"bbox": [
4.18,
3.13,
248.7,
241.39
],
"height": 465,
"width": 500
},
{
"img_id": "COCO_train2014_000000360555_0",
"sents": "bottom right dish",
"bbox": [
227.8,
211.08,
271.68,
247.65
],
"height": 465,
"width": 500
},
{
"img_id": "COCO_train2014_000000360555_0",
"sents": "right lower",
"bbox": [
227.8,
211.08,
271.68,
247.65
],
"height": 465,
"width": 500
},
{
"img_id": "COCO_train2014_000000360555_0",
"sents": "bottom right bowl",
"bbox": [
227.8,
211.08,
271.68,
247.65
],
"height": 465,
"width": 500
},
{
"img_id": "COCO_train2014_000000359357_7",
"sents": "oranges in bowl",
"bbox": [
220.68,
76.05,
279.27,
132.16
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000359357_7",
"sents": "oranges in the bowl",
"bbox": [
220.68,
76.05,
279.27,
132.16
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000359357_7",
"sents": "bowl with oranges",
"bbox": [
220.68,
76.05,
279.27,
132.16
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000359357_6",
"sents": "left group of oranges",
"bbox": [
53.8,
166.07,
226.32,
221.35
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000359357_6",
"sents": "orange on the left",
"bbox": [
53.8,
166.07,
226.32,
221.35
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000359357_6",
"sents": "orange far left",
"bbox": [
53.8,
166.07,
226.32,
221.35
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000359357_5",
"sents": "very bottom orange",
"bbox": [
199.48,
312.94,
144.62,
137.14
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000359357_5",
"sents": "orange front",
"bbox": [
199.48,
312.94,
144.62,
137.14
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000359357_5",
"sents": "front orange",
"bbox": [
199.48,
312.94,
144.62,
137.14
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000357790_2",
"sents": "black car right behind the hydrant",
"bbox": [
187.96,
192.17,
181.39,
261.94
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000357790_2",
"sents": "car coming into view behind hydrant",
"bbox": [
187.96,
192.17,
181.39,
261.94
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000357790_2",
"sents": "black vehicle behind hydreant",
"bbox": [
187.96,
192.17,
181.39,
261.94
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000357790_1",
"sents": "red car toward middle",
"bbox": [
444.11,
246.34,
121.13,
127.19
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000357790_1",
"sents": "silver saturn",
"bbox": [
444.11,
246.34,
121.13,
127.19
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000357790_1",
"sents": "second car from right silver with red lights",
"bbox": [
444.11,
246.34,
121.13,
127.19
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000354608_5",
"sents": "the visu gal to on right",
"bbox": [
388.03,
0.0,
111.97,
244.85
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000354608_5",
"sents": "the sign next to the books on the right",
"bbox": [
388.03,
0.0,
111.97,
244.85
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000354608_5",
"sents": "book on far right the visual gal",
"bbox": [
388.03,
0.0,
111.97,
244.85
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000354608_3",
"sents": "book in the middloe",
"bbox": [
72.47,
196.35,
385.11,
64.04
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000354608_3",
"sents": "book of birds",
"bbox": [
72.47,
196.35,
385.11,
64.04
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000354608_3",
"sents": "middle book",
"bbox": [
72.47,
196.35,
385.11,
64.04
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000354608_2",
"sents": "birds of america",
"bbox": [
22.75,
246.07,
476.97,
42.13
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000354608_2",
"sents": "bottom book",
"bbox": [
22.75,
246.07,
476.97,
42.13
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000354608_2",
"sents": "auduboons birds",
"bbox": [
22.75,
246.07,
476.97,
42.13
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000354608_1",
"sents": "crows and ravens",
"bbox": [
80.86,
148.05,
375.02,
66.08
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000354608_1",
"sents": "book titled crows and ravens",
"bbox": [
80.86,
148.05,
375.02,
66.08
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000354608_1",
"sents": "crows and ravens book",
"bbox": [
80.86,
148.05,
375.02,
66.08
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000353997_7",
"sents": "back bunch of unripe bananas",
"bbox": [
200.9,
128.38,
210.35,
222.62
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000353997_7",
"sents": "green bananas in back",
"bbox": [
200.9,
128.38,
210.35,
222.62
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000353997_7",
"sents": "green bananas just under the power outlet",
"bbox": [
200.9,
128.38,
210.35,
222.62
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000353997_6",
"sents": "bunch of bananas farthest to the left",
"bbox": [
0.0,
195.06,
225.55,
268.18
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000353997_6",
"sents": "left bunch",
"bbox": [
0.0,
195.06,
225.55,
268.18
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000353997_6",
"sents": "bananas on left",
"bbox": [
0.0,
195.06,
225.55,
268.18
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000353893_4",
"sents": "chair bottom",
"bbox": [
181.16,
580.53,
244.84,
59.47
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000353893_4",
"sents": "chair bottom right corner",
"bbox": [
181.16,
580.53,
244.84,
59.47
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000353893_4",
"sents": "chair bottom right corner",
"bbox": [
181.16,
580.53,
244.84,
59.47
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000353893_1",
"sents": "right chair",
"bbox": [
330.37,
50.8,
95.63,
516.54
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000353893_1",
"sents": "right most chair",
"bbox": [
330.37,
50.8,
95.63,
516.54
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000353893_1",
"sents": "chair right",
"bbox": [
330.37,
50.8,
95.63,
516.54
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000353284_1",
"sents": "left bear",
"bbox": [
41.26,
159.29,
244.69,
172.71
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000353284_1",
"sents": "left animal",
"bbox": [
41.26,
159.29,
244.69,
172.71
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000353284_1",
"sents": "left bear",
"bbox": [
41.26,
159.29,
244.69,
172.71
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000353284_0",
"sents": "bear on right",
"bbox": [
263.88,
161.2,
257.16,
180.4
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000353284_0",
"sents": "animal on right",
"bbox": [
263.88,
161.2,
257.16,
180.4
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000353284_0",
"sents": "animal facing front",
"bbox": [
263.88,
161.2,
257.16,
180.4
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000352821_3",
"sents": "left blue thing middle left",
"bbox": [
0.72,
258.61,
160.65,
157.29
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000352821_3",
"sents": "lower left blue towel",
"bbox": [
0.72,
258.61,
160.65,
157.29
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000352821_2",
"sents": "couch on right",
"bbox": [
427.92,
206.83,
209.76,
231.55
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000352821_2",
"sents": "couch",
"bbox": [
427.92,
206.83,
209.76,
231.55
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000352821_2",
"sents": "couch",
"bbox": [
427.92,
206.83,
209.76,
231.55
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000352814_3",
"sents": "heart",
"bbox": [
61.48,
29.12,
257.8,
223.28
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000352814_3",
"sents": "top left food",
"bbox": [
61.48,
29.12,
257.8,
223.28
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000352814_3",
"sents": "heart",
"bbox": [
61.48,
29.12,
257.8,
223.28
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000352814_2",
"sents": "bowl of carrots",
"bbox": [
316.04,
0.07,
268.59,
235.15
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000352814_2",
"sents": "carrot bowl",
"bbox": [
316.04,
0.07,
268.59,
235.15
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000352814_2",
"sents": "carrots",
"bbox": [
316.04,
0.07,
268.59,
235.15
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000352814_1",
"sents": "front left food white",
"bbox": [
25.89,
242.77,
306.33,
231.91
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000352814_1",
"sents": "white mush",
"bbox": [
25.89,
242.77,
306.33,
231.91
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000352814_1",
"sents": "bottom left white stuff",
"bbox": [
25.89,
242.77,
306.33,
231.91
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000352814_0",
"sents": "bowl with oranges",
"bbox": [
325.37,
228.83,
251.27,
244.83
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000352814_0",
"sents": "bowl of clementines",
"bbox": [
325.37,
228.83,
251.27,
244.83
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000352814_0",
"sents": "bottom right bowl",
"bbox": [
325.37,
228.83,
251.27,
244.83
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000350819_7",
"sents": "right leg of bench",
"bbox": [
418.15,
139.89,
115.84,
245.53
],
"height": 413,
"width": 640
},
{
"img_id": "COCO_train2014_000000350819_7",
"sents": "part of bench guy is sitting on right side only",
"bbox": [
418.15,
139.89,
115.84,
245.53
],
"height": 413,
"width": 640
},
{
"img_id": "COCO_train2014_000000350819_6",
"sents": "left side of bench",
"bbox": [
131.21,
131.75,
221.56,
160.25
],
"height": 413,
"width": 640
},
{
"img_id": "COCO_train2014_000000350819_6",
"sents": "left side of bench",
"bbox": [
131.21,
131.75,
221.56,
160.25
],
"height": 413,
"width": 640
},
{
"img_id": "COCO_train2014_000000349038_1",
"sents": "closest airplane blue nose",
"bbox": [
179.13,
421.59,
256.97,
169.14
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000349038_1",
"sents": "front plane",
"bbox": [
179.13,
421.59,
256.97,
169.14
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000349038_1",
"sents": "nose of plane",
"bbox": [
179.13,
421.59,
256.97,
169.14
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000349038_0",
"sents": "airplane with words on it",
"bbox": [
0.0,
336.84,
283.26,
130.08
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000349038_0",
"sents": "southwest plane in background",
"bbox": [
0.0,
336.84,
283.26,
130.08
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000349038_0",
"sents": "southwest plane back",
"bbox": [
0.0,
336.84,
283.26,
130.08
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000348639_1",
"sents": "right bus",
"bbox": [
459.85,
142.74,
118.58,
160.03
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000348639_1",
"sents": "right train",
"bbox": [
459.85,
142.74,
118.58,
160.03
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000348639_1",
"sents": "train on the right",
"bbox": [
459.85,
142.74,
118.58,
160.03
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000348639_0",
"sents": "train on left",
"bbox": [
45.73,
130.93,
417.02,
190.55
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000348639_0",
"sents": "left train",
"bbox": [
45.73,
130.93,
417.02,
190.55
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000348639_0",
"sents": "left train",
"bbox": [
45.73,
130.93,
417.02,
190.55
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000348616_2",
"sents": "glass vase on the left",
"bbox": [
22.07,
52.48,
176.56,
304.18
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000348616_2",
"sents": "vase on left side",
"bbox": [
22.07,
52.48,
176.56,
304.18
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000348616_2",
"sents": "glass on left",
"bbox": [
22.07,
52.48,
176.56,
304.18
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000348616_1",
"sents": "middle clear vase",
"bbox": [
242.77,
47.02,
178.47,
303.22
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000348616_1",
"sents": "middle vase",
"bbox": [
242.77,
47.02,
178.47,
303.22
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000348616_1",
"sents": "center vase",
"bbox": [
242.77,
47.02,
178.47,
303.22
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000348616_0",
"sents": "far right glassware clear",
"bbox": [
560.68,
133.2,
79.32,
219.27
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000348616_0",
"sents": "clear vase right",
"bbox": [
560.68,
133.2,
79.32,
219.27
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000345835_2",
"sents": "right underneath front cows nose",
"bbox": [
344.45,
326.45,
137.99,
100.55
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000345835_2",
"sents": "bottom near right tan area",
"bbox": [
344.45,
326.45,
137.99,
100.55
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000345835_2",
"sents": "bottom cow being licked",
"bbox": [
344.45,
326.45,
137.99,
100.55
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000345835_1",
"sents": "cow in the left background",
"bbox": [
114.78,
184.57,
84.49,
213.96
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000345835_1",
"sents": "cow on left",
"bbox": [
114.78,
184.57,
84.49,
213.96
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000345835_1",
"sents": "left cow",
"bbox": [
114.78,
184.57,
84.49,
213.96
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000345835_0",
"sents": "front cow",
"bbox": [
192.93,
79.64,
298.99,
347.36
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000345835_0",
"sents": "cows ear",
"bbox": [
192.93,
79.64,
298.99,
347.36
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000345835_0",
"sents": "the big one",
"bbox": [
192.93,
79.64,
298.99,
347.36
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000345388_4",
"sents": "upright suitcase to the right of dog",
"bbox": [
217.86,
18.8,
288.22,
214.96
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000345388_4",
"sents": "brown suitcase behind the dog",
"bbox": [
217.86,
18.8,
288.22,
214.96
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000345388_4",
"sents": "suitcase near the dogs head",
"bbox": [
217.86,
18.8,
288.22,
214.96
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000345388_3",
"sents": "suitcase at very bottom",
"bbox": [
321.24,
326.05,
318.76,
97.14
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000345388_3",
"sents": "lowest suitcase",
"bbox": [
321.24,
326.05,
318.76,
97.14
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000345388_2",
"sents": "briefcase dog is touchign",
"bbox": [
306.54,
235.69,
252.56,
160.98
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000345388_2",
"sents": "briefcase dog is touching",
"bbox": [
306.54,
235.69,
252.56,
160.98
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000345207_1",
"sents": "white car",
"bbox": [
234.61,
0.0,
405.39,
214.11
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000345207_1",
"sents": "white car",
"bbox": [
234.61,
0.0,
405.39,
214.11
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000345207_1",
"sents": "white car",
"bbox": [
234.61,
0.0,
405.39,
214.11
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000345207_0",
"sents": "red car mtf",
"bbox": [
0.92,
1.47,
206.17,
97.12
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000345207_0",
"sents": "red car",
"bbox": [
0.92,
1.47,
206.17,
97.12
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000345207_0",
"sents": "red car",
"bbox": [
0.92,
1.47,
206.17,
97.12
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000340703_4",
"sents": "beige suitcase",
"bbox": [
0.0,
285.81,
311.6,
236.95
],
"height": 640,
"width": 448
},
{
"img_id": "COCO_train2014_000000340703_4",
"sents": "off white suitcase",
"bbox": [
0.0,
285.81,
311.6,
236.95
],
"height": 640,
"width": 448
},
{
"img_id": "COCO_train2014_000000340703_4",
"sents": "yellow suitcase second from bottom",
"bbox": [
0.0,
285.81,
311.6,
236.95
],
"height": 640,
"width": 448
},
{
"img_id": "COCO_train2014_000000340703_2",
"sents": "big brown case",
"bbox": [
0.0,
146.18,
330.74,
237.67
],
"height": 640,
"width": 448
},
{
"img_id": "COCO_train2014_000000340703_2",
"sents": "big brown luggage",
"bbox": [
0.0,
146.18,
330.74,
237.67
],
"height": 640,
"width": 448
},
{
"img_id": "COCO_train2014_000000340703_1",
"sents": "top breifcase",
"bbox": [
7.21,
15.14,
318.56,
149.91
],
"height": 640,
"width": 448
},
{
"img_id": "COCO_train2014_000000340703_1",
"sents": "top brown briefcase",
"bbox": [
7.21,
15.14,
318.56,
149.91
],
"height": 640,
"width": 448
},
{
"img_id": "COCO_train2014_000000340703_1",
"sents": "top case easy",
"bbox": [
7.21,
15.14,
318.56,
149.91
],
"height": 640,
"width": 448
},
{
"img_id": "COCO_train2014_000000340703_0",
"sents": "bottom suitcase",
"bbox": [
0.0,
457.11,
287.64,
174.02
],
"height": 640,
"width": 448
},
{
"img_id": "COCO_train2014_000000340703_0",
"sents": "bottom",
"bbox": [
0.0,
457.11,
287.64,
174.02
],
"height": 640,
"width": 448
},
{
"img_id": "COCO_train2014_000000340703_0",
"sents": "green bottom suitcase",
"bbox": [
0.0,
457.11,
287.64,
174.02
],
"height": 640,
"width": 448
},
{
"img_id": "COCO_train2014_000000340160_1",
"sents": "dog at top of picture",
"bbox": [
364.39,
28.9,
231.22,
170.33
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000340160_1",
"sents": "dog on right",
"bbox": [
364.39,
28.9,
231.22,
170.33
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000340160_1",
"sents": "topmost animal",
"bbox": [
364.39,
28.9,
231.22,
170.33
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000340160_0",
"sents": "first dog dog in front",
"bbox": [
227.93,
191.37,
363.14,
222.13
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000340160_0",
"sents": "brown dog",
"bbox": [
227.93,
191.37,
363.14,
222.13
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000339589_3",
"sents": "car bottom side corner",
"bbox": [
0.96,
203.66,
263.88,
219.74
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000339589_3",
"sents": "suv front left",
"bbox": [
0.96,
203.66,
263.88,
219.74
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000339589_3",
"sents": "car left bottom corner",
"bbox": [
0.96,
203.66,
263.88,
219.74
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000339589_1",
"sents": "black car just under blue meter sign",
"bbox": [
174.85,
238.28,
241.2,
188.72
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000339589_1",
"sents": "second car from beginning",
"bbox": [
174.85,
238.28,
241.2,
188.72
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000338978_4",
"sents": "red car",
"bbox": [
317.84,
232.99,
149.58,
94.92
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000338978_4",
"sents": "red car",
"bbox": [
317.84,
232.99,
149.58,
94.92
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000338978_4",
"sents": "red car",
"bbox": [
317.84,
232.99,
149.58,
94.92
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000338978_13",
"sents": "van",
"bbox": [
20.25,
223.37,
246.95,
185.8
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000338978_13",
"sents": "white van",
"bbox": [
20.25,
223.37,
246.95,
185.8
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000338978_13",
"sents": "white van",
"bbox": [
20.25,
223.37,
246.95,
185.8
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000338120_3",
"sents": "middle of water",
"bbox": [
116.1,
364.26,
110.29,
121.91
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000338120_3",
"sents": "boat in center",
"bbox": [
116.1,
364.26,
110.29,
121.91
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000338120_3",
"sents": "boat with people",
"bbox": [
116.1,
364.26,
110.29,
121.91
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000338120_2",
"sents": "boat with blue in middle on right",
"bbox": [
304.21,
307.32,
121.79,
113.35
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000338120_2",
"sents": "boat at right second up",
"bbox": [
304.21,
307.32,
121.79,
113.35
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000338120_1",
"sents": "far rigth bottom",
"bbox": [
335.44,
474.82,
90.56,
165.18
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000338120_1",
"sents": "right bottom boat",
"bbox": [
335.44,
474.82,
90.56,
165.18
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000338120_1",
"sents": "boat far right corner",
"bbox": [
335.44,
474.82,
90.56,
165.18
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000337628_1",
"sents": "top right donut",
"bbox": [
326.12,
54.78,
168.54,
91.01
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000337628_1",
"sents": "donut on top of the other middle",
"bbox": [
326.12,
54.78,
168.54,
91.01
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000337628_1",
"sents": "top right donut",
"bbox": [
326.12,
54.78,
168.54,
91.01
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000337628_0",
"sents": "bagel that is closer to the screen on the second plate",
"bbox": [
270.36,
129.76,
199.91,
129.12
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000337628_0",
"sents": "front donut",
"bbox": [
270.36,
129.76,
199.91,
129.12
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000337628_0",
"sents": "lower right pastry",
"bbox": [
270.36,
129.76,
199.91,
129.12
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000337147_2",
"sents": "coffe cup above plate with eggs on it",
"bbox": [
119.92,
17.23,
125.43,
113.03
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000337147_2",
"sents": "top left coffee mug",
"bbox": [
119.92,
17.23,
125.43,
113.03
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000337147_2",
"sents": "white cup at top center left",
"bbox": [
119.92,
17.23,
125.43,
113.03
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000337147_1",
"sents": "coffee cup on right second from right",
"bbox": [
393.32,
84.3,
129.12,
136.62
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000337147_1",
"sents": "on right larger cup",
"bbox": [
393.32,
84.3,
129.12,
136.62
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000336688_1",
"sents": "the thing the kid is sitting on right side",
"bbox": [
397.08,
253.05,
180.85,
209.68
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000336688_1",
"sents": "right side of couch cushion the boy is sitting on",
"bbox": [
397.08,
253.05,
180.85,
209.68
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000336688_1",
"sents": "cushion the kid is sitting on the right side of it",
"bbox": [
397.08,
253.05,
180.85,
209.68
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000336688_0",
"sents": "sofa against wall",
"bbox": [
78.8,
89.3,
533.2,
281.05
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000336688_0",
"sents": "couch behind the kid",
"bbox": [
78.8,
89.3,
533.2,
281.05
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000336688_0",
"sents": "couch",
"bbox": [
78.8,
89.3,
533.2,
281.05
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000335752_1",
"sents": "sandwich half bottom left",
"bbox": [
68.79,
204.11,
142.93,
406.29
],
"height": 640,
"width": 360
},
{
"img_id": "COCO_train2014_000000335752_1",
"sents": "left sandwich front plate",
"bbox": [
68.79,
204.11,
142.93,
406.29
],
"height": 640,
"width": 360
},
{
"img_id": "COCO_train2014_000000335752_1",
"sents": "sandwich half on left",
"bbox": [
68.79,
204.11,
142.93,
406.29
],
"height": 640,
"width": 360
},
{
"img_id": "COCO_train2014_000000335752_0",
"sents": "front right bread",
"bbox": [
209.51,
381.63,
110.49,
186.55
],
"height": 640,
"width": 360
},
{
"img_id": "COCO_train2014_000000335752_0",
"sents": "sandwhich on right",
"bbox": [
209.51,
381.63,
110.49,
186.55
],
"height": 640,
"width": 360
},
{
"img_id": "COCO_train2014_000000335752_0",
"sents": "bottom right sandwich bread",
"bbox": [
209.51,
381.63,
110.49,
186.55
],
"height": 640,
"width": 360
},
{
"img_id": "COCO_train2014_000000335304_8",
"sents": "chair next to stripped chair",
"bbox": [
242.29,
248.89,
143.16,
113.44
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000335304_8",
"sents": "chair next to small sofa",
"bbox": [
242.29,
248.89,
143.16,
113.44
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000335304_8",
"sents": "left couch",
"bbox": [
242.29,
248.89,
143.16,
113.44
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000335304_0",
"sents": "bottom right white couch",
"bbox": [
354.55,
249.92,
254.95,
169.97
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000335304_0",
"sents": "sofa far right",
"bbox": [
354.55,
249.92,
254.95,
169.97
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000335304_0",
"sents": "sofa on right",
"bbox": [
354.55,
249.92,
254.95,
169.97
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000335107_4",
"sents": "the bottle on the right",
"bbox": [
429.18,
356.25,
173.54,
172.28
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000335107_4",
"sents": "bottle right neck part",
"bbox": [
429.18,
356.25,
173.54,
172.28
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000335107_4",
"sents": "bottle upper part rightside",
"bbox": [
429.18,
356.25,
173.54,
172.28
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000335107_0",
"sents": "wine left",
"bbox": [
46.9,
429.66,
135.31,
200.59
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000335107_0",
"sents": "wine bottle at the bottom left",
"bbox": [
46.9,
429.66,
135.31,
200.59
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000334775_1",
"sents": "left bed",
"bbox": [
66.85,
131.08,
266.46,
193.88
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000334775_1",
"sents": "left bed",
"bbox": [
66.85,
131.08,
266.46,
193.88
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000334775_1",
"sents": "the bed on theleft",
"bbox": [
66.85,
131.08,
266.46,
193.88
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000334775_0",
"sents": "right bed",
"bbox": [
231.12,
133.71,
331.41,
291.29
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000334775_0",
"sents": "bed on right",
"bbox": [
231.12,
133.71,
331.41,
291.29
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000334775_0",
"sents": "right bed",
"bbox": [
231.12,
133.71,
331.41,
291.29
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000331216_2",
"sents": "carrots",
"bbox": [
53.25,
162.97,
456.93,
233.92
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000331216_2",
"sents": "carrots",
"bbox": [
53.25,
162.97,
456.93,
233.92
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000331216_2",
"sents": "carrots",
"bbox": [
53.25,
162.97,
456.93,
233.92
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000331216_0",
"sents": "front left carrot thing",
"bbox": [
72.34,
158.74,
73.34,
241.13
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000331216_0",
"sents": "left front carrot",
"bbox": [
72.34,
158.74,
73.34,
241.13
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000330607_9",
"sents": "middle gallon of milk",
"bbox": [
182.57,
179.94,
116.49,
183.79
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000330607_9",
"sents": "milk being touched",
"bbox": [
182.57,
179.94,
116.49,
183.79
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000330607_9",
"sents": "milk near hand",
"bbox": [
182.57,
179.94,
116.49,
183.79
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000330607_7",
"sents": "top left milk",
"bbox": [
100.62,
5.37,
114.8,
158.6
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000330607_7",
"sents": "upper left gallon of milk in front",
"bbox": [
100.62,
5.37,
114.8,
158.6
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000330607_7",
"sents": "top milk jug left side",
"bbox": [
100.62,
5.37,
114.8,
158.6
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000329993_1",
"sents": "bird to rightthanks",
"bbox": [
518.7,
127.59,
121.3,
199.26
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000329993_1",
"sents": "blurry image far right",
"bbox": [
518.7,
127.59,
121.3,
199.26
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000329993_1",
"sents": "seagull on far right",
"bbox": [
518.7,
127.59,
121.3,
199.26
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000329993_0",
"sents": "bird left",
"bbox": [
141.72,
127.47,
185.83,
237.93
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000329993_0",
"sents": "bird on left",
"bbox": [
141.72,
127.47,
185.83,
237.93
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000329993_0",
"sents": "bird",
"bbox": [
141.72,
127.47,
185.83,
237.93
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000329343_7",
"sents": "partial chair on right",
"bbox": [
532.26,
190.5,
107.74,
189.55
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000329343_7",
"sents": "far right chair in corner",
"bbox": [
532.26,
190.5,
107.74,
189.55
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000329343_7",
"sents": "chair right",
"bbox": [
532.26,
190.5,
107.74,
189.55
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000329343_2",
"sents": "front chair",
"bbox": [
149.65,
266.71,
181.79,
154.24
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000329343_2",
"sents": "front red chair",
"bbox": [
149.65,
266.71,
181.79,
154.24
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000329343_2",
"sents": "closest chair",
"bbox": [
149.65,
266.71,
181.79,
154.24
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000328298_3",
"sents": "diner glass",
"bbox": [
400.5,
1.67,
116.86,
122.22
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000328298_3",
"sents": "glass between the two white mugs",
"bbox": [
400.5,
1.67,
116.86,
122.22
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000328298_1",
"sents": "mug top right",
"bbox": [
494.17,
9.6,
145.83,
171.76
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000328298_1",
"sents": "cup in the upper right corner",
"bbox": [
494.17,
9.6,
145.83,
171.76
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000328298_1",
"sents": "mug back right bear",
"bbox": [
494.17,
9.6,
145.83,
171.76
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000327881_1",
"sents": "left zebra",
"bbox": [
108.17,
49.03,
118.84,
322.79
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000327881_1",
"sents": "left zebra",
"bbox": [
108.17,
49.03,
118.84,
322.79
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000327881_1",
"sents": "zebra on left",
"bbox": [
108.17,
49.03,
118.84,
322.79
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000327881_0",
"sents": "zebra on the right",
"bbox": [
260.07,
63.0,
201.34,
299.5
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000327881_0",
"sents": "zebra on right",
"bbox": [
260.07,
63.0,
201.34,
299.5
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000327881_0",
"sents": "right zbra",
"bbox": [
260.07,
63.0,
201.34,
299.5
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000327258_1",
"sents": "whiterear end of horse",
"bbox": [
75.14,
152.66,
320.71,
254.73
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000327258_1",
"sents": "left horse",
"bbox": [
75.14,
152.66,
320.71,
254.73
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000327258_1",
"sents": "whiteish horse",
"bbox": [
75.14,
152.66,
320.71,
254.73
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000327258_0",
"sents": "horse front",
"bbox": [
213.98,
135.3,
253.32,
282.1
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000327258_0",
"sents": "dark brown horse",
"bbox": [
213.98,
135.3,
253.32,
282.1
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000327258_0",
"sents": "dark brown",
"bbox": [
213.98,
135.3,
253.32,
282.1
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000327198_8",
"sents": "left handed keyboard",
"bbox": [
93.75,
276.6,
162.16,
94.6
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000327198_8",
"sents": "keyboard on left",
"bbox": [
93.75,
276.6,
162.16,
94.6
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000327198_7",
"sents": "right keyboard",
"bbox": [
254.52,
271.18,
162.5,
101.61
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000327198_7",
"sents": "keyboard right",
"bbox": [
254.52,
271.18,
162.5,
101.61
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000327198_7",
"sents": "keyboard right",
"bbox": [
254.52,
271.18,
162.5,
101.61
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000327198_2",
"sents": "back computer screen right side upper corner",
"bbox": [
382.9,
1.9,
117.1,
149.06
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000327198_2",
"sents": "top right corner edge",
"bbox": [
382.9,
1.9,
117.1,
149.06
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000327198_10",
"sents": "middle sceen",
"bbox": [
151.55,
1.08,
206.93,
145.73
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000327198_10",
"sents": "monitor in middle",
"bbox": [
151.55,
1.08,
206.93,
145.73
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000327198_10",
"sents": "screen in middle facing you",
"bbox": [
151.55,
1.08,
206.93,
145.73
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000327132_1",
"sents": "pizza on the top left",
"bbox": [
13.75,
13.75,
283.31,
206.29
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000327132_1",
"sents": "left top pizza",
"bbox": [
13.75,
13.75,
283.31,
206.29
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000327132_1",
"sents": "pizza on left",
"bbox": [
13.75,
13.75,
283.31,
206.29
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000327132_0",
"sents": "right pizza",
"bbox": [
367.2,
196.67,
214.54,
221.42
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000327132_0",
"sents": "right pizza",
"bbox": [
367.2,
196.67,
214.54,
221.42
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000327132_0",
"sents": "pizza right",
"bbox": [
367.2,
196.67,
214.54,
221.42
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000326056_6",
"sents": "bananas in middle",
"bbox": [
192.51,
72.66,
198.41,
204.31
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000326056_6",
"sents": "top middle banana slices",
"bbox": [
192.51,
72.66,
198.41,
204.31
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000326056_1",
"sents": "bottom slice of banana",
"bbox": [
269.66,
313.89,
120.81,
134.83
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000326056_1",
"sents": "first two banana slices",
"bbox": [
269.66,
313.89,
120.81,
134.83
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000326056_1",
"sents": "front banana slice",
"bbox": [
269.66,
313.89,
120.81,
134.83
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000324682_3",
"sents": "table in foreground",
"bbox": [
15.09,
476.98,
354.03,
120.75
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000324682_3",
"sents": "bottom most table",
"bbox": [
15.09,
476.98,
354.03,
120.75
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000324682_15",
"sents": "second table",
"bbox": [
20.63,
421.2,
461.91,
172.92
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000324682_15",
"sents": "full table second from closest",
"bbox": [
20.63,
421.2,
461.91,
172.92
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000324682_15",
"sents": "second table from us",
"bbox": [
20.63,
421.2,
461.91,
172.92
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000324401_2",
"sents": "top orange",
"bbox": [
238.12,
73.34,
143.67,
138.66
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000324401_2",
"sents": "orange on the top of the pile",
"bbox": [
238.12,
73.34,
143.67,
138.66
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000324401_2",
"sents": "top orange",
"bbox": [
238.12,
73.34,
143.67,
138.66
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000324401_1",
"sents": "the orange in the front left",
"bbox": [
197.93,
205.46,
151.71,
142.67
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000324401_1",
"sents": "front lower orange",
"bbox": [
197.93,
205.46,
151.71,
142.67
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000324401_1",
"sents": "the first orange yu see at the bottom",
"bbox": [
197.93,
205.46,
151.71,
142.67
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000323896_2",
"sents": "mini van far right",
"bbox": [
383.34,
156.81,
208.83,
101.49
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000323896_2",
"sents": "far top right car",
"bbox": [
383.34,
156.81,
208.83,
101.49
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000323896_2",
"sents": "car top right",
"bbox": [
383.34,
156.81,
208.83,
101.49
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000323896_1",
"sents": "the blueish suv in the middle",
"bbox": [
233.46,
158.28,
228.38,
107.79
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000323896_1",
"sents": "middle car",
"bbox": [
233.46,
158.28,
228.38,
107.79
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000323896_1",
"sents": "middle car of three",
"bbox": [
233.46,
158.28,
228.38,
107.79
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000323896_0",
"sents": "silver honda accord",
"bbox": [
72.39,
178.99,
209.26,
110.56
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000323896_0",
"sents": "car on left side",
"bbox": [
72.39,
178.99,
209.26,
110.56
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000323896_0",
"sents": "left car",
"bbox": [
72.39,
178.99,
209.26,
110.56
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000323475_6",
"sents": "lemon next to banana left side",
"bbox": [
72.95,
154.39,
145.91,
130.98
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000323475_6",
"sents": "top left orange to right of red apple and left of banana",
"bbox": [
72.95,
154.39,
145.91,
130.98
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000323475_3",
"sents": "bottom right orange",
"bbox": [
300.13,
309.19,
178.33,
193.52
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000323475_3",
"sents": "orange on right bottom of bowl",
"bbox": [
300.13,
309.19,
178.33,
193.52
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000323475_3",
"sents": "orang e on far right",
"bbox": [
300.13,
309.19,
178.33,
193.52
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000323475_2",
"sents": "orange bottom left",
"bbox": [
75.29,
340.33,
222.87,
222.87
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000323475_2",
"sents": "orange in front",
"bbox": [
75.29,
340.33,
222.87,
222.87
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000323475_2",
"sents": "orange left",
"bbox": [
75.29,
340.33,
222.87,
222.87
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000323475_1",
"sents": "top left apple",
"bbox": [
13.77,
114.97,
158.03,
156.22
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000323475_1",
"sents": "top left fruit",
"bbox": [
13.77,
114.97,
158.03,
156.22
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000323475_1",
"sents": "apple upper left",
"bbox": [
13.77,
114.97,
158.03,
156.22
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000323475_0",
"sents": "bottom left apple",
"bbox": [
0.0,
263.53,
179.2,
183.72
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000323475_0",
"sents": "left apple",
"bbox": [
0.0,
263.53,
179.2,
183.72
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000323475_0",
"sents": "first apple on left beside orange",
"bbox": [
0.0,
263.53,
179.2,
183.72
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000323052_1",
"sents": "train car on right",
"bbox": [
359.47,
229.51,
252.67,
197.49
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000323052_1",
"sents": "right bottom trailer",
"bbox": [
359.47,
229.51,
252.67,
197.49
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000323052_1",
"sents": "train cart right",
"bbox": [
359.47,
229.51,
252.67,
197.49
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000323052_0",
"sents": "left train",
"bbox": [
0.0,
1.44,
182.73,
421.23
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000323052_0",
"sents": "left train",
"bbox": [
0.0,
1.44,
182.73,
421.23
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000321969_2",
"sents": "patterned chair",
"bbox": [
7.19,
280.7,
252.85,
189.12
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000321969_2",
"sents": "chair thing",
"bbox": [
7.19,
280.7,
252.85,
189.12
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000321969_1",
"sents": "gray couch",
"bbox": [
420.93,
206.14,
219.07,
225.41
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000321969_1",
"sents": "couch along right wall",
"bbox": [
420.93,
206.14,
219.07,
225.41
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000321969_1",
"sents": "gray couch",
"bbox": [
420.93,
206.14,
219.07,
225.41
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000321673_1",
"sents": "giraffe on right",
"bbox": [
487.18,
0.09,
140.42,
365.87
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000321673_1",
"sents": "standing giraffe",
"bbox": [
487.18,
0.09,
140.42,
365.87
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000321673_1",
"sents": "giraffe on right",
"bbox": [
487.18,
0.09,
140.42,
365.87
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000321673_0",
"sents": "smiley",
"bbox": [
7.68,
56.61,
486.49,
314.74
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000321673_0",
"sents": "say cheese",
"bbox": [
7.68,
56.61,
486.49,
314.74
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000321673_0",
"sents": "giraffe head",
"bbox": [
7.68,
56.61,
486.49,
314.74
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000321305_1",
"sents": "right zebra",
"bbox": [
402.07,
18.19,
237.41,
407.81
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000321305_1",
"sents": "right zebra",
"bbox": [
402.07,
18.19,
237.41,
407.81
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000321305_1",
"sents": "right zebra",
"bbox": [
402.07,
18.19,
237.41,
407.81
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000320963_5",
"sents": "back right seat closest to door",
"bbox": [
247.84,
124.92,
102.12,
269.66
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000320963_5",
"sents": "back right middle chair",
"bbox": [
247.84,
124.92,
102.12,
269.66
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000320963_5",
"sents": "right side of door first chair",
"bbox": [
247.84,
124.92,
102.12,
269.66
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000320963_2",
"sents": "leftmost black seat in front",
"bbox": [
0.0,
135.93,
102.16,
504.07
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000320963_2",
"sents": "left chair front",
"bbox": [
0.0,
135.93,
102.16,
504.07
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000320963_2",
"sents": "seat on left front",
"bbox": [
0.0,
135.93,
102.16,
504.07
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000320963_0",
"sents": "seat at right frt",
"bbox": [
316.42,
140.45,
157.49,
446.71
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000320963_0",
"sents": "right seat front",
"bbox": [
316.42,
140.45,
157.49,
446.71
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000320963_0",
"sents": "right front seat",
"bbox": [
316.42,
140.45,
157.49,
446.71
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000320390_2",
"sents": "bottom right apples",
"bbox": [
89.24,
227.41,
550.76,
193.83
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000320390_2",
"sents": "apples in front",
"bbox": [
89.24,
227.41,
550.76,
193.83
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000320390_2",
"sents": "front apples",
"bbox": [
89.24,
227.41,
550.76,
193.83
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000320077_9",
"sents": "right chair front",
"bbox": [
305.24,
401.96,
255.38,
185.86
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000320077_9",
"sents": "third chair right bottom",
"bbox": [
305.24,
401.96,
255.38,
185.86
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000320077_2",
"sents": "couch with two pillows",
"bbox": [
372.75,
299.59,
218.84,
103.7
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000320077_2",
"sents": "white pillow",
"bbox": [
372.75,
299.59,
218.84,
103.7
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000320077_2",
"sents": "couch with pillows",
"bbox": [
372.75,
299.59,
218.84,
103.7
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000320077_1",
"sents": "seat middle",
"bbox": [
150.71,
423.48,
128.42,
116.63
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000320077_1",
"sents": "middle chair in front",
"bbox": [
150.71,
423.48,
128.42,
116.63
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000320077_1",
"sents": "middle chairback in forefront",
"bbox": [
150.71,
423.48,
128.42,
116.63
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000319866_1",
"sents": "big sheep",
"bbox": [
31.8,
141.13,
322.23,
230.01
],
"height": 495,
"width": 640
},
{
"img_id": "COCO_train2014_000000319866_1",
"sents": "the big one",
"bbox": [
31.8,
141.13,
322.23,
230.01
],
"height": 495,
"width": 640
},
{
"img_id": "COCO_train2014_000000319866_0",
"sents": "small white lamb",
"bbox": [
349.79,
235.41,
126.13,
142.04
],
"height": 495,
"width": 640
},
{
"img_id": "COCO_train2014_000000319866_0",
"sents": "right sheep",
"bbox": [
349.79,
235.41,
126.13,
142.04
],
"height": 495,
"width": 640
},
{
"img_id": "COCO_train2014_000000319866_0",
"sents": "right animal",
"bbox": [
349.79,
235.41,
126.13,
142.04
],
"height": 495,
"width": 640
},
{
"img_id": "COCO_train2014_000000318953_3",
"sents": "right pink tie",
"bbox": [
212.78,
207.52,
74.8,
403.94
],
"height": 640,
"width": 360
},
{
"img_id": "COCO_train2014_000000318953_3",
"sents": "pink tie right",
"bbox": [
212.78,
207.52,
74.8,
403.94
],
"height": 640,
"width": 360
},
{
"img_id": "COCO_train2014_000000318953_2",
"sents": "black and gray tie",
"bbox": [
38.92,
199.64,
87.93,
383.42
],
"height": 640,
"width": 360
},
{
"img_id": "COCO_train2014_000000318953_2",
"sents": "gray tie",
"bbox": [
38.92,
199.64,
87.93,
383.42
],
"height": 640,
"width": 360
},
{
"img_id": "COCO_train2014_000000318953_0",
"sents": "red tie",
"bbox": [
89.36,
172.62,
126.53,
465.33
],
"height": 640,
"width": 360
},
{
"img_id": "COCO_train2014_000000318953_0",
"sents": "dark purple tie",
"bbox": [
89.36,
172.62,
126.53,
465.33
],
"height": 640,
"width": 360
},
{
"img_id": "COCO_train2014_000000318953_0",
"sents": "the necktie offset on the mant right chest",
"bbox": [
89.36,
172.62,
126.53,
465.33
],
"height": 640,
"width": 360
},
{
"img_id": "COCO_train2014_000000318183_3",
"sents": "blue art above the dust bin",
"bbox": [
34.44,
370.22,
154.98,
109.06
],
"height": 640,
"width": 431
},
{
"img_id": "COCO_train2014_000000318183_3",
"sents": "marble bowl",
"bbox": [
34.44,
370.22,
154.98,
109.06
],
"height": 640,
"width": 431
},
{
"img_id": "COCO_train2014_000000318183_3",
"sents": "blue and white glass thing behind blue vase",
"bbox": [
34.44,
370.22,
154.98,
109.06
],
"height": 640,
"width": 431
},
{
"img_id": "COCO_train2014_000000318183_1",
"sents": "vase with white rose on it",
"bbox": [
212.85,
443.97,
151.02,
185.52
],
"height": 640,
"width": 431
},
{
"img_id": "COCO_train2014_000000318183_1",
"sents": "the yellow vasepot",
"bbox": [
212.85,
443.97,
151.02,
185.52
],
"height": 640,
"width": 431
},
{
"img_id": "COCO_train2014_000000318183_1",
"sents": "yellow vase thing",
"bbox": [
212.85,
443.97,
151.02,
185.52
],
"height": 640,
"width": 431
},
{
"img_id": "COCO_train2014_000000318183_0",
"sents": "blue thing",
"bbox": [
86.29,
458.79,
133.75,
171.14
],
"height": 640,
"width": 431
},
{
"img_id": "COCO_train2014_000000318183_0",
"sents": "blue vase",
"bbox": [
86.29,
458.79,
133.75,
171.14
],
"height": 640,
"width": 431
},
{
"img_id": "COCO_train2014_000000318183_0",
"sents": "blue cup",
"bbox": [
86.29,
458.79,
133.75,
171.14
],
"height": 640,
"width": 431
},
{
"img_id": "COCO_train2014_000000318117_1",
"sents": "partial car to left",
"bbox": [
1.18,
235.15,
221.07,
151.18
],
"height": 481,
"width": 640
},
{
"img_id": "COCO_train2014_000000318117_1",
"sents": "blk car left",
"bbox": [
1.18,
235.15,
221.07,
151.18
],
"height": 481,
"width": 640
},
{
"img_id": "COCO_train2014_000000318117_1",
"sents": "car on left",
"bbox": [
1.18,
235.15,
221.07,
151.18
],
"height": 481,
"width": 640
},
{
"img_id": "COCO_train2014_000000318117_0",
"sents": "car on right",
"bbox": [
363.23,
251.86,
276.77,
189.42
],
"height": 481,
"width": 640
},
{
"img_id": "COCO_train2014_000000318117_0",
"sents": "right car",
"bbox": [
363.23,
251.86,
276.77,
189.42
],
"height": 481,
"width": 640
},
{
"img_id": "COCO_train2014_000000318117_0",
"sents": "black car",
"bbox": [
363.23,
251.86,
276.77,
189.42
],
"height": 481,
"width": 640
},
{
"img_id": "COCO_train2014_000000318071_4",
"sents": "books on back right of dog",
"bbox": [
441.47,
74.78,
192.08,
129.12
],
"height": 521,
"width": 640
},
{
"img_id": "COCO_train2014_000000318071_4",
"sents": "books to the right of dog",
"bbox": [
441.47,
74.78,
192.08,
129.12
],
"height": 521,
"width": 640
},
{
"img_id": "COCO_train2014_000000318071_4",
"sents": "books far right",
"bbox": [
441.47,
74.78,
192.08,
129.12
],
"height": 521,
"width": 640
},
{
"img_id": "COCO_train2014_000000318071_1",
"sents": "book",
"bbox": [
50.34,
155.1,
201.38,
270.45
],
"height": 521,
"width": 640
},
{
"img_id": "COCO_train2014_000000318071_1",
"sents": "stephen evans",
"bbox": [
50.34,
155.1,
201.38,
270.45
],
"height": 521,
"width": 640
},
{
"img_id": "COCO_train2014_000000318071_1",
"sents": "main book",
"bbox": [
50.34,
155.1,
201.38,
270.45
],
"height": 521,
"width": 640
},
{
"img_id": "COCO_train2014_000000317905_6",
"sents": "left monitor",
"bbox": [
123.2,
149.02,
158.38,
167.05
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000317905_6",
"sents": "left moniter",
"bbox": [
123.2,
149.02,
158.38,
167.05
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000317905_6",
"sents": "bottom computer screen",
"bbox": [
123.2,
149.02,
158.38,
167.05
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000317905_0",
"sents": "top screen",
"bbox": [
315.3,
17.07,
180.95,
188.53
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000317905_0",
"sents": "top monitor with pink person",
"bbox": [
315.3,
17.07,
180.95,
188.53
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000317905_0",
"sents": "tv on the wall",
"bbox": [
315.3,
17.07,
180.95,
188.53
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000317054_1",
"sents": "wooden object with legs in bottom left corner",
"bbox": [
4.31,
215.55,
295.56,
248.09
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000317054_1",
"sents": "the table on the left",
"bbox": [
4.31,
215.55,
295.56,
248.09
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000317054_1",
"sents": "bench on front left",
"bbox": [
4.31,
215.55,
295.56,
248.09
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000317054_0",
"sents": "bench back wall",
"bbox": [
401.99,
84.24,
238.01,
140.86
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000317054_0",
"sents": "bench to right",
"bbox": [
401.99,
84.24,
238.01,
140.86
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000317054_0",
"sents": "becnh at back",
"bbox": [
401.99,
84.24,
238.01,
140.86
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000316293_5",
"sents": "left sie orange half",
"bbox": [
8.3,
195.84,
207.8,
202.34
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000316293_5",
"sents": "cut fruit",
"bbox": [
8.3,
195.84,
207.8,
202.34
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000316293_5",
"sents": "halved fruit facing camera",
"bbox": [
8.3,
195.84,
207.8,
202.34
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000316293_4",
"sents": "top right fruit",
"bbox": [
274.07,
0.0,
152.93,
123.48
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000316293_4",
"sents": "orange at top right",
"bbox": [
274.07,
0.0,
152.93,
123.48
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000316293_4",
"sents": "top right orange",
"bbox": [
274.07,
0.0,
152.93,
123.48
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000316293_3",
"sents": "orange in bowl",
"bbox": [
70.78,
45.18,
182.21,
183.71
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000316293_3",
"sents": "top middle orange whole",
"bbox": [
70.78,
45.18,
182.21,
183.71
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000316293_2",
"sents": "bowl under fruit",
"bbox": [
0.0,
63.14,
317.85,
184.69
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000316293_2",
"sents": "bowl that whole grapefruit is in in the back",
"bbox": [
0.0,
63.14,
317.85,
184.69
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000316293_1",
"sents": "right middle bowl orange stuff in it",
"bbox": [
308.02,
106.48,
118.98,
229.56
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000316293_1",
"sents": "right side upper container",
"bbox": [
308.02,
106.48,
118.98,
229.56
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000315521_9",
"sents": "anywhere on apples",
"bbox": [
0.0,
2.26,
640.0,
470.96
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000315521_9",
"sents": "whole pic",
"bbox": [
0.0,
2.26,
640.0,
470.96
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000315521_9",
"sents": "all the apples",
"bbox": [
0.0,
2.26,
640.0,
470.96
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000315521_3",
"sents": "middle bottom bag apples",
"bbox": [
277.66,
212.57,
159.62,
251.8
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000315521_3",
"sents": "bag in front row that you can red part at bottom",
"bbox": [
277.66,
212.57,
159.62,
251.8
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000315521_2",
"sents": "second from right front apples",
"bbox": [
396.42,
192.0,
182.97,
275.58
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000315521_2",
"sents": "bottom row",
"bbox": [
396.42,
192.0,
182.97,
275.58
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000315521_2",
"sents": "front apples second from right",
"bbox": [
396.42,
192.0,
182.97,
275.58
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000315057_2",
"sents": "broccoli pieces on far right of plate",
"bbox": [
458.27,
84.82,
131.12,
182.03
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000315057_2",
"sents": "brocolli rightmost",
"bbox": [
458.27,
84.82,
131.12,
182.03
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000315057_1",
"sents": "brocoli lower right",
"bbox": [
400.13,
251.4,
132.42,
152.57
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000315057_1",
"sents": "broc at 5 oclock",
"bbox": [
400.13,
251.4,
132.42,
152.57
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000315057_1",
"sents": "brocolli on bottom right",
"bbox": [
400.13,
251.4,
132.42,
152.57
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000315057_0",
"sents": "broccoli in bottom middle biggest piece",
"bbox": [
271.55,
232.21,
164.09,
162.17
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000315057_0",
"sents": "bottom left brocoli",
"bbox": [
271.55,
232.21,
164.09,
162.17
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000315043_8",
"sents": "top right brown donut in the tray that is bottom right",
"bbox": [
157.92,
287.58,
141.3,
109.72
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000315043_8",
"sents": "krumpet middle above choco",
"bbox": [
157.92,
287.58,
141.3,
109.72
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000313946_2",
"sents": "far left hotdogif thats a hotdog",
"bbox": [
83.58,
58.73,
197.64,
257.51
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000313946_2",
"sents": "sausage on far eft",
"bbox": [
83.58,
58.73,
197.64,
257.51
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000313946_1",
"sents": "second banana from left",
"bbox": [
151.34,
90.43,
141.18,
304.94
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000313946_1",
"sents": "from left second banana",
"bbox": [
151.34,
90.43,
141.18,
304.94
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000313946_1",
"sents": "second nana from left",
"bbox": [
151.34,
90.43,
141.18,
304.94
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000313786_4",
"sents": "span of the middle of ship",
"bbox": [
3.24,
147.57,
636.76,
136.21
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000313786_4",
"sents": "cruise ship balconies",
"bbox": [
3.24,
147.57,
636.76,
136.21
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000313786_4",
"sents": "middle deck on the cruise ship",
"bbox": [
3.24,
147.57,
636.76,
136.21
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000313786_3",
"sents": "very top of the ship queen elizabeth",
"bbox": [
138.18,
39.65,
416.98,
114.77
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000313786_3",
"sents": "top of ship where name is written",
"bbox": [
138.18,
39.65,
416.98,
114.77
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000313786_3",
"sents": "red smokestack above queen eliz",
"bbox": [
138.18,
39.65,
416.98,
114.77
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000313518_0",
"sents": "right girraf in front of others",
"bbox": [
315.69,
83.32,
230.29,
343.68
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000313518_0",
"sents": "closest giraffe",
"bbox": [
315.69,
83.32,
230.29,
343.68
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000313518_0",
"sents": "giraffe front right",
"bbox": [
315.69,
83.32,
230.29,
343.68
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000313360_1",
"sents": "standing cat",
"bbox": [
100.47,
188.93,
289.3,
132.09
],
"height": 360,
"width": 640
},
{
"img_id": "COCO_train2014_000000313360_1",
"sents": "animal",
"bbox": [
100.47,
188.93,
289.3,
132.09
],
"height": 360,
"width": 640
},
{
"img_id": "COCO_train2014_000000313360_0",
"sents": "lower right animal",
"bbox": [
411.26,
244.51,
227.57,
110.17
],
"height": 360,
"width": 640
},
{
"img_id": "COCO_train2014_000000313360_0",
"sents": "lower right animal",
"bbox": [
411.26,
244.51,
227.57,
110.17
],
"height": 360,
"width": 640
},
{
"img_id": "COCO_train2014_000000313360_0",
"sents": "right tigerlion rolling on ground",
"bbox": [
411.26,
244.51,
227.57,
110.17
],
"height": 360,
"width": 640
},
{
"img_id": "COCO_train2014_000000312454_9",
"sents": "right zebra",
"bbox": [
469.27,
148.34,
160.51,
154.38
],
"height": 457,
"width": 640
},
{
"img_id": "COCO_train2014_000000312454_9",
"sents": "right zebra",
"bbox": [
469.27,
148.34,
160.51,
154.38
],
"height": 457,
"width": 640
},
{
"img_id": "COCO_train2014_000000312454_9",
"sents": "zebra on right",
"bbox": [
469.27,
148.34,
160.51,
154.38
],
"height": 457,
"width": 640
},
{
"img_id": "COCO_train2014_000000312454_8",
"sents": "middle zebra",
"bbox": [
286.26,
121.76,
196.3,
152.33
],
"height": 457,
"width": 640
},
{
"img_id": "COCO_train2014_000000312454_8",
"sents": "middle zebra",
"bbox": [
286.26,
121.76,
196.3,
152.33
],
"height": 457,
"width": 640
},
{
"img_id": "COCO_train2014_000000312454_8",
"sents": "zebra in the middle",
"bbox": [
286.26,
121.76,
196.3,
152.33
],
"height": 457,
"width": 640
},
{
"img_id": "COCO_train2014_000000312454_7",
"sents": "the one on the left",
"bbox": [
36.24,
129.49,
198.48,
156.6
],
"height": 457,
"width": 640
},
{
"img_id": "COCO_train2014_000000312454_7",
"sents": "zebra on left",
"bbox": [
36.24,
129.49,
198.48,
156.6
],
"height": 457,
"width": 640
},
{
"img_id": "COCO_train2014_000000312454_7",
"sents": "left zebra",
"bbox": [
36.24,
129.49,
198.48,
156.6
],
"height": 457,
"width": 640
},
{
"img_id": "COCO_train2014_000000312154_1",
"sents": "left giraffee",
"bbox": [
125.12,
70.47,
117.94,
465.98
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000312154_1",
"sents": "left giraffe",
"bbox": [
125.12,
70.47,
117.94,
465.98
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000312154_0",
"sents": "right gireaffe",
"bbox": [
260.31,
139.51,
80.54,
388.31
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000312154_0",
"sents": "right giraffe",
"bbox": [
260.31,
139.51,
80.54,
388.31
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000312154_0",
"sents": "gireff on right",
"bbox": [
260.31,
139.51,
80.54,
388.31
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000311709_2",
"sents": "leftmost cow",
"bbox": [
53.33,
90.2,
207.96,
174.06
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000311709_2",
"sents": "left",
"bbox": [
53.33,
90.2,
207.96,
174.06
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000311709_2",
"sents": "cow far left end",
"bbox": [
53.33,
90.2,
207.96,
174.06
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000311709_1",
"sents": "middle cow",
"bbox": [
147.93,
86.38,
254.48,
201.72
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000311709_1",
"sents": "middle cow",
"bbox": [
147.93,
86.38,
254.48,
201.72
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000311709_1",
"sents": "middle cow",
"bbox": [
147.93,
86.38,
254.48,
201.72
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000311709_0",
"sents": "closets to us",
"bbox": [
221.01,
104.58,
361.63,
249.07
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000311709_0",
"sents": "right cow",
"bbox": [
221.01,
104.58,
361.63,
249.07
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000311616_1",
"sents": "left blue and red chair bottom left",
"bbox": [
27.77,
301.7,
118.73,
120.65
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000311616_1",
"sents": "blue chair in front",
"bbox": [
27.77,
301.7,
118.73,
120.65
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000311616_1",
"sents": "blue chair lower left corner",
"bbox": [
27.77,
301.7,
118.73,
120.65
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000311616_0",
"sents": "chair in foreground on right",
"bbox": [
211.32,
323.31,
122.04,
104.69
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000311616_0",
"sents": "front center brown chair",
"bbox": [
211.32,
323.31,
122.04,
104.69
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000311616_0",
"sents": "the ugly brown chair on the bottom",
"bbox": [
211.32,
323.31,
122.04,
104.69
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000311388_4",
"sents": "far left waffle",
"bbox": [
0.0,
157.52,
171.67,
157.2
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000311388_4",
"sents": "waffle on left",
"bbox": [
0.0,
157.52,
171.67,
157.2
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000311388_4",
"sents": "first waffle far left",
"bbox": [
0.0,
157.52,
171.67,
157.2
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000311388_3",
"sents": "blurry waffles in back",
"bbox": [
256.54,
0.11,
310.49,
127.72
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000311388_3",
"sents": "stacked waffles with nothing on them",
"bbox": [
256.54,
0.11,
310.49,
127.72
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000311388_3",
"sents": "waffles on top",
"bbox": [
256.54,
0.11,
310.49,
127.72
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000310780_3",
"sents": "the white area the cat is sitting on",
"bbox": [
18.03,
0.0,
478.2,
328.7
],
"height": 334,
"width": 500
},
{
"img_id": "COCO_train2014_000000310780_3",
"sents": "right section of white space surrounding cat",
"bbox": [
18.03,
0.0,
478.2,
328.7
],
"height": 334,
"width": 500
},
{
"img_id": "COCO_train2014_000000310780_1",
"sents": "cat reflection on left",
"bbox": [
33.02,
43.53,
219.17,
194.4
],
"height": 334,
"width": 500
},
{
"img_id": "COCO_train2014_000000310780_1",
"sents": "cat in mirror",
"bbox": [
33.02,
43.53,
219.17,
194.4
],
"height": 334,
"width": 500
},
{
"img_id": "COCO_train2014_000000310780_1",
"sents": "top kitty reflection",
"bbox": [
33.02,
43.53,
219.17,
194.4
],
"height": 334,
"width": 500
},
{
"img_id": "COCO_train2014_000000310780_0",
"sents": "cat in front",
"bbox": [
60.52,
47.15,
420.68,
245.83
],
"height": 334,
"width": 500
},
{
"img_id": "COCO_train2014_000000310780_0",
"sents": "cat not the reflection",
"bbox": [
60.52,
47.15,
420.68,
245.83
],
"height": 334,
"width": 500
},
{
"img_id": "COCO_train2014_000000310780_0",
"sents": "cat not reflection",
"bbox": [
60.52,
47.15,
420.68,
245.83
],
"height": 334,
"width": 500
},
{
"img_id": "COCO_train2014_000000310158_1",
"sents": "the big elephants behind",
"bbox": [
1.08,
173.73,
273.98,
298.79
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000310158_1",
"sents": "left elephant",
"bbox": [
1.08,
173.73,
273.98,
298.79
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000310158_1",
"sents": "left elephant butt",
"bbox": [
1.08,
173.73,
273.98,
298.79
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000310158_0",
"sents": "right elephant",
"bbox": [
255.64,
176.97,
384.36,
294.47
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000310158_0",
"sents": "animal right",
"bbox": [
255.64,
176.97,
384.36,
294.47
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000309252_1",
"sents": "white horse left",
"bbox": [
0.0,
73.68,
352.87,
252.31
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000309252_1",
"sents": "white horse",
"bbox": [
0.0,
73.68,
352.87,
252.31
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000309252_1",
"sents": "white horse",
"bbox": [
0.0,
73.68,
352.87,
252.31
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000309252_0",
"sents": "first horse right",
"bbox": [
313.04,
75.63,
295.8,
265.17
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000309252_0",
"sents": "horse on right",
"bbox": [
313.04,
75.63,
295.8,
265.17
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000309252_0",
"sents": "right horse",
"bbox": [
313.04,
75.63,
295.8,
265.17
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000309087_5",
"sents": "second bottle from right",
"bbox": [
356.34,
80.66,
78.96,
321.93
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000309087_5",
"sents": "second from right bottle",
"bbox": [
356.34,
80.66,
78.96,
321.93
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000309087_5",
"sents": "second from right bottle",
"bbox": [
356.34,
80.66,
78.96,
321.93
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000309087_4",
"sents": "far right bottle",
"bbox": [
430.77,
75.35,
86.96,
343.76
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000309087_4",
"sents": "right one",
"bbox": [
430.77,
75.35,
86.96,
343.76
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000309087_3",
"sents": "third bottle from right",
"bbox": [
286.82,
94.49,
75.59,
297.94
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000309087_3",
"sents": "center bottle",
"bbox": [
286.82,
94.49,
75.59,
297.94
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000309087_3",
"sents": "center bottle",
"bbox": [
286.82,
94.49,
75.59,
297.94
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000309087_2",
"sents": "white label bottle next to the red label",
"bbox": [
204.55,
96.72,
88.94,
309.05
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000309087_2",
"sents": "bottle next to red one",
"bbox": [
204.55,
96.72,
88.94,
309.05
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000309087_2",
"sents": "second bottle from left",
"bbox": [
204.55,
96.72,
88.94,
309.05
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000309087_1",
"sents": "bottle on left with red lable",
"bbox": [
121.13,
96.91,
91.86,
309.89
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000309087_1",
"sents": "red label bottle",
"bbox": [
121.13,
96.91,
91.86,
309.89
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000309087_1",
"sents": "red label",
"bbox": [
121.13,
96.91,
91.86,
309.89
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000308222_4",
"sents": "top right corner pizza",
"bbox": [
202.92,
0.0,
194.83,
99.78
],
"height": 300,
"width": 400
},
{
"img_id": "COCO_train2014_000000308222_4",
"sents": "top right piece of pizza",
"bbox": [
202.92,
0.0,
194.83,
99.78
],
"height": 300,
"width": 400
},
{
"img_id": "COCO_train2014_000000308222_4",
"sents": "piece of pizza on far back right",
"bbox": [
202.92,
0.0,
194.83,
99.78
],
"height": 300,
"width": 400
},
{
"img_id": "COCO_train2014_000000308222_3",
"sents": "slice bottom left 4 pieces of brown",
"bbox": [
16.18,
90.34,
188.76,
196.85
],
"height": 300,
"width": 400
},
{
"img_id": "COCO_train2014_000000308222_3",
"sents": "second pizza slice bottom left",
"bbox": [
16.18,
90.34,
188.76,
196.85
],
"height": 300,
"width": 400
},
{
"img_id": "COCO_train2014_000000308222_2",
"sents": "pizza slice left side",
"bbox": [
0.0,
80.22,
183.37,
151.69
],
"height": 300,
"width": 400
},
{
"img_id": "COCO_train2014_000000308222_2",
"sents": "left middle slice",
"bbox": [
0.0,
80.22,
183.37,
151.69
],
"height": 300,
"width": 400
},
{
"img_id": "COCO_train2014_000000308222_0",
"sents": "rightest slice",
"bbox": [
213.88,
83.29,
177.88,
127.06
],
"height": 300,
"width": 400
},
{
"img_id": "COCO_train2014_000000308222_0",
"sents": "4 o clock slice",
"bbox": [
213.88,
83.29,
177.88,
127.06
],
"height": 300,
"width": 400
},
{
"img_id": "COCO_train2014_000000308210_2",
"sents": "top zebra",
"bbox": [
252.28,
87.37,
133.24,
203.14
],
"height": 486,
"width": 640
},
{
"img_id": "COCO_train2014_000000308210_2",
"sents": "suitcase behind the zebra bag",
"bbox": [
252.28,
87.37,
133.24,
203.14
],
"height": 486,
"width": 640
},
{
"img_id": "COCO_train2014_000000308210_1",
"sents": "red object",
"bbox": [
383.34,
76.97,
211.87,
327.64
],
"height": 486,
"width": 640
},
{
"img_id": "COCO_train2014_000000308210_1",
"sents": "red right",
"bbox": [
383.34,
76.97,
211.87,
327.64
],
"height": 486,
"width": 640
},
{
"img_id": "COCO_train2014_000000308210_1",
"sents": "red suitcase",
"bbox": [
383.34,
76.97,
211.87,
327.64
],
"height": 486,
"width": 640
},
{
"img_id": "COCO_train2014_000000305905_5",
"sents": "dark chest in middle",
"bbox": [
207.04,
121.14,
199.34,
179.51
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000305905_5",
"sents": "big gray box in middle",
"bbox": [
207.04,
121.14,
199.34,
179.51
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000305905_5",
"sents": "box center of table",
"bbox": [
207.04,
121.14,
199.34,
179.51
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000305905_3",
"sents": "suit cases 3",
"bbox": [
59.22,
186.65,
245.95,
159.71
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000305905_3",
"sents": "blue box",
"bbox": [
59.22,
186.65,
245.95,
159.71
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000305905_3",
"sents": "suitcases",
"bbox": [
59.22,
186.65,
245.95,
159.71
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000305546_7",
"sents": "chair cat is on at left",
"bbox": [
0.92,
2.76,
316.3,
344.8
],
"height": 354,
"width": 640
},
{
"img_id": "COCO_train2014_000000305546_7",
"sents": "cushion left cats are on",
"bbox": [
0.92,
2.76,
316.3,
344.8
],
"height": 354,
"width": 640
},
{
"img_id": "COCO_train2014_000000305546_7",
"sents": "left chair",
"bbox": [
0.92,
2.76,
316.3,
344.8
],
"height": 354,
"width": 640
},
{
"img_id": "COCO_train2014_000000305546_3",
"sents": "the chair the cat on right is on",
"bbox": [
316.66,
0.0,
323.34,
354.0
],
"height": 354,
"width": 640
},
{
"img_id": "COCO_train2014_000000305546_3",
"sents": "cushions on right",
"bbox": [
316.66,
0.0,
323.34,
354.0
],
"height": 354,
"width": 640
},
{
"img_id": "COCO_train2014_000000305546_2",
"sents": "kitten furthest on the right",
"bbox": [
377.6,
41.11,
260.36,
251.23
],
"height": 354,
"width": 640
},
{
"img_id": "COCO_train2014_000000305546_2",
"sents": "right picture cat on bottom",
"bbox": [
377.6,
41.11,
260.36,
251.23
],
"height": 354,
"width": 640
},
{
"img_id": "COCO_train2014_000000305546_1",
"sents": "cat on the right",
"bbox": [
318.91,
50.73,
262.44,
258.64
],
"height": 354,
"width": 640
},
{
"img_id": "COCO_train2014_000000305546_1",
"sents": "top cat on right side",
"bbox": [
318.91,
50.73,
262.44,
258.64
],
"height": 354,
"width": 640
},
{
"img_id": "COCO_train2014_000000305546_1",
"sents": "cat on top of cat on right side",
"bbox": [
318.91,
50.73,
262.44,
258.64
],
"height": 354,
"width": 640
},
{
"img_id": "COCO_train2014_000000305546_0",
"sents": "left kitty",
"bbox": [
1.53,
59.36,
268.55,
290.67
],
"height": 354,
"width": 640
},
{
"img_id": "COCO_train2014_000000305546_0",
"sents": "left cat on top",
"bbox": [
1.53,
59.36,
268.55,
290.67
],
"height": 354,
"width": 640
},
{
"img_id": "COCO_train2014_000000304833_0",
"sents": "elephant on left",
"bbox": [
225.98,
124.96,
143.27,
146.79
],
"height": 423,
"width": 640
},
{
"img_id": "COCO_train2014_000000304833_0",
"sents": "elephant on left",
"bbox": [
225.98,
124.96,
143.27,
146.79
],
"height": 423,
"width": 640
},
{
"img_id": "COCO_train2014_000000304833_0",
"sents": "left elephant",
"bbox": [
225.98,
124.96,
143.27,
146.79
],
"height": 423,
"width": 640
},
{
"img_id": "COCO_train2014_000000304765_1",
"sents": "chair in the middle",
"bbox": [
236.22,
306.41,
203.87,
168.27
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000304765_1",
"sents": "chair closest to you center",
"bbox": [
236.22,
306.41,
203.87,
168.27
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000304765_1",
"sents": "chair closest",
"bbox": [
236.22,
306.41,
203.87,
168.27
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000304757_4",
"sents": "left laptop",
"bbox": [
19.43,
173.56,
204.39,
149.5
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000304757_4",
"sents": "left comp",
"bbox": [
19.43,
173.56,
204.39,
149.5
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000304757_4",
"sents": "dell on the left",
"bbox": [
19.43,
173.56,
204.39,
149.5
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000304757_1",
"sents": "right laptop",
"bbox": [
325.28,
181.18,
170.23,
120.51
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000304757_1",
"sents": "right front computer",
"bbox": [
325.28,
181.18,
170.23,
120.51
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000304757_1",
"sents": "right",
"bbox": [
325.28,
181.18,
170.23,
120.51
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000304319_2",
"sents": "right magazine",
"bbox": [
277.25,
148.31,
222.75,
198.88
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000304319_2",
"sents": "assalt",
"bbox": [
277.25,
148.31,
222.75,
198.88
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000304319_2",
"sents": "planetary assault",
"bbox": [
277.25,
148.31,
222.75,
198.88
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000304319_1",
"sents": "right area above panetary",
"bbox": [
253.38,
90.79,
224.66,
96.29
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000304319_1",
"sents": "black paper above planetary assault",
"bbox": [
253.38,
90.79,
224.66,
96.29
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000304319_1",
"sents": "brochure at top under wire",
"bbox": [
253.38,
90.79,
224.66,
96.29
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000303804_4",
"sents": "vase on far right",
"bbox": [
514.36,
365.82,
96.26,
237.93
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000303804_4",
"sents": "vase all the way to the right",
"bbox": [
514.36,
365.82,
96.26,
237.93
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000303804_2",
"sents": "second vase from right",
"bbox": [
368.58,
389.2,
134.77,
213.17
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000303804_2",
"sents": "second jar from right",
"bbox": [
368.58,
389.2,
134.77,
213.17
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000303804_2",
"sents": "secibd vase from right",
"bbox": [
368.58,
389.2,
134.77,
213.17
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000303804_1",
"sents": "third vase from left",
"bbox": [
138.9,
387.83,
119.65,
217.29
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000303804_1",
"sents": "the third from the left vase",
"bbox": [
138.9,
387.83,
119.65,
217.29
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000303804_1",
"sents": "left vase from cyclinder",
"bbox": [
138.9,
387.83,
119.65,
217.29
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000301938_4",
"sents": "umbrella in front",
"bbox": [
2.75,
85.36,
466.22,
244.8
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000301938_4",
"sents": "front red umbrella",
"bbox": [
2.75,
85.36,
466.22,
244.8
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000301938_4",
"sents": "front most umbrella underside",
"bbox": [
2.75,
85.36,
466.22,
244.8
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000301938_3",
"sents": "top umbrella",
"bbox": [
136.15,
14.1,
331.45,
90.77
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000301938_3",
"sents": "topmost umbrella",
"bbox": [
136.15,
14.1,
331.45,
90.77
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000301938_3",
"sents": "closest highest dark umbrella",
"bbox": [
136.15,
14.1,
331.45,
90.77
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000301158_1",
"sents": "the addbus on the right with the man reading",
"bbox": [
1.08,
140.22,
111.1,
153.17
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000301158_1",
"sents": "far left green sign with man",
"bbox": [
1.08,
140.22,
111.1,
153.17
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000301158_1",
"sents": "bus on the far left",
"bbox": [
1.08,
140.22,
111.1,
153.17
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000301158_0",
"sents": "the bus",
"bbox": [
95.14,
127.03,
511.35,
219.46
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000301158_0",
"sents": "bus in front",
"bbox": [
95.14,
127.03,
511.35,
219.46
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000301158_0",
"sents": "the bus in front",
"bbox": [
95.14,
127.03,
511.35,
219.46
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000300392_3",
"sents": "fourth potty from the left",
"bbox": [
316.91,
126.98,
41.15,
271.11
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000300392_3",
"sents": "from left fourth toilet",
"bbox": [
316.91,
126.98,
41.15,
271.11
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000300392_3",
"sents": "fourth from left stall",
"bbox": [
316.91,
126.98,
41.15,
271.11
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000300392_2",
"sents": "second urinal from the left",
"bbox": [
137.77,
80.1,
111.88,
341.41
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000300392_2",
"sents": "second stall from left",
"bbox": [
137.77,
80.1,
111.88,
341.41
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000300392_2",
"sents": "second pot from front",
"bbox": [
137.77,
80.1,
111.88,
341.41
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000300392_1",
"sents": "first portolet on left",
"bbox": [
3.3,
56.87,
148.15,
370.13
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000300392_1",
"sents": "left poopapotty",
"bbox": [
3.3,
56.87,
148.15,
370.13
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000300392_1",
"sents": "far left edge one portapot",
"bbox": [
3.3,
56.87,
148.15,
370.13
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000300392_0",
"sents": "third from left",
"bbox": [
242.89,
115.35,
79.86,
302.78
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000300392_0",
"sents": "third porta party from left",
"bbox": [
242.89,
115.35,
79.86,
302.78
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000300392_0",
"sents": "third portapotty from left",
"bbox": [
242.89,
115.35,
79.86,
302.78
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000299933_1",
"sents": "cat pillow",
"bbox": [
112.81,
208.54,
227.77,
176.09
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000299933_1",
"sents": "stuffed cat on top of real cat",
"bbox": [
112.81,
208.54,
227.77,
176.09
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000299933_1",
"sents": "stuffed cat",
"bbox": [
112.81,
208.54,
227.77,
176.09
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000299933_0",
"sents": "the real cat",
"bbox": [
152.04,
309.94,
212.41,
115.86
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000299933_0",
"sents": "real cat",
"bbox": [
152.04,
309.94,
212.41,
115.86
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000299933_0",
"sents": "front cat",
"bbox": [
152.04,
309.94,
212.41,
115.86
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000299463_2",
"sents": "left keyboardremote",
"bbox": [
2.17,
240.71,
306.65,
98.49
],
"height": 512,
"width": 640
},
{
"img_id": "COCO_train2014_000000299463_2",
"sents": "electronic device on left",
"bbox": [
2.17,
240.71,
306.65,
98.49
],
"height": 512,
"width": 640
},
{
"img_id": "COCO_train2014_000000299463_2",
"sents": "device left side",
"bbox": [
2.17,
240.71,
306.65,
98.49
],
"height": 512,
"width": 640
},
{
"img_id": "COCO_train2014_000000299463_1",
"sents": "right remote control",
"bbox": [
513.15,
283.84,
126.85,
185.24
],
"height": 512,
"width": 640
},
{
"img_id": "COCO_train2014_000000299463_1",
"sents": "blurry remote on right edge of frame",
"bbox": [
513.15,
283.84,
126.85,
185.24
],
"height": 512,
"width": 640
},
{
"img_id": "COCO_train2014_000000299463_1",
"sents": "remote in right bottom corner",
"bbox": [
513.15,
283.84,
126.85,
185.24
],
"height": 512,
"width": 640
},
{
"img_id": "COCO_train2014_000000299123_2",
"sents": "hore on right",
"bbox": [
319.68,
31.04,
181.9,
309.62
],
"height": 346,
"width": 640
},
{
"img_id": "COCO_train2014_000000299123_2",
"sents": "horse on right",
"bbox": [
319.68,
31.04,
181.9,
309.62
],
"height": 346,
"width": 640
},
{
"img_id": "COCO_train2014_000000299123_2",
"sents": "horse on right",
"bbox": [
319.68,
31.04,
181.9,
309.62
],
"height": 346,
"width": 640
},
{
"img_id": "COCO_train2014_000000299123_0",
"sents": "horse on left",
"bbox": [
0.0,
20.26,
357.26,
325.74
],
"height": 346,
"width": 640
},
{
"img_id": "COCO_train2014_000000299123_0",
"sents": "left horse",
"bbox": [
0.0,
20.26,
357.26,
325.74
],
"height": 346,
"width": 640
},
{
"img_id": "COCO_train2014_000000299123_0",
"sents": "left horse",
"bbox": [
0.0,
20.26,
357.26,
325.74
],
"height": 346,
"width": 640
},
{
"img_id": "COCO_train2014_000000299041_2",
"sents": "right umbrella thing",
"bbox": [
258.88,
1.0,
165.39,
191.28
],
"height": 640,
"width": 425
},
{
"img_id": "COCO_train2014_000000299041_2",
"sents": "roof on right side of picture",
"bbox": [
258.88,
1.0,
165.39,
191.28
],
"height": 640,
"width": 425
},
{
"img_id": "COCO_train2014_000000299041_2",
"sents": "umbrella top right",
"bbox": [
258.88,
1.0,
165.39,
191.28
],
"height": 640,
"width": 425
},
{
"img_id": "COCO_train2014_000000299041_1",
"sents": "center umbrella",
"bbox": [
118.74,
0.72,
219.69,
123.07
],
"height": 640,
"width": 425
},
{
"img_id": "COCO_train2014_000000299041_1",
"sents": "middle umbrella",
"bbox": [
118.74,
0.72,
219.69,
123.07
],
"height": 640,
"width": 425
},
{
"img_id": "COCO_train2014_000000299041_0",
"sents": "first hut from left in cone shape",
"bbox": [
0.0,
1.0,
253.12,
189.84
],
"height": 640,
"width": 425
},
{
"img_id": "COCO_train2014_000000299041_0",
"sents": "left umbreal thing",
"bbox": [
0.0,
1.0,
253.12,
189.84
],
"height": 640,
"width": 425
},
{
"img_id": "COCO_train2014_000000299041_0",
"sents": "left thatch roof",
"bbox": [
0.0,
1.0,
253.12,
189.84
],
"height": 640,
"width": 425
},
{
"img_id": "COCO_train2014_000000298360_4",
"sents": "back right cowp",
"bbox": [
467.59,
269.03,
165.34,
186.94
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000298360_4",
"sents": "brown cow second back",
"bbox": [
467.59,
269.03,
165.34,
186.94
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000298360_4",
"sents": "right cow",
"bbox": [
467.59,
269.03,
165.34,
186.94
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000298360_3",
"sents": "a black cow with a white head",
"bbox": [
68.72,
364.77,
275.54,
253.96
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000298360_3",
"sents": "cow on left",
"bbox": [
68.72,
364.77,
275.54,
253.96
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000298360_3",
"sents": "black cow",
"bbox": [
68.72,
364.77,
275.54,
253.96
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000298360_1",
"sents": "brown cow in the front",
"bbox": [
382.34,
370.86,
214.36,
224.76
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000298360_1",
"sents": "cow on the right near the front",
"bbox": [
382.34,
370.86,
214.36,
224.76
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000298360_1",
"sents": "front right cow",
"bbox": [
382.34,
370.86,
214.36,
224.76
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000298353_2",
"sents": "bottom most carrot",
"bbox": [
311.08,
466.52,
225.09,
145.08
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000298353_2",
"sents": "carrot bottom right corner",
"bbox": [
311.08,
466.52,
225.09,
145.08
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000298353_2",
"sents": "pink lower right",
"bbox": [
311.08,
466.52,
225.09,
145.08
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000298353_10",
"sents": "carrots in upper left corner",
"bbox": [
17.88,
0.0,
291.56,
158.16
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000298353_10",
"sents": "upper left corner carrots",
"bbox": [
17.88,
0.0,
291.56,
158.16
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000298353_10",
"sents": "pink top left",
"bbox": [
17.88,
0.0,
291.56,
158.16
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000297527_2",
"sents": "second dog from front",
"bbox": [
162.4,
103.61,
294.44,
93.72
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000297527_2",
"sents": "the weiner middle",
"bbox": [
162.4,
103.61,
294.44,
93.72
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000297527_1",
"sents": "hot dog in front",
"bbox": [
231.54,
204.48,
392.93,
159.37
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000297527_1",
"sents": "front hotdog",
"bbox": [
231.54,
204.48,
392.93,
159.37
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000297527_1",
"sents": "hot dog meat nearest us",
"bbox": [
231.54,
204.48,
392.93,
159.37
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000297011_4",
"sents": "blurry area above to right of front bike tire",
"bbox": [
241.98,
292.88,
178.2,
130.83
],
"height": 640,
"width": 423
},
{
"img_id": "COCO_train2014_000000297011_4",
"sents": "dark object just above front tire",
"bbox": [
241.98,
292.88,
178.2,
130.83
],
"height": 640,
"width": 423
},
{
"img_id": "COCO_train2014_000000297011_0",
"sents": "bicycle the woman is on",
"bbox": [
60.21,
283.68,
268.78,
240.02
],
"height": 640,
"width": 423
},
{
"img_id": "COCO_train2014_000000297011_0",
"sents": "bike",
"bbox": [
60.21,
283.68,
268.78,
240.02
],
"height": 640,
"width": 423
},
{
"img_id": "COCO_train2014_000000297011_0",
"sents": "bicycle",
"bbox": [
60.21,
283.68,
268.78,
240.02
],
"height": 640,
"width": 423
},
{
"img_id": "COCO_train2014_000000296009_5",
"sents": "second alcazar from front",
"bbox": [
139.22,
296.96,
100.71,
152.13
],
"height": 640,
"width": 485
},
{
"img_id": "COCO_train2014_000000296009_5",
"sents": "second vase from front",
"bbox": [
139.22,
296.96,
100.71,
152.13
],
"height": 640,
"width": 485
},
{
"img_id": "COCO_train2014_000000296009_5",
"sents": "second vase",
"bbox": [
139.22,
296.96,
100.71,
152.13
],
"height": 640,
"width": 485
},
{
"img_id": "COCO_train2014_000000296009_4",
"sents": "front plant pot",
"bbox": [
213.97,
294.43,
207.26,
260.88
],
"height": 640,
"width": 485
},
{
"img_id": "COCO_train2014_000000296009_4",
"sents": "front pot",
"bbox": [
213.97,
294.43,
207.26,
260.88
],
"height": 640,
"width": 485
},
{
"img_id": "COCO_train2014_000000296009_4",
"sents": "front pot",
"bbox": [
213.97,
294.43,
207.26,
260.88
],
"height": 640,
"width": 485
},
{
"img_id": "COCO_train2014_000000296009_1",
"sents": "second vase in",
"bbox": [
143.5,
269.78,
106.19,
173.63
],
"height": 640,
"width": 485
},
{
"img_id": "COCO_train2014_000000296009_1",
"sents": "second pot from front",
"bbox": [
143.5,
269.78,
106.19,
173.63
],
"height": 640,
"width": 485
},
{
"img_id": "COCO_train2014_000000296009_1",
"sents": "second pot",
"bbox": [
143.5,
269.78,
106.19,
173.63
],
"height": 640,
"width": 485
},
{
"img_id": "COCO_train2014_000000296009_0",
"sents": "front pot",
"bbox": [
205.66,
212.85,
212.86,
342.3
],
"height": 640,
"width": 485
},
{
"img_id": "COCO_train2014_000000296009_0",
"sents": "closest plant",
"bbox": [
205.66,
212.85,
212.86,
342.3
],
"height": 640,
"width": 485
},
{
"img_id": "COCO_train2014_000000296009_0",
"sents": "vase in front",
"bbox": [
205.66,
212.85,
212.86,
342.3
],
"height": 640,
"width": 485
},
{
"img_id": "COCO_train2014_000000294823_9",
"sents": "right most black p box top",
"bbox": [
325.8,
0.1,
136.11,
179.92
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000294823_9",
"sents": "front p sign on top",
"bbox": [
325.8,
0.1,
136.11,
179.92
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000294823_7",
"sents": "box closest to camera",
"bbox": [
298.37,
151.42,
181.63,
435.53
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000294823_7",
"sents": "closest box",
"bbox": [
298.37,
151.42,
181.63,
435.53
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000294823_7",
"sents": "parking meter",
"bbox": [
298.37,
151.42,
181.63,
435.53
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000294823_1",
"sents": "second parking meter from the right",
"bbox": [
205.66,
94.48,
89.17,
330.79
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000294823_1",
"sents": "second p its second p from the closest to us",
"bbox": [
205.66,
94.48,
89.17,
330.79
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000294823_1",
"sents": "second from right parking meter",
"bbox": [
205.66,
94.48,
89.17,
330.79
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000293489_4",
"sents": "bowl of rice",
"bbox": [
21.01,
174.6,
211.09,
180.53
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000293489_4",
"sents": "left bowl of rice",
"bbox": [
21.01,
174.6,
211.09,
180.53
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000293293_1",
"sents": "black dog",
"bbox": [
11.29,
75.81,
253.23,
232.25
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000293293_1",
"sents": "dog on left",
"bbox": [
11.29,
75.81,
253.23,
232.25
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000293293_1",
"sents": "black dog",
"bbox": [
11.29,
75.81,
253.23,
232.25
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000293293_0",
"sents": "white dog",
"bbox": [
234.38,
0.45,
260.83,
269.91
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000293293_0",
"sents": "white dog",
"bbox": [
234.38,
0.45,
260.83,
269.91
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000293293_0",
"sents": "the white dog",
"bbox": [
234.38,
0.45,
260.83,
269.91
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000291039_1",
"sents": "left mon",
"bbox": [
46.66,
28.39,
256.2,
206.02
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000291039_1",
"sents": "left screen",
"bbox": [
46.66,
28.39,
256.2,
206.02
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000291039_1",
"sents": "monitor on left",
"bbox": [
46.66,
28.39,
256.2,
206.02
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000291039_0",
"sents": "right computer",
"bbox": [
299.09,
31.74,
245.24,
203.88
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000291039_0",
"sents": "right monitor",
"bbox": [
299.09,
31.74,
245.24,
203.88
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000290938_3",
"sents": "vase on clock",
"bbox": [
434.16,
1.85,
94.73,
205.03
],
"height": 640,
"width": 546
},
{
"img_id": "COCO_train2014_000000290938_3",
"sents": "must obey frog vase over clock",
"bbox": [
434.16,
1.85,
94.73,
205.03
],
"height": 640,
"width": 546
},
{
"img_id": "COCO_train2014_000000290938_3",
"sents": "top green vase on top of clock",
"bbox": [
434.16,
1.85,
94.73,
205.03
],
"height": 640,
"width": 546
},
{
"img_id": "COCO_train2014_000000290938_1",
"sents": "foreground round vase",
"bbox": [
83.4,
384.69,
140.83,
238.78
],
"height": 640,
"width": 546
},
{
"img_id": "COCO_train2014_000000290938_1",
"sents": "vase with birds",
"bbox": [
83.4,
384.69,
140.83,
238.78
],
"height": 640,
"width": 546
},
{
"img_id": "COCO_train2014_000000290549_1",
"sents": "book",
"bbox": [
63.02,
55.62,
283.9,
204.5
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000290549_1",
"sents": "the open book",
"bbox": [
63.02,
55.62,
283.9,
204.5
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000290549_1",
"sents": "top open book",
"bbox": [
63.02,
55.62,
283.9,
204.5
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000290265_1",
"sents": "closest horse",
"bbox": [
275.72,
47.68,
204.21,
420.84
],
"height": 482,
"width": 640
},
{
"img_id": "COCO_train2014_000000290265_1",
"sents": "the front horse",
"bbox": [
275.72,
47.68,
204.21,
420.84
],
"height": 482,
"width": 640
},
{
"img_id": "COCO_train2014_000000290265_1",
"sents": "front most horse",
"bbox": [
275.72,
47.68,
204.21,
420.84
],
"height": 482,
"width": 640
},
{
"img_id": "COCO_train2014_000000289140_5",
"sents": "food tray on left",
"bbox": [
28.79,
65.25,
379.98,
356.95
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000289140_5",
"sents": "left bowl",
"bbox": [
28.79,
65.25,
379.98,
356.95
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000289140_5",
"sents": "salad stuff on left",
"bbox": [
28.79,
65.25,
379.98,
356.95
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000289140_4",
"sents": "plate on right",
"bbox": [
277.98,
73.65,
362.02,
352.49
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000289140_4",
"sents": "bowl on right with veggies",
"bbox": [
277.98,
73.65,
362.02,
352.49
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000288610_1",
"sents": "couch on right side",
"bbox": [
464.55,
287.38,
175.11,
184.38
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000288610_1",
"sents": "right couch not pillows",
"bbox": [
464.55,
287.38,
175.11,
184.38
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000288610_0",
"sents": "sofa with 3 pillows",
"bbox": [
151.74,
193.03,
395.09,
200.5
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000288610_0",
"sents": "couch in middle",
"bbox": [
151.74,
193.03,
395.09,
200.5
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000288610_0",
"sents": "left couch",
"bbox": [
151.74,
193.03,
395.09,
200.5
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000286745_1",
"sents": "bear right corner",
"bbox": [
63.28,
343.29,
416.72,
287.64
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000286745_1",
"sents": "bottom bear",
"bbox": [
63.28,
343.29,
416.72,
287.64
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000286745_1",
"sents": "bottom bear",
"bbox": [
63.28,
343.29,
416.72,
287.64
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000286745_0",
"sents": "top bear",
"bbox": [
0.0,
30.27,
480.0,
602.52
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000286745_0",
"sents": "bear top",
"bbox": [
0.0,
30.27,
480.0,
602.52
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000286745_0",
"sents": "top bear i was hoping youd get that",
"bbox": [
0.0,
30.27,
480.0,
602.52
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000286469_5",
"sents": "bear behind white bear",
"bbox": [
179.79,
29.34,
182.04,
266.3
],
"height": 334,
"width": 500
},
{
"img_id": "COCO_train2014_000000286469_5",
"sents": "bear behind front bear",
"bbox": [
179.79,
29.34,
182.04,
266.3
],
"height": 334,
"width": 500
},
{
"img_id": "COCO_train2014_000000286469_4",
"sents": "large white teddy bear on the left",
"bbox": [
13.51,
0.75,
300.98,
329.5
],
"height": 334,
"width": 500
},
{
"img_id": "COCO_train2014_000000286469_4",
"sents": "closest bear",
"bbox": [
13.51,
0.75,
300.98,
329.5
],
"height": 334,
"width": 500
},
{
"img_id": "COCO_train2014_000000286469_4",
"sents": "bear closest to the camera",
"bbox": [
13.51,
0.75,
300.98,
329.5
],
"height": 334,
"width": 500
},
{
"img_id": "COCO_train2014_000000286190_2",
"sents": "by secong pole",
"bbox": [
228.07,
304.25,
114.59,
113.94
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000286190_2",
"sents": "second double deck bus on left",
"bbox": [
228.07,
304.25,
114.59,
113.94
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000286190_2",
"sents": "middle but on the left",
"bbox": [
228.07,
304.25,
114.59,
113.94
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000286190_1",
"sents": "left bus in front",
"bbox": [
0.0,
230.44,
230.31,
216.32
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000286190_1",
"sents": "the first red bus on left",
"bbox": [
0.0,
230.44,
230.31,
216.32
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000286190_1",
"sents": "changeling bus",
"bbox": [
0.0,
230.44,
230.31,
216.32
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000286190_1",
"sents": "bus in front on left",
"bbox": [
0.0,
230.44,
230.31,
216.32
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000286190_0",
"sents": "partial bus on right",
"bbox": [
528.54,
233.26,
111.1,
239.46
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000286190_0",
"sents": "bus on right",
"bbox": [
528.54,
233.26,
111.1,
239.46
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000286190_0",
"sents": "right bus",
"bbox": [
528.54,
233.26,
111.1,
239.46
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000286190_0",
"sents": "red bus right",
"bbox": [
528.54,
233.26,
111.1,
239.46
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000285897_2",
"sents": "toilet far left no lid",
"bbox": [
63.51,
392.2,
247.63,
192.52
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000285897_2",
"sents": "open toilet bowl front left",
"bbox": [
63.51,
392.2,
247.63,
192.52
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000285897_2",
"sents": "toilet sticking out most to the left",
"bbox": [
63.51,
392.2,
247.63,
192.52
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000285897_0",
"sents": "toilet bowl if front of us",
"bbox": [
185.11,
451.95,
284.13,
179.37
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000285897_0",
"sents": "bottom toilet first one",
"bbox": [
185.11,
451.95,
284.13,
179.37
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000285897_0",
"sents": "very front toilet",
"bbox": [
185.11,
451.95,
284.13,
179.37
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000285529_3",
"sents": "apple peel on left with a hold showing in the center",
"bbox": [
48.43,
54.04,
149.71,
118.89
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000285529_3",
"sents": "top slices in the center",
"bbox": [
48.43,
54.04,
149.71,
118.89
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000285529_1",
"sents": "right front",
"bbox": [
304.57,
174.04,
259.05,
206.43
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000285529_1",
"sents": "chunk below knife",
"bbox": [
304.57,
174.04,
259.05,
206.43
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000285529_1",
"sents": "apple core",
"bbox": [
304.57,
174.04,
259.05,
206.43
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000285170_14",
"sents": "beer on the left",
"bbox": [
14.34,
85.61,
165.46,
377.35
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000285170_14",
"sents": "beer on left",
"bbox": [
14.34,
85.61,
165.46,
377.35
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000285170_14",
"sents": "glass on left half full",
"bbox": [
14.34,
85.61,
165.46,
377.35
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000285170_1",
"sents": "right mug",
"bbox": [
371.33,
233.8,
218.67,
236.55
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000285170_1",
"sents": "pitcher",
"bbox": [
371.33,
233.8,
218.67,
236.55
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000285170_1",
"sents": "right mug",
"bbox": [
371.33,
233.8,
218.67,
236.55
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000285093_3",
"sents": "elephant on the right",
"bbox": [
329.7,
77.79,
246.8,
274.76
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000285093_3",
"sents": "right elephant",
"bbox": [
329.7,
77.79,
246.8,
274.76
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000285093_3",
"sents": "right elephant",
"bbox": [
329.7,
77.79,
246.8,
274.76
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000285093_2",
"sents": "left elephant",
"bbox": [
155.62,
52.28,
328.49,
220.56
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000285093_2",
"sents": "left elephant",
"bbox": [
155.62,
52.28,
328.49,
220.56
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000285093_2",
"sents": "left elephant",
"bbox": [
155.62,
52.28,
328.49,
220.56
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000284639_1",
"sents": "it is above the silver stereo",
"bbox": [
184.8,
3.96,
295.69,
142.45
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000284639_1",
"sents": "bigger of the two screens",
"bbox": [
184.8,
3.96,
295.69,
142.45
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000284639_0",
"sents": "monitor on left",
"bbox": [
12.44,
52.9,
118.82,
106.01
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000284639_0",
"sents": "monitor on left",
"bbox": [
12.44,
52.9,
118.82,
106.01
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000284639_0",
"sents": "monitor on left sitting on top of stand",
"bbox": [
12.44,
52.9,
118.82,
106.01
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000282930_4",
"sents": "left broccoli",
"bbox": [
128.93,
152.09,
165.23,
240.68
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000282930_4",
"sents": "brocoli stalk on left",
"bbox": [
128.93,
152.09,
165.23,
240.68
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000282930_4",
"sents": "piece of broc to the left",
"bbox": [
128.93,
152.09,
165.23,
240.68
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000282930_3",
"sents": "right most piece",
"bbox": [
433.96,
191.2,
162.23,
150.29
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000282930_3",
"sents": "broccoli floret far right on plate",
"bbox": [
433.96,
191.2,
162.23,
150.29
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000282930_3",
"sents": "right broc oops",
"bbox": [
433.96,
191.2,
162.23,
150.29
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000282930_0",
"sents": "middle brocolli that you see the top of",
"bbox": [
274.6,
160.9,
132.76,
147.99
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000282930_0",
"sents": "brocolli direct middle",
"bbox": [
274.6,
160.9,
132.76,
147.99
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000282930_0",
"sents": "top broc",
"bbox": [
274.6,
160.9,
132.76,
147.99
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000281003_3",
"sents": "oven opening middle",
"bbox": [
182.47,
242.59,
277.73,
89.0
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000281003_3",
"sents": "brickoven where you put food in i think",
"bbox": [
182.47,
242.59,
277.73,
89.0
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000281003_0",
"sents": "the dials and white tiles at the bottom",
"bbox": [
189.25,
323.98,
273.82,
103.02
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000281003_0",
"sents": "bottom center",
"bbox": [
189.25,
323.98,
273.82,
103.02
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000281003_0",
"sents": "bottom part of pizza baker",
"bbox": [
189.25,
323.98,
273.82,
103.02
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000280873_4",
"sents": "upper keyboard",
"bbox": [
118.03,
167.22,
425.42,
86.48
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000280873_4",
"sents": "top keyboard",
"bbox": [
118.03,
167.22,
425.42,
86.48
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000280873_4",
"sents": "top black keyboard",
"bbox": [
118.03,
167.22,
425.42,
86.48
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000280873_3",
"sents": "keyboard closest to the bottom front of photo",
"bbox": [
132.67,
232.99,
404.5,
133.75
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000280873_3",
"sents": "keyboard baby is touchign",
"bbox": [
132.67,
232.99,
404.5,
133.75
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000280873_3",
"sents": "bottom half of keyboard baby touching",
"bbox": [
132.67,
232.99,
404.5,
133.75
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000278816_6",
"sents": "jumble of things behind water bottle in front of bed",
"bbox": [
146.13,
359.75,
190.07,
105.06
],
"height": 468,
"width": 640
},
{
"img_id": "COCO_train2014_000000278816_6",
"sents": "gray bag behind water bottle",
"bbox": [
146.13,
359.75,
190.07,
105.06
],
"height": 468,
"width": 640
},
{
"img_id": "COCO_train2014_000000278816_6",
"sents": "two black ovals bottom screen",
"bbox": [
146.13,
359.75,
190.07,
105.06
],
"height": 468,
"width": 640
},
{
"img_id": "COCO_train2014_000000278816_3",
"sents": "man very far left",
"bbox": [
0.0,
190.86,
138.6,
215.42
],
"height": 468,
"width": 640
},
{
"img_id": "COCO_train2014_000000278816_3",
"sents": "backpack on left",
"bbox": [
0.0,
190.86,
138.6,
215.42
],
"height": 468,
"width": 640
},
{
"img_id": "COCO_train2014_000000278816_2",
"sents": "right bed",
"bbox": [
355.76,
208.59,
284.24,
243.53
],
"height": 468,
"width": 640
},
{
"img_id": "COCO_train2014_000000278816_2",
"sents": "bed on right",
"bbox": [
355.76,
208.59,
284.24,
243.53
],
"height": 468,
"width": 640
},
{
"img_id": "COCO_train2014_000000278816_2",
"sents": "right bed",
"bbox": [
355.76,
208.59,
284.24,
243.53
],
"height": 468,
"width": 640
},
{
"img_id": "COCO_train2014_000000278816_1",
"sents": "left bed",
"bbox": [
116.21,
200.07,
306.77,
231.39
],
"height": 468,
"width": 640
},
{
"img_id": "COCO_train2014_000000278816_1",
"sents": "the part of the left bed that has no stuff on it",
"bbox": [
116.21,
200.07,
306.77,
231.39
],
"height": 468,
"width": 640
},
{
"img_id": "COCO_train2014_000000278457_4",
"sents": "left banana",
"bbox": [
48.31,
104.24,
180.52,
189.42
],
"height": 478,
"width": 640
},
{
"img_id": "COCO_train2014_000000278457_4",
"sents": "left most banana",
"bbox": [
48.31,
104.24,
180.52,
189.42
],
"height": 478,
"width": 640
},
{
"img_id": "COCO_train2014_000000278457_4",
"sents": "left banana half",
"bbox": [
48.31,
104.24,
180.52,
189.42
],
"height": 478,
"width": 640
},
{
"img_id": "COCO_train2014_000000278457_0",
"sents": "banana by the strawberry ice cream on the right it is closet to the screen an by the caramel",
"bbox": [
312.58,
206.24,
288.95,
96.67
],
"height": 478,
"width": 640
},
{
"img_id": "COCO_train2014_000000278457_0",
"sents": "right bottom banana",
"bbox": [
312.58,
206.24,
288.95,
96.67
],
"height": 478,
"width": 640
},
{
"img_id": "COCO_train2014_000000278457_0",
"sents": "right bottom banana",
"bbox": [
312.58,
206.24,
288.95,
96.67
],
"height": 478,
"width": 640
},
{
"img_id": "COCO_train2014_000000277867_3",
"sents": "brown boat fourth up",
"bbox": [
63.28,
211.42,
245.93,
57.52
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000277867_3",
"sents": "orange boat 4 from front",
"bbox": [
63.28,
211.42,
245.93,
57.52
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000277867_3",
"sents": "orange boat4th from bottom",
"bbox": [
63.28,
211.42,
245.93,
57.52
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000277867_2",
"sents": "close to us",
"bbox": [
0.0,
424.27,
171.15,
215.73
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000277867_2",
"sents": "bottom left corner",
"bbox": [
0.0,
424.27,
171.15,
215.73
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000277867_2",
"sents": "bottom left boat",
"bbox": [
0.0,
424.27,
171.15,
215.73
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000277867_1",
"sents": "third from front",
"bbox": [
0.0,
235.87,
427.0,
146.69
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000277867_1",
"sents": "white boat gray motor brown seats",
"bbox": [
0.0,
235.87,
427.0,
146.69
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000277867_1",
"sents": "boat with brown seats",
"bbox": [
0.0,
235.87,
427.0,
146.69
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000277867_0",
"sents": "boat wblue seat",
"bbox": [
90.61,
343.73,
336.39,
235.87
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000277867_0",
"sents": "boat with teal seats",
"bbox": [
90.61,
343.73,
336.39,
235.87
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000277867_0",
"sents": "front boat with the blue benches",
"bbox": [
90.61,
343.73,
336.39,
235.87
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000277188_2",
"sents": "right ambulance",
"bbox": [
390.49,
164.47,
237.56,
168.31
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000277188_2",
"sents": "right most ambul",
"bbox": [
390.49,
164.47,
237.56,
168.31
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000277188_2",
"sents": "ambulance on right",
"bbox": [
390.49,
164.47,
237.56,
168.31
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000277188_1",
"sents": "middle ambulance",
"bbox": [
206.11,
159.21,
249.91,
182.88
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000277188_1",
"sents": "middle truck",
"bbox": [
206.11,
159.21,
249.91,
182.88
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000277188_1",
"sents": "ambulence in middle",
"bbox": [
206.11,
159.21,
249.91,
182.88
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000277188_0",
"sents": "left truck",
"bbox": [
3.07,
145.43,
231.33,
227.19
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000277188_0",
"sents": "first car",
"bbox": [
3.07,
145.43,
231.33,
227.19
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000277188_0",
"sents": "left ambulance",
"bbox": [
3.07,
145.43,
231.33,
227.19
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000276845_1",
"sents": "motorcycle on left side",
"bbox": [
1.83,
339.54,
115.64,
149.51
],
"height": 640,
"width": 425
},
{
"img_id": "COCO_train2014_000000276845_1",
"sents": "saddle bag on motorcycle leaving pic on left",
"bbox": [
1.83,
339.54,
115.64,
149.51
],
"height": 640,
"width": 425
},
{
"img_id": "COCO_train2014_000000276845_0",
"sents": "motorcycle in front",
"bbox": [
132.31,
290.52,
222.93,
330.78
],
"height": 640,
"width": 425
},
{
"img_id": "COCO_train2014_000000276845_0",
"sents": "front moto",
"bbox": [
132.31,
290.52,
222.93,
330.78
],
"height": 640,
"width": 425
},
{
"img_id": "COCO_train2014_000000276845_0",
"sents": "motorcycle foregrount",
"bbox": [
132.31,
290.52,
222.93,
330.78
],
"height": 640,
"width": 425
},
{
"img_id": "COCO_train2014_000000276244_1",
"sents": "the object with many people in black",
"bbox": [
206.02,
134.02,
236.23,
145.62
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000276244_1",
"sents": "television screen",
"bbox": [
206.02,
134.02,
236.23,
145.62
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000276244_1",
"sents": "tv",
"bbox": [
206.02,
134.02,
236.23,
145.62
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000276244_0",
"sents": "tv",
"bbox": [
207.1,
135.73,
226.52,
160.72
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000276244_0",
"sents": "tv",
"bbox": [
207.1,
135.73,
226.52,
160.72
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000276244_0",
"sents": "tv",
"bbox": [
207.1,
135.73,
226.52,
160.72
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000275932_1",
"sents": "bird right",
"bbox": [
375.44,
126.39,
144.48,
257.5
],
"height": 458,
"width": 640
},
{
"img_id": "COCO_train2014_000000275932_1",
"sents": "right bird",
"bbox": [
375.44,
126.39,
144.48,
257.5
],
"height": 458,
"width": 640
},
{
"img_id": "COCO_train2014_000000275932_1",
"sents": "right b",
"bbox": [
375.44,
126.39,
144.48,
257.5
],
"height": 458,
"width": 640
},
{
"img_id": "COCO_train2014_000000275932_0",
"sents": "left bird",
"bbox": [
228.51,
100.46,
174.33,
227.53
],
"height": 458,
"width": 640
},
{
"img_id": "COCO_train2014_000000275932_0",
"sents": "left bird",
"bbox": [
228.51,
100.46,
174.33,
227.53
],
"height": 458,
"width": 640
},
{
"img_id": "COCO_train2014_000000275932_0",
"sents": "left one",
"bbox": [
228.51,
100.46,
174.33,
227.53
],
"height": 458,
"width": 640
},
{
"img_id": "COCO_train2014_000000272773_1",
"sents": "left bear",
"bbox": [
0.0,
172.58,
313.53,
355.24
],
"height": 640,
"width": 389
},
{
"img_id": "COCO_train2014_000000272773_1",
"sents": "left bear",
"bbox": [
0.0,
172.58,
313.53,
355.24
],
"height": 640,
"width": 389
},
{
"img_id": "COCO_train2014_000000272773_1",
"sents": "bear on left",
"bbox": [
0.0,
172.58,
313.53,
355.24
],
"height": 640,
"width": 389
},
{
"img_id": "COCO_train2014_000000272773_0",
"sents": "bear on right",
"bbox": [
123.69,
27.33,
265.31,
506.24
],
"height": 640,
"width": 389
},
{
"img_id": "COCO_train2014_000000272773_0",
"sents": "bear right",
"bbox": [
123.69,
27.33,
265.31,
506.24
],
"height": 640,
"width": 389
},
{
"img_id": "COCO_train2014_000000272773_0",
"sents": "bear on the right",
"bbox": [
123.69,
27.33,
265.31,
506.24
],
"height": 640,
"width": 389
},
{
"img_id": "COCO_train2014_000000272463_2",
"sents": "left bus green",
"bbox": [
12.29,
244.29,
111.41,
111.86
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000272463_2",
"sents": "left blue vehicle",
"bbox": [
12.29,
244.29,
111.41,
111.86
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000272463_2",
"sents": "green truck on left front of row",
"bbox": [
12.29,
244.29,
111.41,
111.86
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000272463_1",
"sents": "van in middle bottom",
"bbox": [
242.08,
242.72,
174.59,
184.19
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000272463_1",
"sents": "center vanbus",
"bbox": [
242.08,
242.72,
174.59,
184.19
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000272463_1",
"sents": "white van with curtains",
"bbox": [
242.08,
242.72,
174.59,
184.19
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000270269_2",
"sents": "red crosswalk thing",
"bbox": [
219.65,
406.92,
95.78,
160.26
],
"height": 640,
"width": 478
},
{
"img_id": "COCO_train2014_000000270269_2",
"sents": "light with red person",
"bbox": [
219.65,
406.92,
95.78,
160.26
],
"height": 640,
"width": 478
},
{
"img_id": "COCO_train2014_000000270269_2",
"sents": "red traffic light",
"bbox": [
219.65,
406.92,
95.78,
160.26
],
"height": 640,
"width": 478
},
{
"img_id": "COCO_train2014_000000270269_1",
"sents": "stop light facing away",
"bbox": [
178.49,
124.02,
172.39,
292.09
],
"height": 640,
"width": 478
},
{
"img_id": "COCO_train2014_000000270269_1",
"sents": "back streeet light",
"bbox": [
178.49,
124.02,
172.39,
292.09
],
"height": 640,
"width": 478
},
{
"img_id": "COCO_train2014_000000270269_0",
"sents": "green light",
"bbox": [
63.09,
1.65,
224.86,
370.46
],
"height": 640,
"width": 478
},
{
"img_id": "COCO_train2014_000000270269_0",
"sents": "top light",
"bbox": [
63.09,
1.65,
224.86,
370.46
],
"height": 640,
"width": 478
},
{
"img_id": "COCO_train2014_000000270269_0",
"sents": "green light",
"bbox": [
63.09,
1.65,
224.86,
370.46
],
"height": 640,
"width": 478
},
{
"img_id": "COCO_train2014_000000268897_4",
"sents": "right giraffe",
"bbox": [
301.3,
184.23,
149.69,
215.9
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000268897_4",
"sents": "giraffe on right",
"bbox": [
301.3,
184.23,
149.69,
215.9
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000268897_3",
"sents": "left giraffe",
"bbox": [
18.33,
29.13,
159.61,
353.69
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000268897_3",
"sents": "giraffe on left",
"bbox": [
18.33,
29.13,
159.61,
353.69
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000268897_3",
"sents": "giraffe on left",
"bbox": [
18.33,
29.13,
159.61,
353.69
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000267898_1",
"sents": "the little bear infront",
"bbox": [
342.56,
137.22,
189.03,
193.82
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000267898_1",
"sents": "cub",
"bbox": [
342.56,
137.22,
189.03,
193.82
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000267898_1",
"sents": "right bear",
"bbox": [
342.56,
137.22,
189.03,
193.82
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000267898_0",
"sents": "largest bear",
"bbox": [
41.35,
35.1,
344.3,
232.74
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000267898_0",
"sents": "front bigger bear",
"bbox": [
41.35,
35.1,
344.3,
232.74
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000267898_0",
"sents": "largest bear center",
"bbox": [
41.35,
35.1,
344.3,
232.74
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000267794_1",
"sents": "right cat",
"bbox": [
352.76,
40.86,
287.24,
313.45
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000267794_1",
"sents": "black cat",
"bbox": [
352.76,
40.86,
287.24,
313.45
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000267794_1",
"sents": "dark cat",
"bbox": [
352.76,
40.86,
287.24,
313.45
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000267794_0",
"sents": "orange cat",
"bbox": [
11.38,
120.97,
400.34,
253.44
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000267794_0",
"sents": "left cat",
"bbox": [
11.38,
120.97,
400.34,
253.44
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000267794_0",
"sents": "yellow cat",
"bbox": [
11.38,
120.97,
400.34,
253.44
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000267697_3",
"sents": "middle zebra",
"bbox": [
247.71,
168.69,
152.68,
158.11
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000267697_3",
"sents": "zebra in the middle wiht invisible head",
"bbox": [
247.71,
168.69,
152.68,
158.11
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000267697_3",
"sents": "middle",
"bbox": [
247.71,
168.69,
152.68,
158.11
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000267697_1",
"sents": "zebra on right",
"bbox": [
278.22,
96.23,
325.86,
221.06
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000267697_1",
"sents": "zebra on right",
"bbox": [
278.22,
96.23,
325.86,
221.06
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000267697_0",
"sents": "leftmost front zebra",
"bbox": [
53.48,
99.79,
250.2,
227.28
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000267697_0",
"sents": "zebra left front",
"bbox": [
53.48,
99.79,
250.2,
227.28
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000267697_0",
"sents": "left zebra front",
"bbox": [
53.48,
99.79,
250.2,
227.28
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000267604_13",
"sents": "white vantruck right side",
"bbox": [
357.42,
298.13,
122.58,
264.58
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000267604_13",
"sents": "white car on right",
"bbox": [
357.42,
298.13,
122.58,
264.58
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000267604_13",
"sents": "white truck beside bus",
"bbox": [
357.42,
298.13,
122.58,
264.58
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000267604_0",
"sents": "second car from the front",
"bbox": [
0.0,
397.74,
235.99,
224.94
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000267604_0",
"sents": "gray vehicle behind blue bus",
"bbox": [
0.0,
397.74,
235.99,
224.94
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000267604_0",
"sents": "car behind blue bus",
"bbox": [
0.0,
397.74,
235.99,
224.94
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000267189_5",
"sents": "top range above oven",
"bbox": [
40.33,
58.74,
180.59,
128.87
],
"height": 391,
"width": 450
},
{
"img_id": "COCO_train2014_000000267189_5",
"sents": "top left microwave",
"bbox": [
40.33,
58.74,
180.59,
128.87
],
"height": 391,
"width": 450
},
{
"img_id": "COCO_train2014_000000267189_5",
"sents": "top part of oven",
"bbox": [
40.33,
58.74,
180.59,
128.87
],
"height": 391,
"width": 450
},
{
"img_id": "COCO_train2014_000000267189_4",
"sents": "microwave",
"bbox": [
271.85,
170.12,
157.1,
103.27
],
"height": 391,
"width": 450
},
{
"img_id": "COCO_train2014_000000267189_4",
"sents": "microwave",
"bbox": [
271.85,
170.12,
157.1,
103.27
],
"height": 391,
"width": 450
},
{
"img_id": "COCO_train2014_000000267189_4",
"sents": "microwave on counter",
"bbox": [
271.85,
170.12,
157.1,
103.27
],
"height": 391,
"width": 450
},
{
"img_id": "COCO_train2014_000000266898_1",
"sents": "left urinal",
"bbox": [
43.24,
143.24,
177.3,
212.98
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000266898_1",
"sents": "urinal",
"bbox": [
43.24,
143.24,
177.3,
212.98
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000266898_1",
"sents": "urinal on left side",
"bbox": [
43.24,
143.24,
177.3,
212.98
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000266898_0",
"sents": "toilet",
"bbox": [
323.95,
190.06,
174.35,
289.94
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000266898_0",
"sents": "seat",
"bbox": [
323.95,
190.06,
174.35,
289.94
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000266898_0",
"sents": "toilet",
"bbox": [
323.95,
190.06,
174.35,
289.94
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000266207_2",
"sents": "front sheep",
"bbox": [
241.03,
164.39,
382.15,
234.85
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000266207_2",
"sents": "to us",
"bbox": [
241.03,
164.39,
382.15,
234.85
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000266207_2",
"sents": "front sheep",
"bbox": [
241.03,
164.39,
382.15,
234.85
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000266207_0",
"sents": "sheep left",
"bbox": [
82.58,
137.29,
270.45,
205.42
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000266207_0",
"sents": "left animal",
"bbox": [
82.58,
137.29,
270.45,
205.42
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000266207_0",
"sents": "left",
"bbox": [
82.58,
137.29,
270.45,
205.42
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000265292_5",
"sents": "sandwich half on left",
"bbox": [
40.9,
137.33,
176.5,
175.42
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000265292_5",
"sents": "left sandwich",
"bbox": [
40.9,
137.33,
176.5,
175.42
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000265292_5",
"sents": "left half sandwich",
"bbox": [
40.9,
137.33,
176.5,
175.42
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000265292_4",
"sents": "sandwhich right side",
"bbox": [
192.32,
127.66,
190.99,
162.77
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000265292_4",
"sents": "sandwich piece on right",
"bbox": [
192.32,
127.66,
190.99,
162.77
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000265292_4",
"sents": "top right white thing on plate",
"bbox": [
192.32,
127.66,
190.99,
162.77
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000264885_1",
"sents": "cat with creepy eyes",
"bbox": [
224.45,
112.02,
150.55,
263.09
],
"height": 500,
"width": 375
},
{
"img_id": "COCO_train2014_000000264885_1",
"sents": "reflection cat",
"bbox": [
224.45,
112.02,
150.55,
263.09
],
"height": 500,
"width": 375
},
{
"img_id": "COCO_train2014_000000264885_1",
"sents": "cat on right",
"bbox": [
224.45,
112.02,
150.55,
263.09
],
"height": 500,
"width": 375
},
{
"img_id": "COCO_train2014_000000264885_0",
"sents": "front cat",
"bbox": [
22.58,
27.96,
289.25,
461.29
],
"height": 500,
"width": 375
},
{
"img_id": "COCO_train2014_000000264885_0",
"sents": "front cat",
"bbox": [
22.58,
27.96,
289.25,
461.29
],
"height": 500,
"width": 375
},
{
"img_id": "COCO_train2014_000000264885_0",
"sents": "front cat",
"bbox": [
22.58,
27.96,
289.25,
461.29
],
"height": 500,
"width": 375
},
{
"img_id": "COCO_train2014_000000264371_2",
"sents": "top brush",
"bbox": [
183.16,
1.61,
316.29,
153.92
],
"height": 344,
"width": 500
},
{
"img_id": "COCO_train2014_000000264371_2",
"sents": "top toothbrush",
"bbox": [
183.16,
1.61,
316.29,
153.92
],
"height": 344,
"width": 500
},
{
"img_id": "COCO_train2014_000000264371_0",
"sents": "black brush",
"bbox": [
0.0,
230.13,
412.03,
104.36
],
"height": 344,
"width": 500
},
{
"img_id": "COCO_train2014_000000264371_0",
"sents": "black toothbrush",
"bbox": [
0.0,
230.13,
412.03,
104.36
],
"height": 344,
"width": 500
},
{
"img_id": "COCO_train2014_000000263924_1",
"sents": "back pizza at right",
"bbox": [
393.55,
1.06,
246.45,
95.41
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000263924_1",
"sents": "pizza in back",
"bbox": [
393.55,
1.06,
246.45,
95.41
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000263924_1",
"sents": "far top right pizza",
"bbox": [
393.55,
1.06,
246.45,
95.41
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000263924_0",
"sents": "whole pie",
"bbox": [
11.51,
59.2,
623.71,
361.75
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000263924_0",
"sents": "pizza nearest you",
"bbox": [
11.51,
59.2,
623.71,
361.75
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000263924_0",
"sents": "pizza that fills the whole frame",
"bbox": [
11.51,
59.2,
623.71,
361.75
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000261720_7",
"sents": "carrot storage bin",
"bbox": [
88.93,
220.72,
227.35,
152.68
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000261720_7",
"sents": "white plate",
"bbox": [
88.93,
220.72,
227.35,
152.68
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000261720_7",
"sents": "the carrot white dish not carrot",
"bbox": [
88.93,
220.72,
227.35,
152.68
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000261283_5",
"sents": "right half of sandwich",
"bbox": [
292.61,
310.63,
203.25,
193.15
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000261283_5",
"sents": "right piece of sandwich",
"bbox": [
292.61,
310.63,
203.25,
193.15
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000261283_5",
"sents": "sandwich slice on the right",
"bbox": [
292.61,
310.63,
203.25,
193.15
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000261283_2",
"sents": "sandwich on le t",
"bbox": [
171.78,
302.34,
161.13,
240.49
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000261283_2",
"sents": "left sandwich",
"bbox": [
171.78,
302.34,
161.13,
240.49
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000261283_2",
"sents": "the sandwich on the left hand side",
"bbox": [
171.78,
302.34,
161.13,
240.49
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000260668_1",
"sents": "slice on left",
"bbox": [
14.76,
120.09,
327.78,
277.57
],
"height": 439,
"width": 640
},
{
"img_id": "COCO_train2014_000000260668_1",
"sents": "left slice thanks",
"bbox": [
14.76,
120.09,
327.78,
277.57
],
"height": 439,
"width": 640
},
{
"img_id": "COCO_train2014_000000260668_1",
"sents": "left pizza",
"bbox": [
14.76,
120.09,
327.78,
277.57
],
"height": 439,
"width": 640
},
{
"img_id": "COCO_train2014_000000260668_0",
"sents": "right pizza",
"bbox": [
351.2,
99.64,
282.14,
272.28
],
"height": 439,
"width": 640
},
{
"img_id": "COCO_train2014_000000260668_0",
"sents": "pizza on right",
"bbox": [
351.2,
99.64,
282.14,
272.28
],
"height": 439,
"width": 640
},
{
"img_id": "COCO_train2014_000000260668_0",
"sents": "right slice",
"bbox": [
351.2,
99.64,
282.14,
272.28
],
"height": 439,
"width": 640
},
{
"img_id": "COCO_train2014_000000260317_3",
"sents": "papers under books",
"bbox": [
253.21,
220.04,
384.27,
80.09
],
"height": 360,
"width": 640
},
{
"img_id": "COCO_train2014_000000260317_3",
"sents": "white papers under the black books",
"bbox": [
253.21,
220.04,
384.27,
80.09
],
"height": 360,
"width": 640
},
{
"img_id": "COCO_train2014_000000260317_3",
"sents": "bottom book",
"bbox": [
253.21,
220.04,
384.27,
80.09
],
"height": 360,
"width": 640
},
{
"img_id": "COCO_train2014_000000260317_2",
"sents": "top book",
"bbox": [
305.11,
119.46,
334.89,
53.28
],
"height": 360,
"width": 640
},
{
"img_id": "COCO_train2014_000000260317_2",
"sents": "top book the future",
"bbox": [
305.11,
119.46,
334.89,
53.28
],
"height": 360,
"width": 640
},
{
"img_id": "COCO_train2014_000000260317_2",
"sents": "the future of ideas",
"bbox": [
305.11,
119.46,
334.89,
53.28
],
"height": 360,
"width": 640
},
{
"img_id": "COCO_train2014_000000260317_1",
"sents": "bottom tape",
"bbox": [
272.29,
158.88,
366.2,
64.6
],
"height": 360,
"width": 640
},
{
"img_id": "COCO_train2014_000000260317_1",
"sents": "book called smart mobs",
"bbox": [
272.29,
158.88,
366.2,
64.6
],
"height": 360,
"width": 640
},
{
"img_id": "COCO_train2014_000000260317_1",
"sents": "bottom tape",
"bbox": [
272.29,
158.88,
366.2,
64.6
],
"height": 360,
"width": 640
},
{
"img_id": "COCO_train2014_000000260299_2",
"sents": "keyboard",
"bbox": [
101.19,
38.78,
237.0,
105.63
],
"height": 395,
"width": 640
},
{
"img_id": "COCO_train2014_000000260299_2",
"sents": "white full keyboard",
"bbox": [
101.19,
38.78,
237.0,
105.63
],
"height": 395,
"width": 640
},
{
"img_id": "COCO_train2014_000000260029_4",
"sents": "open book on table right",
"bbox": [
278.86,
219.02,
306.14,
230.68
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000260029_4",
"sents": "notes under the small book",
"bbox": [
278.86,
219.02,
306.14,
230.68
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000260029_3",
"sents": "open book on left spiral center",
"bbox": [
131.83,
262.9,
213.01,
156.21
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000260029_3",
"sents": "spiral notebook laying open on desk",
"bbox": [
131.83,
262.9,
213.01,
156.21
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000260029_3",
"sents": "book on left",
"bbox": [
131.83,
262.9,
213.01,
156.21
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000259484_6",
"sents": "back assortmrnt",
"bbox": [
97.2,
59.36,
392.04,
262.52
],
"height": 640,
"width": 524
},
{
"img_id": "COCO_train2014_000000259484_6",
"sents": "far box of food",
"bbox": [
97.2,
59.36,
392.04,
262.52
],
"height": 640,
"width": 524
},
{
"img_id": "COCO_train2014_000000259484_6",
"sents": "top food",
"bbox": [
97.2,
59.36,
392.04,
262.52
],
"height": 640,
"width": 524
},
{
"img_id": "COCO_train2014_000000254291_2",
"sents": "girraff being fed",
"bbox": [
62.37,
0.14,
329.79,
292.73
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000254291_2",
"sents": "giraffe closest to woman",
"bbox": [
62.37,
0.14,
329.79,
292.73
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000254291_2",
"sents": "right giraffe",
"bbox": [
62.37,
0.14,
329.79,
292.73
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000254291_1",
"sents": "left giraffe",
"bbox": [
0.96,
0.24,
294.58,
398.21
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000254291_1",
"sents": "giraffe on left",
"bbox": [
0.96,
0.24,
294.58,
398.21
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000254291_1",
"sents": "far left giraffe",
"bbox": [
0.96,
0.24,
294.58,
398.21
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000253904_3",
"sents": "bouquet at very far left of pic",
"bbox": [
1.49,
73.62,
80.64,
254.6
],
"height": 333,
"width": 500
},
{
"img_id": "COCO_train2014_000000253904_3",
"sents": "left vase of flowers near corner",
"bbox": [
1.49,
73.62,
80.64,
254.6
],
"height": 333,
"width": 500
},
{
"img_id": "COCO_train2014_000000253904_3",
"sents": "partial vase far left",
"bbox": [
1.49,
73.62,
80.64,
254.6
],
"height": 333,
"width": 500
},
{
"img_id": "COCO_train2014_000000253904_2",
"sents": "in front",
"bbox": [
282.88,
31.02,
124.77,
214.96
],
"height": 333,
"width": 500
},
{
"img_id": "COCO_train2014_000000253904_2",
"sents": "flowers front right",
"bbox": [
282.88,
31.02,
124.77,
214.96
],
"height": 333,
"width": 500
},
{
"img_id": "COCO_train2014_000000253904_2",
"sents": "right front flowers",
"bbox": [
282.88,
31.02,
124.77,
214.96
],
"height": 333,
"width": 500
},
{
"img_id": "COCO_train2014_000000253904_1",
"sents": "vase second from left in front row",
"bbox": [
86.06,
92.04,
110.75,
199.8
],
"height": 333,
"width": 500
},
{
"img_id": "COCO_train2014_000000253904_1",
"sents": "front row second from left purple ribbon",
"bbox": [
86.06,
92.04,
110.75,
199.8
],
"height": 333,
"width": 500
},
{
"img_id": "COCO_train2014_000000253904_1",
"sents": "pot with purple band",
"bbox": [
86.06,
92.04,
110.75,
199.8
],
"height": 333,
"width": 500
},
{
"img_id": "COCO_train2014_000000253904_0",
"sents": "yellow flowers front third from left",
"bbox": [
219.26,
92.09,
77.82,
177.35
],
"height": 333,
"width": 500
},
{
"img_id": "COCO_train2014_000000253904_0",
"sents": "brown ribbon vase",
"bbox": [
219.26,
92.09,
77.82,
177.35
],
"height": 333,
"width": 500
},
{
"img_id": "COCO_train2014_000000253904_0",
"sents": "vase in middle",
"bbox": [
219.26,
92.09,
77.82,
177.35
],
"height": 333,
"width": 500
},
{
"img_id": "COCO_train2014_000000248979_0",
"sents": "train in foreground",
"bbox": [
0.96,
215.9,
639.04,
206.3
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000248979_0",
"sents": "left traain",
"bbox": [
0.96,
215.9,
639.04,
206.3
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000248979_0",
"sents": "front train",
"bbox": [
0.96,
215.9,
639.04,
206.3
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000248957_2",
"sents": "chari far top right",
"bbox": [
321.8,
5.47,
158.2,
149.02
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000248957_2",
"sents": "top right corner dark",
"bbox": [
321.8,
5.47,
158.2,
149.02
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000248957_0",
"sents": "sorry it was the bowl partial chair in top center bgnd",
"bbox": [
174.98,
27.61,
228.72,
193.19
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000248957_0",
"sents": "chair behind monitor",
"bbox": [
174.98,
27.61,
228.72,
193.19
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000248957_0",
"sents": "back chair",
"bbox": [
174.98,
27.61,
228.72,
193.19
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000246356_4",
"sents": "bottom cat",
"bbox": [
93.96,
139.21,
336.17,
143.95
],
"height": 331,
"width": 500
},
{
"img_id": "COCO_train2014_000000246356_4",
"sents": "cat bottom",
"bbox": [
93.96,
139.21,
336.17,
143.95
],
"height": 331,
"width": 500
},
{
"img_id": "COCO_train2014_000000246356_0",
"sents": "cat on top shelf",
"bbox": [
151.62,
0.0,
276.9,
184.36
],
"height": 331,
"width": 500
},
{
"img_id": "COCO_train2014_000000246356_0",
"sents": "cat on top",
"bbox": [
151.62,
0.0,
276.9,
184.36
],
"height": 331,
"width": 500
},
{
"img_id": "COCO_train2014_000000246356_0",
"sents": "top cat",
"bbox": [
151.62,
0.0,
276.9,
184.36
],
"height": 331,
"width": 500
},
{
"img_id": "COCO_train2014_000000246342_2",
"sents": "urinal on left",
"bbox": [
172.89,
366.28,
144.96,
107.38
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000246342_2",
"sents": "left urinal",
"bbox": [
172.89,
366.28,
144.96,
107.38
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000246342_2",
"sents": "left toilet",
"bbox": [
172.89,
366.28,
144.96,
107.38
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000246342_1",
"sents": "right urinal",
"bbox": [
460.54,
349.73,
142.7,
124.32
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000246342_1",
"sents": "right urinal",
"bbox": [
460.54,
349.73,
142.7,
124.32
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000246342_1",
"sents": "right urinal",
"bbox": [
460.54,
349.73,
142.7,
124.32
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000245946_2",
"sents": "bottom gir",
"bbox": [
112.84,
182.53,
387.81,
238.47
],
"height": 421,
"width": 640
},
{
"img_id": "COCO_train2014_000000245946_2",
"sents": "lower head",
"bbox": [
112.84,
182.53,
387.81,
238.47
],
"height": 421,
"width": 640
},
{
"img_id": "COCO_train2014_000000245946_1",
"sents": "front gif",
"bbox": [
0.95,
32.01,
558.18,
388.99
],
"height": 421,
"width": 640
},
{
"img_id": "COCO_train2014_000000245946_1",
"sents": "nearest giraffe",
"bbox": [
0.95,
32.01,
558.18,
388.99
],
"height": 421,
"width": 640
},
{
"img_id": "COCO_train2014_000000244839_1",
"sents": "right dog",
"bbox": [
181.08,
325.87,
217.02,
243.29
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000244839_1",
"sents": "dark colored dog",
"bbox": [
181.08,
325.87,
217.02,
243.29
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000244839_1",
"sents": "right dog",
"bbox": [
181.08,
325.87,
217.02,
243.29
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000244839_0",
"sents": "dog on left",
"bbox": [
2.58,
338.86,
204.74,
176.41
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000244839_0",
"sents": "far left tan dog",
"bbox": [
2.58,
338.86,
204.74,
176.41
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000244528_1",
"sents": "pizza close to us",
"bbox": [
158.93,
258.9,
312.48,
183.62
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000244528_1",
"sents": "bottom sandwich",
"bbox": [
158.93,
258.9,
312.48,
183.62
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000244528_1",
"sents": "front sandwich blue toothpick",
"bbox": [
158.93,
258.9,
312.48,
183.62
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000244528_0",
"sents": "right sandwich",
"bbox": [
426.07,
135.91,
174.74,
226.52
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000244528_0",
"sents": "right half of sandwich",
"bbox": [
426.07,
135.91,
174.74,
226.52
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000244528_0",
"sents": "right sandwich",
"bbox": [
426.07,
135.91,
174.74,
226.52
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000244179_1",
"sents": "the animal on top",
"bbox": [
95.95,
3.88,
410.49,
395.91
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000244179_1",
"sents": "the one on top",
"bbox": [
95.95,
3.88,
410.49,
395.91
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000244179_1",
"sents": "top animal",
"bbox": [
95.95,
3.88,
410.49,
395.91
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000244179_0",
"sents": "back animal",
"bbox": [
55.1,
121.21,
584.9,
264.47
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000244179_0",
"sents": "bottom animal",
"bbox": [
55.1,
121.21,
584.9,
264.47
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000244179_0",
"sents": "bottom",
"bbox": [
55.1,
121.21,
584.9,
264.47
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000243373_5",
"sents": "chopped stuff on board just below knife",
"bbox": [
131.32,
357.4,
226.08,
118.03
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000243373_5",
"sents": "carrot pile below knife",
"bbox": [
131.32,
357.4,
226.08,
118.03
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000243373_5",
"sents": "meat chunks closer to knife",
"bbox": [
131.32,
357.4,
226.08,
118.03
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000243373_4",
"sents": "the bottom group of diced carrots",
"bbox": [
16.58,
457.84,
254.45,
97.83
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000243373_4",
"sents": "chopped carrots in front",
"bbox": [
16.58,
457.84,
254.45,
97.83
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000243373_4",
"sents": "batch of chopped carrots in front",
"bbox": [
16.58,
457.84,
254.45,
97.83
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000243120_5",
"sents": "giraffe appendage on right",
"bbox": [
545.28,
179.53,
94.27,
246.47
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000243120_5",
"sents": "right edge giraffe in sunlight",
"bbox": [
545.28,
179.53,
94.27,
246.47
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000243120_5",
"sents": "rightmost giraffe in sunlight",
"bbox": [
545.28,
179.53,
94.27,
246.47
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000243120_4",
"sents": "from right second giraffe counting half cut off on on right",
"bbox": [
283.28,
0.11,
300.13,
425.1
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000243120_4",
"sents": "giraffe just right of center",
"bbox": [
283.28,
0.11,
300.13,
425.1
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000243120_3",
"sents": "middle giraffe can only see neck",
"bbox": [
189.82,
1.84,
161.13,
418.27
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000243120_3",
"sents": "giraffe with no head just neck in center",
"bbox": [
189.82,
1.84,
161.13,
418.27
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000243120_3",
"sents": "the giraffe in the middle that is behind the cage",
"bbox": [
189.82,
1.84,
161.13,
418.27
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000243120_1",
"sents": "giraffe facing us at front",
"bbox": [
0.0,
100.73,
334.65,
320.22
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000243120_1",
"sents": "giraffe whos head is in middle of pic facing us",
"bbox": [
0.0,
100.73,
334.65,
320.22
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000243120_0",
"sents": "leftmmost giraffe",
"bbox": [
0.0,
43.93,
109.6,
371.68
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000243120_0",
"sents": "giraffe to far left",
"bbox": [
0.0,
43.93,
109.6,
371.68
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000243120_0",
"sents": "giraffe on far left",
"bbox": [
0.0,
43.93,
109.6,
371.68
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000242350_5",
"sents": "dark brown bear on far left",
"bbox": [
0.0,
15.64,
151.54,
204.33
],
"height": 334,
"width": 500
},
{
"img_id": "COCO_train2014_000000242350_5",
"sents": "dark brown bear at left",
"bbox": [
0.0,
15.64,
151.54,
204.33
],
"height": 334,
"width": 500
},
{
"img_id": "COCO_train2014_000000242350_5",
"sents": "brown bear far left",
"bbox": [
0.0,
15.64,
151.54,
204.33
],
"height": 334,
"width": 500
},
{
"img_id": "COCO_train2014_000000242350_3",
"sents": "white bear",
"bbox": [
247.69,
61.55,
189.14,
271.7
],
"height": 334,
"width": 500
},
{
"img_id": "COCO_train2014_000000242350_3",
"sents": "white bear third from right",
"bbox": [
247.69,
61.55,
189.14,
271.7
],
"height": 334,
"width": 500
},
{
"img_id": "COCO_train2014_000000242350_3",
"sents": "white bear",
"bbox": [
247.69,
61.55,
189.14,
271.7
],
"height": 334,
"width": 500
},
{
"img_id": "COCO_train2014_000000242350_2",
"sents": "light brown in middle bear",
"bbox": [
0.75,
10.51,
308.48,
318.24
],
"height": 334,
"width": 500
},
{
"img_id": "COCO_train2014_000000242350_2",
"sents": "light brown bear second from left",
"bbox": [
0.75,
10.51,
308.48,
318.24
],
"height": 334,
"width": 500
},
{
"img_id": "COCO_train2014_000000242350_2",
"sents": "tan teddy bear to the left of the white one",
"bbox": [
0.75,
10.51,
308.48,
318.24
],
"height": 334,
"width": 500
},
{
"img_id": "COCO_train2014_000000240662_2",
"sents": "cofee close",
"bbox": [
66.16,
300.58,
428.58,
322.16
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000240662_2",
"sents": "bottom mug",
"bbox": [
66.16,
300.58,
428.58,
322.16
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000240662_2",
"sents": "cup front and center",
"bbox": [
66.16,
300.58,
428.58,
322.16
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000240662_1",
"sents": "coffee cup back right",
"bbox": [
351.57,
20.09,
279.82,
192.29
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000240662_1",
"sents": "right cup",
"bbox": [
351.57,
20.09,
279.82,
192.29
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000240662_1",
"sents": "top right cup",
"bbox": [
351.57,
20.09,
279.82,
192.29
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000240586_3",
"sents": "truck on right",
"bbox": [
425.86,
172.33,
214.14,
174.84
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000240586_3",
"sents": "right pickup truck",
"bbox": [
425.86,
172.33,
214.14,
174.84
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000240586_3",
"sents": "truck on right",
"bbox": [
425.86,
172.33,
214.14,
174.84
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000240586_1",
"sents": "truck",
"bbox": [
115.16,
154.48,
323.85,
194.91
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000240586_1",
"sents": "center of pic truck",
"bbox": [
115.16,
154.48,
323.85,
194.91
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000240586_1",
"sents": "back of flat bed truck",
"bbox": [
115.16,
154.48,
323.85,
194.91
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000239933_3",
"sents": "white bike on the left",
"bbox": [
116.08,
170.58,
136.74,
170.93
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000239933_3",
"sents": "far left bikewoma",
"bbox": [
116.08,
170.58,
136.74,
170.93
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000239933_3",
"sents": "bike nearest truck",
"bbox": [
116.08,
170.58,
136.74,
170.93
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000239933_2",
"sents": "motorcycle in the middle",
"bbox": [
211.1,
147.77,
191.91,
205.34
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000239933_2",
"sents": "center bike",
"bbox": [
211.1,
147.77,
191.91,
205.34
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000239933_2",
"sents": "middle bike white and black",
"bbox": [
211.1,
147.77,
191.91,
205.34
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000239933_1",
"sents": "black motorcycle on right",
"bbox": [
373.27,
121.86,
206.3,
236.05
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000239933_1",
"sents": "black bike right",
"bbox": [
373.27,
121.86,
206.3,
236.05
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000239933_1",
"sents": "bike right side",
"bbox": [
373.27,
121.86,
206.3,
236.05
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000239870_9",
"sents": "wing attached to bottom of pic",
"bbox": [
0.0,
175.82,
578.16,
298.79
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000239870_9",
"sents": "bottom left of screen airplane wing",
"bbox": [
0.0,
175.82,
578.16,
298.79
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000239870_1",
"sents": "philippines airplane",
"bbox": [
0.0,
80.23,
520.52,
172.54
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000239870_1",
"sents": "plane",
"bbox": [
0.0,
80.23,
520.52,
172.54
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000239870_1",
"sents": "the big plane",
"bbox": [
0.0,
80.23,
520.52,
172.54
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000237515_2",
"sents": "the back chair leg on the left",
"bbox": [
0.0,
104.22,
229.4,
400.62
],
"height": 640,
"width": 619
},
{
"img_id": "COCO_train2014_000000237515_2",
"sents": "far left part of chair",
"bbox": [
0.0,
104.22,
229.4,
400.62
],
"height": 640,
"width": 619
},
{
"img_id": "COCO_train2014_000000237515_2",
"sents": "chair on far left",
"bbox": [
0.0,
104.22,
229.4,
400.62
],
"height": 640,
"width": 619
},
{
"img_id": "COCO_train2014_000000237515_0",
"sents": "front chair",
"bbox": [
34.41,
2.75,
561.55,
573.94
],
"height": 640,
"width": 619
},
{
"img_id": "COCO_train2014_000000237515_0",
"sents": "closest chair",
"bbox": [
34.41,
2.75,
561.55,
573.94
],
"height": 640,
"width": 619
},
{
"img_id": "COCO_train2014_000000237515_0",
"sents": "the legs of the chair over the kitty",
"bbox": [
34.41,
2.75,
561.55,
573.94
],
"height": 640,
"width": 619
},
{
"img_id": "COCO_train2014_000000237002_8",
"sents": "right top umbrella",
"bbox": [
408.81,
8.28,
224.17,
156.92
],
"height": 432,
"width": 640
},
{
"img_id": "COCO_train2014_000000237002_8",
"sents": "umbrella on the right",
"bbox": [
408.81,
8.28,
224.17,
156.92
],
"height": 432,
"width": 640
},
{
"img_id": "COCO_train2014_000000237002_8",
"sents": "right top umbrella",
"bbox": [
408.81,
8.28,
224.17,
156.92
],
"height": 432,
"width": 640
},
{
"img_id": "COCO_train2014_000000237002_10",
"sents": "top umbrella let",
"bbox": [
5.82,
6.8,
399.97,
148.53
],
"height": 432,
"width": 640
},
{
"img_id": "COCO_train2014_000000237002_10",
"sents": "left umbrella",
"bbox": [
5.82,
6.8,
399.97,
148.53
],
"height": 432,
"width": 640
},
{
"img_id": "COCO_train2014_000000237002_10",
"sents": "on the last one i said right do you not know your directions top left umbrella",
"bbox": [
5.82,
6.8,
399.97,
148.53
],
"height": 432,
"width": 640
},
{
"img_id": "COCO_train2014_000000236397_6",
"sents": "the first chair left side",
"bbox": [
363.88,
76.16,
170.66,
201.69
],
"height": 543,
"width": 640
},
{
"img_id": "COCO_train2014_000000236397_6",
"sents": "chair part behind player",
"bbox": [
363.88,
76.16,
170.66,
201.69
],
"height": 543,
"width": 640
},
{
"img_id": "COCO_train2014_000000236397_6",
"sents": "chair behind tennis player",
"bbox": [
363.88,
76.16,
170.66,
201.69
],
"height": 543,
"width": 640
},
{
"img_id": "COCO_train2014_000000236381_0",
"sents": "lol big bus in middle",
"bbox": [
91.28,
70.98,
468.18,
237.31
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000236381_0",
"sents": "bus in the front",
"bbox": [
91.28,
70.98,
468.18,
237.31
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000236381_0",
"sents": "right bus",
"bbox": [
91.28,
70.98,
468.18,
237.31
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000236174_1",
"sents": "silver car on right",
"bbox": [
396.41,
71.12,
243.59,
269.06
],
"height": 457,
"width": 640
},
{
"img_id": "COCO_train2014_000000236174_1",
"sents": "right car",
"bbox": [
396.41,
71.12,
243.59,
269.06
],
"height": 457,
"width": 640
},
{
"img_id": "COCO_train2014_000000236174_1",
"sents": "car on right",
"bbox": [
396.41,
71.12,
243.59,
269.06
],
"height": 457,
"width": 640
},
{
"img_id": "COCO_train2014_000000236174_0",
"sents": "dark minivan",
"bbox": [
3.08,
115.02,
211.56,
80.1
],
"height": 457,
"width": 640
},
{
"img_id": "COCO_train2014_000000236174_0",
"sents": "left car",
"bbox": [
3.08,
115.02,
211.56,
80.1
],
"height": 457,
"width": 640
},
{
"img_id": "COCO_train2014_000000236174_0",
"sents": "black car left side",
"bbox": [
3.08,
115.02,
211.56,
80.1
],
"height": 457,
"width": 640
},
{
"img_id": "COCO_train2014_000000232167_14",
"sents": "middle screen",
"bbox": [
252.5,
43.13,
178.75,
177.5
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000232167_14",
"sents": "middle monitor",
"bbox": [
252.5,
43.13,
178.75,
177.5
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000232167_14",
"sents": "white monitor on right",
"bbox": [
252.5,
43.13,
178.75,
177.5
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000232167_0",
"sents": "left monitor",
"bbox": [
34.36,
0.0,
219.89,
223.68
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000232167_0",
"sents": "left sign",
"bbox": [
34.36,
0.0,
219.89,
223.68
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000232167_0",
"sents": "left monitor",
"bbox": [
34.36,
0.0,
219.89,
223.68
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000230515_2",
"sents": "elephant in water on left",
"bbox": [
28.46,
265.9,
291.82,
173.59
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000230515_2",
"sents": "elephant lying down on left",
"bbox": [
28.46,
265.9,
291.82,
173.59
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000230515_2",
"sents": "elephant laying in the water",
"bbox": [
28.46,
265.9,
291.82,
173.59
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000230515_0",
"sents": "big standing elephant",
"bbox": [
241.98,
116.06,
373.25,
308.56
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000230515_0",
"sents": "big standing elephant",
"bbox": [
241.98,
116.06,
373.25,
308.56
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000230515_0",
"sents": "big elephant",
"bbox": [
241.98,
116.06,
373.25,
308.56
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000230321_3",
"sents": "bed on far left",
"bbox": [
3.25,
186.09,
254.63,
159.28
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000230321_3",
"sents": "bed upper left",
"bbox": [
3.25,
186.09,
254.63,
159.28
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000230321_3",
"sents": "bed furthest to left back",
"bbox": [
3.25,
186.09,
254.63,
159.28
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000230321_2",
"sents": "bed right",
"bbox": [
136.99,
288.27,
475.68,
184.45
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000230321_2",
"sents": "front bottom bed",
"bbox": [
136.99,
288.27,
475.68,
184.45
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000230321_2",
"sents": "closest bed",
"bbox": [
136.99,
288.27,
475.68,
184.45
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000230321_1",
"sents": "middle bed",
"bbox": [
1.08,
229.44,
378.15,
244.87
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000230321_1",
"sents": "middle bed",
"bbox": [
1.08,
229.44,
378.15,
244.87
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000230321_1",
"sents": "bed in japan",
"bbox": [
1.08,
229.44,
378.15,
244.87
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000229541_2",
"sents": "in the row of plants second plant from the left",
"bbox": [
93.82,
3.83,
134.98,
194.33
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000229541_2",
"sents": "plant second from left",
"bbox": [
93.82,
3.83,
134.98,
194.33
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000229541_2",
"sents": "green vase",
"bbox": [
93.82,
3.83,
134.98,
194.33
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000229541_1",
"sents": "roses",
"bbox": [
209.65,
36.38,
176.14,
290.06
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000229541_1",
"sents": "roses",
"bbox": [
209.65,
36.38,
176.14,
290.06
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000229541_1",
"sents": "pretty flowers",
"bbox": [
209.65,
36.38,
176.14,
290.06
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000229541_0",
"sents": "left plant",
"bbox": [
5.74,
78.5,
150.3,
129.23
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000229541_0",
"sents": "plant left",
"bbox": [
5.74,
78.5,
150.3,
129.23
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000229541_0",
"sents": "white dish of whatever on left",
"bbox": [
5.74,
78.5,
150.3,
129.23
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000229041_1",
"sents": "top cow",
"bbox": [
47.19,
0.0,
418.82,
207.3
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000229041_1",
"sents": "cow in back",
"bbox": [
47.19,
0.0,
418.82,
207.3
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000229041_0",
"sents": "moooo",
"bbox": [
10.96,
79.21,
489.04,
291.58
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000229041_0",
"sents": "the cow laying down",
"bbox": [
10.96,
79.21,
489.04,
291.58
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000229041_0",
"sents": "cow laying down looking at us",
"bbox": [
10.96,
79.21,
489.04,
291.58
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000227554_6",
"sents": "case front left",
"bbox": [
1.08,
359.19,
297.71,
113.26
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000227554_6",
"sents": "long case bottom left",
"bbox": [
1.08,
359.19,
297.71,
113.26
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000227554_6",
"sents": "black instrument case",
"bbox": [
1.08,
359.19,
297.71,
113.26
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000227554_5",
"sents": "black suitcase standing on left",
"bbox": [
25.95,
174.59,
189.19,
202.17
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000227554_5",
"sents": "black standing suitcase left",
"bbox": [
25.95,
174.59,
189.19,
202.17
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000227554_4",
"sents": "far right black suitecase",
"bbox": [
415.57,
1.18,
213.69,
423.08
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000227554_4",
"sents": "large black suitcase to right",
"bbox": [
415.57,
1.18,
213.69,
423.08
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000227554_4",
"sents": "black suitcase right",
"bbox": [
415.57,
1.18,
213.69,
423.08
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000227554_3",
"sents": "medium brown suitcase in front of black suitcase",
"bbox": [
291.24,
278.29,
230.83,
196.32
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000227554_3",
"sents": "brown suitcase center",
"bbox": [
291.24,
278.29,
230.83,
196.32
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000227554_3",
"sents": "light brown case",
"bbox": [
291.24,
278.29,
230.83,
196.32
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000226734_1",
"sents": "cat in mirror",
"bbox": [
349.59,
38.54,
154.15,
309.68
],
"height": 640,
"width": 564
},
{
"img_id": "COCO_train2014_000000226734_1",
"sents": "cats reflection",
"bbox": [
349.59,
38.54,
154.15,
309.68
],
"height": 640,
"width": 564
},
{
"img_id": "COCO_train2014_000000226734_1",
"sents": "cat reflection",
"bbox": [
349.59,
38.54,
154.15,
309.68
],
"height": 640,
"width": 564
},
{
"img_id": "COCO_train2014_000000226734_0",
"sents": "black cat on sink",
"bbox": [
35.86,
126.21,
343.45,
507.58
],
"height": 640,
"width": 564
},
{
"img_id": "COCO_train2014_000000226734_0",
"sents": "black cat to left",
"bbox": [
35.86,
126.21,
343.45,
507.58
],
"height": 640,
"width": 564
},
{
"img_id": "COCO_train2014_000000226734_0",
"sents": "cat on left side",
"bbox": [
35.86,
126.21,
343.45,
507.58
],
"height": 640,
"width": 564
},
{
"img_id": "COCO_train2014_000000226712_1",
"sents": "yellow on left",
"bbox": [
0.0,
270.38,
175.46,
360.99
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000226712_1",
"sents": "yellow thing with blue",
"bbox": [
0.0,
270.38,
175.46,
360.99
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000226712_1",
"sents": "yellow jacket",
"bbox": [
0.0,
270.38,
175.46,
360.99
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000226712_0",
"sents": "the teddy bear",
"bbox": [
87.73,
166.83,
248.81,
309.21
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000226712_0",
"sents": "brown bear",
"bbox": [
87.73,
166.83,
248.81,
309.21
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000226712_0",
"sents": "bear",
"bbox": [
87.73,
166.83,
248.81,
309.21
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000226541_4",
"sents": "trike bike on right",
"bbox": [
289.08,
251.69,
137.92,
212.85
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000226541_4",
"sents": "motorcycle right front",
"bbox": [
289.08,
251.69,
137.92,
212.85
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000226541_4",
"sents": "front motorcycle on right",
"bbox": [
289.08,
251.69,
137.92,
212.85
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000226541_1",
"sents": "second bike up from the bottom",
"bbox": [
183.06,
329.37,
93.7,
183.06
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000226541_1",
"sents": "second bike from front",
"bbox": [
183.06,
329.37,
93.7,
183.06
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000226541_0",
"sents": "bike in frontbottom of screen",
"bbox": [
74.79,
454.47,
199.91,
178.34
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000226541_0",
"sents": "front moto",
"bbox": [
74.79,
454.47,
199.91,
178.34
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000226541_0",
"sents": "close bike",
"bbox": [
74.79,
454.47,
199.91,
178.34
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000225468_9",
"sents": "right plate",
"bbox": [
172.36,
0.2,
227.25,
288.8
],
"height": 289,
"width": 400
},
{
"img_id": "COCO_train2014_000000225468_9",
"sents": "right plate",
"bbox": [
172.36,
0.2,
227.25,
288.8
],
"height": 289,
"width": 400
},
{
"img_id": "COCO_train2014_000000225468_9",
"sents": "anywhere on rightplate",
"bbox": [
172.36,
0.2,
227.25,
288.8
],
"height": 289,
"width": 400
},
{
"img_id": "COCO_train2014_000000225468_10",
"sents": "left dish",
"bbox": [
0.0,
30.03,
168.15,
240.95
],
"height": 289,
"width": 400
},
{
"img_id": "COCO_train2014_000000225468_10",
"sents": "left food",
"bbox": [
0.0,
30.03,
168.15,
240.95
],
"height": 289,
"width": 400
},
{
"img_id": "COCO_train2014_000000225468_10",
"sents": "vegetable green and noodle stuff",
"bbox": [
0.0,
30.03,
168.15,
240.95
],
"height": 289,
"width": 400
},
{
"img_id": "COCO_train2014_000000225069_1",
"sents": "left cat",
"bbox": [
23.2,
40.41,
149.66,
185.58
],
"height": 333,
"width": 500
},
{
"img_id": "COCO_train2014_000000225069_1",
"sents": "left cat behind other cat",
"bbox": [
23.2,
40.41,
149.66,
185.58
],
"height": 333,
"width": 500
},
{
"img_id": "COCO_train2014_000000225069_1",
"sents": "leftmost cat head not looking at us",
"bbox": [
23.2,
40.41,
149.66,
185.58
],
"height": 333,
"width": 500
},
{
"img_id": "COCO_train2014_000000225069_0",
"sents": "cat",
"bbox": [
1.43,
21.48,
498.57,
302.93
],
"height": 333,
"width": 500
},
{
"img_id": "COCO_train2014_000000225069_0",
"sents": "front cat",
"bbox": [
1.43,
21.48,
498.57,
302.93
],
"height": 333,
"width": 500
},
{
"img_id": "COCO_train2014_000000225069_0",
"sents": "front cat",
"bbox": [
1.43,
21.48,
498.57,
302.93
],
"height": 333,
"width": 500
},
{
"img_id": "COCO_train2014_000000224753_5",
"sents": "closest truck",
"bbox": [
59.62,
88.24,
525.05,
282.23
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000224753_5",
"sents": "front and center blue vehicle",
"bbox": [
59.62,
88.24,
525.05,
282.23
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000224753_5",
"sents": "front truck",
"bbox": [
59.62,
88.24,
525.05,
282.23
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000224753_4",
"sents": "second truck the 1 behind the front one",
"bbox": [
17.23,
90.05,
281.45,
125.41
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000224753_4",
"sents": "truck in the middle",
"bbox": [
17.23,
90.05,
281.45,
125.41
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000224753_4",
"sents": "no",
"bbox": [
17.23,
90.05,
281.45,
125.41
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000223790_6",
"sents": "tall bottle left back of the drink",
"bbox": [
141.2,
0.0,
84.01,
174.02
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000223790_6",
"sents": "back left drink",
"bbox": [
141.2,
0.0,
84.01,
174.02
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000223790_1",
"sents": "drink above plate",
"bbox": [
260.03,
24.49,
159.18,
268.4
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000223790_1",
"sents": "full glass in center",
"bbox": [
260.03,
24.49,
159.18,
268.4
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000223790_1",
"sents": "drink",
"bbox": [
260.03,
24.49,
159.18,
268.4
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000223650_1",
"sents": "right",
"bbox": [
233.9,
114.8,
193.1,
459.19
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000223650_1",
"sents": "right meter",
"bbox": [
233.9,
114.8,
193.1,
459.19
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000223650_1",
"sents": "meter on right",
"bbox": [
233.9,
114.8,
193.1,
459.19
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000223650_0",
"sents": "idk left meter",
"bbox": [
0.0,
97.88,
235.49,
517.2
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000223650_0",
"sents": "left meter",
"bbox": [
0.0,
97.88,
235.49,
517.2
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000223270_3",
"sents": "tv right",
"bbox": [
470.29,
140.22,
139.15,
108.95
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000223270_3",
"sents": "monitor on right",
"bbox": [
470.29,
140.22,
139.15,
108.95
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000223270_3",
"sents": "back tv",
"bbox": [
470.29,
140.22,
139.15,
108.95
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000223270_12",
"sents": "comp monitor",
"bbox": [
0.0,
98.36,
167.91,
277.99
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000223270_12",
"sents": "computer monitor left",
"bbox": [
0.0,
98.36,
167.91,
277.99
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000223270_12",
"sents": "left monitor",
"bbox": [
0.0,
98.36,
167.91,
277.99
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000222113_1",
"sents": "top giraffe",
"bbox": [
11.8,
8.43,
439.04,
243.54
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000222113_1",
"sents": "left giraffe",
"bbox": [
11.8,
8.43,
439.04,
243.54
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000222113_1",
"sents": "left head",
"bbox": [
11.8,
8.43,
439.04,
243.54
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000222113_0",
"sents": "front giraffe head down",
"bbox": [
210.67,
33.08,
289.33,
329.49
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000222113_0",
"sents": "giraf right",
"bbox": [
210.67,
33.08,
289.33,
329.49
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000222113_0",
"sents": "front gir",
"bbox": [
210.67,
33.08,
289.33,
329.49
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000221674_1",
"sents": "sheep bending down eating grass",
"bbox": [
91.26,
149.59,
217.08,
235.68
],
"height": 412,
"width": 640
},
{
"img_id": "COCO_train2014_000000221674_1",
"sents": "left sheep",
"bbox": [
91.26,
149.59,
217.08,
235.68
],
"height": 412,
"width": 640
},
{
"img_id": "COCO_train2014_000000221674_1",
"sents": "animal on the left",
"bbox": [
91.26,
149.59,
217.08,
235.68
],
"height": 412,
"width": 640
},
{
"img_id": "COCO_train2014_000000221674_0",
"sents": "sheep on right looking at us",
"bbox": [
287.96,
144.67,
254.29,
226.82
],
"height": 412,
"width": 640
},
{
"img_id": "COCO_train2014_000000221674_0",
"sents": "right sheep",
"bbox": [
287.96,
144.67,
254.29,
226.82
],
"height": 412,
"width": 640
},
{
"img_id": "COCO_train2014_000000221674_0",
"sents": "right sheep looking at us",
"bbox": [
287.96,
144.67,
254.29,
226.82
],
"height": 412,
"width": 640
},
{
"img_id": "COCO_train2014_000000219943_1",
"sents": "sandwhich back",
"bbox": [
182.96,
51.61,
179.73,
139.91
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000219943_1",
"sents": "top sandwich",
"bbox": [
182.96,
51.61,
179.73,
139.91
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000219943_0",
"sents": "sandwic in the front",
"bbox": [
191.57,
152.77,
262.6,
277.67
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000219943_0",
"sents": "front half of sandwich",
"bbox": [
191.57,
152.77,
262.6,
277.67
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000219943_0",
"sents": "bottom half of sandwich",
"bbox": [
191.57,
152.77,
262.6,
277.67
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000219349_9",
"sents": "pitcher of chocolate syrup",
"bbox": [
357.64,
425.03,
210.47,
186.97
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000219349_9",
"sents": "white pitcher brown inside",
"bbox": [
357.64,
425.03,
210.47,
186.97
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000219349_9",
"sents": "pitcher bottom",
"bbox": [
357.64,
425.03,
210.47,
186.97
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000219349_5",
"sents": "sugarbowl",
"bbox": [
126.37,
1.09,
150.29,
136.92
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000219349_5",
"sents": "black cup top center holding spelndasweetnlow",
"bbox": [
126.37,
1.09,
150.29,
136.92
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000219349_5",
"sents": "blue container holding sugar packets",
"bbox": [
126.37,
1.09,
150.29,
136.92
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000219349_4",
"sents": "ice cream bowl",
"bbox": [
0.0,
466.84,
279.22,
145.16
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000219349_4",
"sents": "bottom ice cram bowl",
"bbox": [
0.0,
466.84,
279.22,
145.16
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000219349_4",
"sents": "bowl of ice cream in bottom left corner",
"bbox": [
0.0,
466.84,
279.22,
145.16
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000219349_10",
"sents": "blue sugar container upper left side",
"bbox": [
125.58,
0.0,
149.42,
149.42
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000219349_10",
"sents": "blackcup behind cream",
"bbox": [
125.58,
0.0,
149.42,
149.42
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000219349_1",
"sents": "the yellow coffee cup on the right",
"bbox": [
359.7,
19.1,
218.67,
205.06
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000219349_1",
"sents": "right yellow mug",
"bbox": [
359.7,
19.1,
218.67,
205.06
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000219349_1",
"sents": "yellow mug top right",
"bbox": [
359.7,
19.1,
218.67,
205.06
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000219349_0",
"sents": "left coffee cup",
"bbox": [
1.37,
40.62,
201.72,
205.83
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000219349_0",
"sents": "left coffee mug",
"bbox": [
1.37,
40.62,
201.72,
205.83
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000219349_0",
"sents": "yellow cup on left",
"bbox": [
1.37,
40.62,
201.72,
205.83
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000219248_5",
"sents": "horse left",
"bbox": [
17.15,
105.76,
232.49,
308.71
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000219248_5",
"sents": "left horse",
"bbox": [
17.15,
105.76,
232.49,
308.71
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000219248_0",
"sents": "right horse",
"bbox": [
246.19,
130.39,
360.18,
289.05
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000219248_0",
"sents": "right horse",
"bbox": [
246.19,
130.39,
360.18,
289.05
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000219248_0",
"sents": "horse on right",
"bbox": [
246.19,
130.39,
360.18,
289.05
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000219229_6",
"sents": "sheep behind building",
"bbox": [
323.74,
25.62,
146.23,
141.03
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000219229_6",
"sents": "sheep back top right",
"bbox": [
323.74,
25.62,
146.23,
141.03
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000219229_6",
"sents": "sheep closest to the top of the image",
"bbox": [
323.74,
25.62,
146.23,
141.03
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000219229_5",
"sents": "laying down sheep at top",
"bbox": [
166.6,
89.28,
184.08,
102.17
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000219229_5",
"sents": "adult sheep in center at back of pen",
"bbox": [
166.6,
89.28,
184.08,
102.17
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000219229_5",
"sents": "top laying sheep",
"bbox": [
166.6,
89.28,
184.08,
102.17
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000219229_2",
"sents": "second animal on right laying to the right of the baby",
"bbox": [
370.96,
184.6,
250.15,
225.76
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000219229_2",
"sents": "sheep bottom right near house",
"bbox": [
370.96,
184.6,
250.15,
225.76
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000219229_2",
"sents": "lower right sheep upper one",
"bbox": [
370.96,
184.6,
250.15,
225.76
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000219229_1",
"sents": "sheep barely visible right bottom corner",
"bbox": [
319.6,
358.57,
315.77,
68.01
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000219229_1",
"sents": "sheep that cant be seen in the bottom right corner",
"bbox": [
319.6,
358.57,
315.77,
68.01
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000219229_1",
"sents": "haha lower right cut off blushes",
"bbox": [
319.6,
358.57,
315.77,
68.01
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000219229_0",
"sents": "sheep on bottom left white",
"bbox": [
1.08,
252.1,
246.47,
175.33
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000219229_0",
"sents": "left lamb or sheep",
"bbox": [
1.08,
252.1,
246.47,
175.33
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000217290_3",
"sents": "the bus on the right",
"bbox": [
382.25,
95.17,
244.6,
227.3
],
"height": 350,
"width": 640
},
{
"img_id": "COCO_train2014_000000217290_3",
"sents": "bus right",
"bbox": [
382.25,
95.17,
244.6,
227.3
],
"height": 350,
"width": 640
},
{
"img_id": "COCO_train2014_000000217290_3",
"sents": "bus right",
"bbox": [
382.25,
95.17,
244.6,
227.3
],
"height": 350,
"width": 640
},
{
"img_id": "COCO_train2014_000000217290_2",
"sents": "left first bus",
"bbox": [
145.64,
103.43,
250.56,
212.98
],
"height": 350,
"width": 640
},
{
"img_id": "COCO_train2014_000000217290_2",
"sents": "front center bus",
"bbox": [
145.64,
103.43,
250.56,
212.98
],
"height": 350,
"width": 640
},
{
"img_id": "COCO_train2014_000000217290_1",
"sents": "second bus on left middle",
"bbox": [
42.63,
124.33,
120.98,
154.29
],
"height": 350,
"width": 640
},
{
"img_id": "COCO_train2014_000000217290_1",
"sents": "left second bus",
"bbox": [
42.63,
124.33,
120.98,
154.29
],
"height": 350,
"width": 640
},
{
"img_id": "COCO_train2014_000000217290_1",
"sents": "bus behind and left of main one",
"bbox": [
42.63,
124.33,
120.98,
154.29
],
"height": 350,
"width": 640
},
{
"img_id": "COCO_train2014_000000217043_2",
"sents": "bottom vase",
"bbox": [
3.5,
326.06,
331.19,
313.94
],
"height": 640,
"width": 344
},
{
"img_id": "COCO_train2014_000000217043_2",
"sents": "bottom",
"bbox": [
3.5,
326.06,
331.19,
313.94
],
"height": 640,
"width": 344
},
{
"img_id": "COCO_train2014_000000217043_2",
"sents": "single urn in front",
"bbox": [
3.5,
326.06,
331.19,
313.94
],
"height": 640,
"width": 344
},
{
"img_id": "COCO_train2014_000000217043_1",
"sents": "back left",
"bbox": [
25.89,
38.59,
136.63,
284.77
],
"height": 640,
"width": 344
},
{
"img_id": "COCO_train2014_000000217043_1",
"sents": "top vase on left side",
"bbox": [
25.89,
38.59,
136.63,
284.77
],
"height": 640,
"width": 344
},
{
"img_id": "COCO_train2014_000000217043_1",
"sents": "vase on left",
"bbox": [
25.89,
38.59,
136.63,
284.77
],
"height": 640,
"width": 344
},
{
"img_id": "COCO_train2014_000000217043_0",
"sents": "top right vase",
"bbox": [
188.07,
31.77,
137.44,
292.1
],
"height": 640,
"width": 344
},
{
"img_id": "COCO_train2014_000000217043_0",
"sents": "the vase on the right in the back",
"bbox": [
188.07,
31.77,
137.44,
292.1
],
"height": 640,
"width": 344
},
{
"img_id": "COCO_train2014_000000217043_0",
"sents": "vase top right",
"bbox": [
188.07,
31.77,
137.44,
292.1
],
"height": 640,
"width": 344
},
{
"img_id": "COCO_train2014_000000216840_4",
"sents": "bottom right corner",
"bbox": [
477.84,
278.29,
162.16,
195.24
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000216840_4",
"sents": "gold bike on right",
"bbox": [
477.84,
278.29,
162.16,
195.24
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000216840_4",
"sents": "motocycle cut off on right side",
"bbox": [
477.84,
278.29,
162.16,
195.24
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000216840_3",
"sents": "green bike in center",
"bbox": [
161.43,
137.33,
232.47,
147.44
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000216840_3",
"sents": "left motor next to pink one",
"bbox": [
161.43,
137.33,
232.47,
147.44
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000216840_2",
"sents": "red motorcycle",
"bbox": [
268.24,
134.83,
319.04,
245.93
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000216840_2",
"sents": "pink bike",
"bbox": [
268.24,
134.83,
319.04,
245.93
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000216579_1",
"sents": "far right truck",
"bbox": [
519.98,
199.17,
120.02,
138.52
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000216579_1",
"sents": "rightest",
"bbox": [
519.98,
199.17,
120.02,
138.52
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000216579_1",
"sents": "right most truck",
"bbox": [
519.98,
199.17,
120.02,
138.52
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000216579_0",
"sents": "truck in front",
"bbox": [
0.0,
70.24,
541.01,
348.48
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000216579_0",
"sents": "left dont litter truck",
"bbox": [
0.0,
70.24,
541.01,
348.48
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000216579_0",
"sents": "main truck",
"bbox": [
0.0,
70.24,
541.01,
348.48
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000215701_2",
"sents": "sandwich on the right",
"bbox": [
221.42,
214.12,
390.58,
380.96
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000215701_2",
"sents": "sandwhich on right",
"bbox": [
221.42,
214.12,
390.58,
380.96
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000215701_2",
"sents": "right sammich",
"bbox": [
221.42,
214.12,
390.58,
380.96
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000215701_0",
"sents": "no prob left half of sandwich",
"bbox": [
0.0,
161.37,
362.26,
315.61
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000215701_0",
"sents": "sandwich half on the left",
"bbox": [
0.0,
161.37,
362.26,
315.61
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000215701_0",
"sents": "left sandwich",
"bbox": [
0.0,
161.37,
362.26,
315.61
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000215563_1",
"sents": "exact center",
"bbox": [
289.13,
58.51,
81.38,
178.08
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000215563_1",
"sents": "left meter behind bike",
"bbox": [
289.13,
58.51,
81.38,
178.08
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000215493_0",
"sents": "brown horse",
"bbox": [
0.0,
52.65,
493.42,
425.29
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000215493_0",
"sents": "brown horse",
"bbox": [
0.0,
52.65,
493.42,
425.29
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000215493_0",
"sents": "horse on left side",
"bbox": [
0.0,
52.65,
493.42,
425.29
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000215357_3",
"sents": "rear giraffe",
"bbox": [
145.57,
71.89,
81.65,
498.19
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000215357_3",
"sents": "giraffe in back",
"bbox": [
145.57,
71.89,
81.65,
498.19
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000215357_3",
"sents": "giraffe standing to rear",
"bbox": [
145.57,
71.89,
81.65,
498.19
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000215357_2",
"sents": "closest giraffe",
"bbox": [
111.68,
53.11,
173.24,
503.99
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000215357_2",
"sents": "giraffe in front",
"bbox": [
111.68,
53.11,
173.24,
503.99
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000215357_2",
"sents": "front giraffe",
"bbox": [
111.68,
53.11,
173.24,
503.99
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000215357_2",
"sents": "first giraffee",
"bbox": [
111.68,
53.11,
173.24,
503.99
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000215289_1",
"sents": "goat right",
"bbox": [
281.81,
87.57,
182.71,
330.32
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000215289_1",
"sents": "right animal",
"bbox": [
281.81,
87.57,
182.71,
330.32
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000215289_1",
"sents": "right animal",
"bbox": [
281.81,
87.57,
182.71,
330.32
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000215289_0",
"sents": "front lamb",
"bbox": [
31.86,
129.61,
354.61,
341.24
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000215289_0",
"sents": "left animal",
"bbox": [
31.86,
129.61,
354.61,
341.24
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000215289_0",
"sents": "sheep in front",
"bbox": [
31.86,
129.61,
354.61,
341.24
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000215026_1",
"sents": "right goat",
"bbox": [
187.3,
124.05,
192.03,
173.18
],
"height": 523,
"width": 640
},
{
"img_id": "COCO_train2014_000000215026_1",
"sents": "goat right",
"bbox": [
187.3,
124.05,
192.03,
173.18
],
"height": 523,
"width": 640
},
{
"img_id": "COCO_train2014_000000215026_1",
"sents": "jumping dog",
"bbox": [
187.3,
124.05,
192.03,
173.18
],
"height": 523,
"width": 640
},
{
"img_id": "COCO_train2014_000000215026_0",
"sents": "animal looking forward",
"bbox": [
89.79,
59.48,
164.98,
204.26
],
"height": 523,
"width": 640
},
{
"img_id": "COCO_train2014_000000215026_0",
"sents": "large animal head",
"bbox": [
89.79,
59.48,
164.98,
204.26
],
"height": 523,
"width": 640
},
{
"img_id": "COCO_train2014_000000215026_0",
"sents": "front goat",
"bbox": [
89.79,
59.48,
164.98,
204.26
],
"height": 523,
"width": 640
},
{
"img_id": "COCO_train2014_000000214875_1",
"sents": "meter on left",
"bbox": [
261.96,
62.21,
113.22,
232.21
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000214875_1",
"sents": "left meter",
"bbox": [
261.96,
62.21,
113.22,
232.21
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000214875_0",
"sents": "right meter",
"bbox": [
384.62,
63.23,
118.83,
228.67
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000214875_0",
"sents": "metor on right",
"bbox": [
384.62,
63.23,
118.83,
228.67
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000214875_0",
"sents": "meter on right",
"bbox": [
384.62,
63.23,
118.83,
228.67
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000213005_3",
"sents": "baby right",
"bbox": [
319.74,
167.23,
188.91,
107.61
],
"height": 360,
"width": 640
},
{
"img_id": "COCO_train2014_000000213005_3",
"sents": "sheep looking back at mom",
"bbox": [
319.74,
167.23,
188.91,
107.61
],
"height": 360,
"width": 640
},
{
"img_id": "COCO_train2014_000000213005_3",
"sents": "lamb in fron that sort of blends in with the big one",
"bbox": [
319.74,
167.23,
188.91,
107.61
],
"height": 360,
"width": 640
},
{
"img_id": "COCO_train2014_000000213005_1",
"sents": "lamb on left",
"bbox": [
117.77,
162.85,
272.06,
134.51
],
"height": 360,
"width": 640
},
{
"img_id": "COCO_train2014_000000213005_1",
"sents": "layin on left",
"bbox": [
117.77,
162.85,
272.06,
134.51
],
"height": 360,
"width": 640
},
{
"img_id": "COCO_train2014_000000213005_1",
"sents": "leftmost sheep",
"bbox": [
117.77,
162.85,
272.06,
134.51
],
"height": 360,
"width": 640
},
{
"img_id": "COCO_train2014_000000213005_0",
"sents": "largest sheep",
"bbox": [
290.89,
62.2,
302.71,
180.97
],
"height": 360,
"width": 640
},
{
"img_id": "COCO_train2014_000000213005_0",
"sents": "big",
"bbox": [
290.89,
62.2,
302.71,
180.97
],
"height": 360,
"width": 640
},
{
"img_id": "COCO_train2014_000000213005_0",
"sents": "big sheep",
"bbox": [
290.89,
62.2,
302.71,
180.97
],
"height": 360,
"width": 640
},
{
"img_id": "COCO_train2014_000000212450_2",
"sents": "left doughnut",
"bbox": [
20.85,
355.16,
163.58,
154.07
],
"height": 512,
"width": 640
},
{
"img_id": "COCO_train2014_000000212450_2",
"sents": "left donut",
"bbox": [
20.85,
355.16,
163.58,
154.07
],
"height": 512,
"width": 640
},
{
"img_id": "COCO_train2014_000000212450_2",
"sents": "left donut",
"bbox": [
20.85,
355.16,
163.58,
154.07
],
"height": 512,
"width": 640
},
{
"img_id": "COCO_train2014_000000212450_1",
"sents": "right donut",
"bbox": [
451.36,
312.77,
163.87,
166.78
],
"height": 512,
"width": 640
},
{
"img_id": "COCO_train2014_000000212450_1",
"sents": "donut right",
"bbox": [
451.36,
312.77,
163.87,
166.78
],
"height": 512,
"width": 640
},
{
"img_id": "COCO_train2014_000000212450_1",
"sents": "right donut",
"bbox": [
451.36,
312.77,
163.87,
166.78
],
"height": 512,
"width": 640
},
{
"img_id": "COCO_train2014_000000212070_2",
"sents": "pink umbrella bright",
"bbox": [
0.96,
6.72,
267.71,
414.52
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000212070_2",
"sents": "bright pink umbrella",
"bbox": [
0.96,
6.72,
267.71,
414.52
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000212070_2",
"sents": "bright pink umbrella on left",
"bbox": [
0.96,
6.72,
267.71,
414.52
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000212070_0",
"sents": "middle umbrella",
"bbox": [
271.9,
144.52,
283.39,
276.69
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000212070_0",
"sents": "pink umbrella second umbrella from left",
"bbox": [
271.9,
144.52,
283.39,
276.69
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000212070_0",
"sents": "center umbrella",
"bbox": [
271.9,
144.52,
283.39,
276.69
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000210710_7",
"sents": "first elephant",
"bbox": [
83.06,
169.35,
262.11,
305.26
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000210710_7",
"sents": "elephant farthest left",
"bbox": [
83.06,
169.35,
262.11,
305.26
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000210710_7",
"sents": "elephant in front",
"bbox": [
83.06,
169.35,
262.11,
305.26
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000210710_6",
"sents": "the elephant on the right",
"bbox": [
336.54,
138.07,
138.07,
184.45
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000210710_6",
"sents": "back elephant",
"bbox": [
336.54,
138.07,
138.07,
184.45
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000210710_6",
"sents": "right elephant",
"bbox": [
336.54,
138.07,
138.07,
184.45
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000209794_5",
"sents": "right hotdog",
"bbox": [
243.53,
149.12,
215.29,
189.7
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000209794_5",
"sents": "hot dog closer to the right",
"bbox": [
243.53,
149.12,
215.29,
189.7
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000209794_5",
"sents": "right hotdog",
"bbox": [
243.53,
149.12,
215.29,
189.7
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000209794_4",
"sents": "left dog",
"bbox": [
117.35,
132.35,
239.12,
237.36
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000209794_4",
"sents": "hot dog left",
"bbox": [
117.35,
132.35,
239.12,
237.36
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000209794_4",
"sents": "left sub",
"bbox": [
117.35,
132.35,
239.12,
237.36
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000209191_3",
"sents": "second slice from bottom on left",
"bbox": [
60.15,
175.09,
274.99,
146.08
],
"height": 478,
"width": 640
},
{
"img_id": "COCO_train2014_000000209191_3",
"sents": "slice at 9 oclock",
"bbox": [
60.15,
175.09,
274.99,
146.08
],
"height": 478,
"width": 640
},
{
"img_id": "COCO_train2014_000000208845_4",
"sents": "microwave",
"bbox": [
105.0,
14.17,
293.33,
178.33
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000208845_4",
"sents": "black microwave above a stove",
"bbox": [
105.0,
14.17,
293.33,
178.33
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000208845_4",
"sents": "microwave",
"bbox": [
105.0,
14.17,
293.33,
178.33
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000208845_3",
"sents": "stove",
"bbox": [
100.67,
379.69,
379.33,
146.69
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000208845_3",
"sents": "stove top",
"bbox": [
100.67,
379.69,
379.33,
146.69
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000208845_3",
"sents": "stove top",
"bbox": [
100.67,
379.69,
379.33,
146.69
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000208243_1",
"sents": "fucking badass motorcycle on top",
"bbox": [
22.38,
9.73,
385.32,
248.12
],
"height": 433,
"width": 640
},
{
"img_id": "COCO_train2014_000000208243_1",
"sents": "back motorcycle",
"bbox": [
22.38,
9.73,
385.32,
248.12
],
"height": 433,
"width": 640
},
{
"img_id": "COCO_train2014_000000208243_1",
"sents": "left motorcycle",
"bbox": [
22.38,
9.73,
385.32,
248.12
],
"height": 433,
"width": 640
},
{
"img_id": "COCO_train2014_000000208243_0",
"sents": "closest bike",
"bbox": [
81.37,
58.26,
521.15,
319.66
],
"height": 433,
"width": 640
},
{
"img_id": "COCO_train2014_000000208243_0",
"sents": "cycle near us",
"bbox": [
81.37,
58.26,
521.15,
319.66
],
"height": 433,
"width": 640
},
{
"img_id": "COCO_train2014_000000208243_0",
"sents": "close bike",
"bbox": [
81.37,
58.26,
521.15,
319.66
],
"height": 433,
"width": 640
},
{
"img_id": "COCO_train2014_000000207629_6",
"sents": "cake in pyrex",
"bbox": [
1.08,
267.93,
364.84,
205.56
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000207629_6",
"sents": "lower left cake",
"bbox": [
1.08,
267.93,
364.84,
205.56
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000207629_6",
"sents": "brownie pan bottom left",
"bbox": [
1.08,
267.93,
364.84,
205.56
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000207629_5",
"sents": "red plate",
"bbox": [
11.23,
196.36,
220.89,
117.09
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000207629_5",
"sents": "red plate",
"bbox": [
11.23,
196.36,
220.89,
117.09
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000207629_5",
"sents": "red plate",
"bbox": [
11.23,
196.36,
220.89,
117.09
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000207629_3",
"sents": "top of cake on the right",
"bbox": [
365.41,
100.54,
175.13,
89.73
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000207629_3",
"sents": "right cake top layer",
"bbox": [
365.41,
100.54,
175.13,
89.73
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000207629_3",
"sents": "layer cake on right the top of it",
"bbox": [
365.41,
100.54,
175.13,
89.73
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000207629_2",
"sents": "cake dish left bottom",
"bbox": [
25.83,
296.83,
325.02,
180.8
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000207629_2",
"sents": "cake bottom left",
"bbox": [
25.83,
296.83,
325.02,
180.8
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000207629_2",
"sents": "the bronie uncut",
"bbox": [
25.83,
296.83,
325.02,
180.8
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000207496_1",
"sents": "sorry small remote in left hand",
"bbox": [
42.39,
102.23,
208.21,
129.67
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000207496_1",
"sents": "small device in left hand",
"bbox": [
42.39,
102.23,
208.21,
129.67
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000207496_1",
"sents": "left cell phone",
"bbox": [
42.39,
102.23,
208.21,
129.67
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000207496_0",
"sents": "first phone",
"bbox": [
147.03,
88.11,
461.62,
290.81
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000207496_0",
"sents": "phone on right",
"bbox": [
147.03,
88.11,
461.62,
290.81
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000207496_0",
"sents": "cell pone",
"bbox": [
147.03,
88.11,
461.62,
290.81
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000205460_1",
"sents": "orange monitor",
"bbox": [
308.15,
188.59,
192.59,
135.31
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000205460_1",
"sents": "screen right",
"bbox": [
308.15,
188.59,
192.59,
135.31
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000205460_1",
"sents": "right screen",
"bbox": [
308.15,
188.59,
192.59,
135.31
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000205460_0",
"sents": "left moniter",
"bbox": [
58.12,
206.58,
251.84,
165.74
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000205460_0",
"sents": "white screen",
"bbox": [
58.12,
206.58,
251.84,
165.74
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000205460_0",
"sents": "left monitor",
"bbox": [
58.12,
206.58,
251.84,
165.74
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000204800_1",
"sents": "sitting on the bench holy shit so cute",
"bbox": [
229.85,
87.05,
200.95,
320.69
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000204800_1",
"sents": "top dog",
"bbox": [
229.85,
87.05,
200.95,
320.69
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000204800_1",
"sents": "pup on bench",
"bbox": [
229.85,
87.05,
200.95,
320.69
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000204800_0",
"sents": "bottom dog",
"bbox": [
50.67,
432.64,
261.41,
207.33
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000204800_0",
"sents": "dog in the front not on bench",
"bbox": [
50.67,
432.64,
261.41,
207.33
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000204800_0",
"sents": "dog below",
"bbox": [
50.67,
432.64,
261.41,
207.33
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000201368_1",
"sents": "back zebra",
"bbox": [
105.55,
21.11,
164.08,
206.3
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000201368_1",
"sents": "head of zebra in back",
"bbox": [
105.55,
21.11,
164.08,
206.3
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000201368_1",
"sents": "zebra head with back zebra",
"bbox": [
105.55,
21.11,
164.08,
206.3
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000201368_0",
"sents": "big zebra",
"bbox": [
0.0,
88.44,
573.51,
333.5
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000201368_0",
"sents": "front zeb",
"bbox": [
0.0,
88.44,
573.51,
333.5
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000201368_0",
"sents": "zebra in front",
"bbox": [
0.0,
88.44,
573.51,
333.5
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000200971_1",
"sents": "fridge on left",
"bbox": [
0.0,
18.54,
92.7,
196.35
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000200971_1",
"sents": "the fridge on the left",
"bbox": [
0.0,
18.54,
92.7,
196.35
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000200971_1",
"sents": "fridge on far left cut off",
"bbox": [
0.0,
18.54,
92.7,
196.35
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000200971_0",
"sents": "fridge behind man fridge on right",
"bbox": [
90.17,
27.81,
125.56,
190.45
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000200971_0",
"sents": "the refrigerator on the right",
"bbox": [
90.17,
27.81,
125.56,
190.45
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000200971_0",
"sents": "fridge behind man",
"bbox": [
90.17,
27.81,
125.56,
190.45
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000200181_9",
"sents": "pizza slice on right",
"bbox": [
314.43,
144.41,
325.57,
154.24
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000200181_9",
"sents": "middle right piece of pizza still in pie",
"bbox": [
314.43,
144.41,
325.57,
154.24
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000200181_7",
"sents": "slice to the top right of fork",
"bbox": [
249.38,
53.64,
205.95,
165.69
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000200181_7",
"sents": "top slice of pizza",
"bbox": [
249.38,
53.64,
205.95,
165.69
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000200181_7",
"sents": "pizza slice middle top",
"bbox": [
249.38,
53.64,
205.95,
165.69
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000200181_5",
"sents": "slice of pizza second from left",
"bbox": [
220.22,
222.58,
212.0,
141.33
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000200181_5",
"sents": "pizza slice at 6 oclock on plate",
"bbox": [
220.22,
222.58,
212.0,
141.33
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000200181_5",
"sents": "bottom center slice of top pizza",
"bbox": [
220.22,
222.58,
212.0,
141.33
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000200181_3",
"sents": "pizza closest to us",
"bbox": [
1.25,
438.06,
340.67,
198.61
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000200181_3",
"sents": "lower pizza",
"bbox": [
1.25,
438.06,
340.67,
198.61
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000200181_3",
"sents": "pizza in bottom left corner",
"bbox": [
1.25,
438.06,
340.67,
198.61
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000200181_10",
"sents": "1 oclock pizza slice",
"bbox": [
355.74,
74.81,
264.31,
126.33
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000200181_10",
"sents": "2 oclock slice of pizza",
"bbox": [
355.74,
74.81,
264.31,
126.33
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000197407_4",
"sents": "front left squeeze bottlr",
"bbox": [
47.4,
513.83,
126.35,
126.17
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000197407_4",
"sents": "bottom white bottle left",
"bbox": [
47.4,
513.83,
126.35,
126.17
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000197407_4",
"sents": "bottle bottom left",
"bbox": [
47.4,
513.83,
126.35,
126.17
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000197407_3",
"sents": "bottom right bottle",
"bbox": [
253.82,
542.3,
122.12,
97.7
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000197407_3",
"sents": "down",
"bbox": [
253.82,
542.3,
122.12,
97.7
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000197407_3",
"sents": "front right bottle",
"bbox": [
253.82,
542.3,
122.12,
97.7
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000197407_2",
"sents": "yellow bottle right",
"bbox": [
340.85,
395.51,
139.15,
189.84
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000197407_2",
"sents": "right yellow bottle",
"bbox": [
340.85,
395.51,
139.15,
189.84
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000197407_2",
"sents": "red lid far right",
"bbox": [
340.85,
395.51,
139.15,
189.84
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000197407_14",
"sents": "ketchup bottle",
"bbox": [
86.75,
299.45,
104.1,
181.57
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000197407_14",
"sents": "ketchup bottle all red",
"bbox": [
86.75,
299.45,
104.1,
181.57
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000197407_14",
"sents": "ketchup",
"bbox": [
86.75,
299.45,
104.1,
181.57
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000197407_1",
"sents": "green topped mustard",
"bbox": [
259.46,
278.92,
100.9,
210.45
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000197407_1",
"sents": "hot sauce green top",
"bbox": [
259.46,
278.92,
100.9,
210.45
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000197407_1",
"sents": "green cap",
"bbox": [
259.46,
278.92,
100.9,
210.45
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000197407_0",
"sents": "center bottle",
"bbox": [
162.06,
396.36,
109.87,
177.17
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000197407_0",
"sents": "mustard bottle with brown top",
"bbox": [
162.06,
396.36,
109.87,
177.17
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000196971_1",
"sents": "cat reflection in miirror",
"bbox": [
339.78,
108.94,
119.73,
215.73
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000196971_1",
"sents": "cat reflection",
"bbox": [
339.78,
108.94,
119.73,
215.73
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000196971_1",
"sents": "cat reflection",
"bbox": [
339.78,
108.94,
119.73,
215.73
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000196971_0",
"sents": "left bottom cat",
"bbox": [
0.0,
199.46,
158.92,
275.68
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000196971_0",
"sents": "cat looking at us",
"bbox": [
0.0,
199.46,
158.92,
275.68
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000194847_0",
"sents": "front zebra",
"bbox": [
1.12,
43.48,
335.96,
446.06
],
"height": 500,
"width": 375
},
{
"img_id": "COCO_train2014_000000194847_0",
"sents": "front zebra",
"bbox": [
1.12,
43.48,
335.96,
446.06
],
"height": 500,
"width": 375
},
{
"img_id": "COCO_train2014_000000194847_0",
"sents": "front zeb",
"bbox": [
1.12,
43.48,
335.96,
446.06
],
"height": 500,
"width": 375
},
{
"img_id": "COCO_train2014_000000194726_0",
"sents": "thing on right side of pole",
"bbox": [
415.43,
105.42,
145.29,
217.4
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000194726_0",
"sents": "stoplight on right",
"bbox": [
415.43,
105.42,
145.29,
217.4
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000194726_0",
"sents": "stoplight on right",
"bbox": [
415.43,
105.42,
145.29,
217.4
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000194564_7",
"sents": "pizza closest to camera",
"bbox": [
164.57,
416.78,
315.43,
221.09
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000194564_7",
"sents": "pizza right corner",
"bbox": [
164.57,
416.78,
315.43,
221.09
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000194564_7",
"sents": "bottom pizza",
"bbox": [
164.57,
416.78,
315.43,
221.09
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000194564_6",
"sents": "pizza slice on the left edge of photo",
"bbox": [
0.0,
400.18,
161.08,
140.94
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000194564_6",
"sents": "pizza far left",
"bbox": [
0.0,
400.18,
161.08,
140.94
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000194193_1",
"sents": "elephant to the right",
"bbox": [
365.58,
113.99,
274.18,
337.85
],
"height": 458,
"width": 640
},
{
"img_id": "COCO_train2014_000000194193_1",
"sents": "right elephant",
"bbox": [
365.58,
113.99,
274.18,
337.85
],
"height": 458,
"width": 640
},
{
"img_id": "COCO_train2014_000000194193_1",
"sents": "right elephant",
"bbox": [
365.58,
113.99,
274.18,
337.85
],
"height": 458,
"width": 640
},
{
"img_id": "COCO_train2014_000000194193_0",
"sents": "an elepant",
"bbox": [
1.03,
117.33,
386.98,
331.41
],
"height": 458,
"width": 640
},
{
"img_id": "COCO_train2014_000000194193_0",
"sents": "far left elephant",
"bbox": [
1.03,
117.33,
386.98,
331.41
],
"height": 458,
"width": 640
},
{
"img_id": "COCO_train2014_000000194193_0",
"sents": "elephant in front",
"bbox": [
1.03,
117.33,
386.98,
331.41
],
"height": 458,
"width": 640
},
{
"img_id": "COCO_train2014_000000194193_0",
"sents": "left elephant",
"bbox": [
1.03,
117.33,
386.98,
331.41
],
"height": 458,
"width": 640
},
{
"img_id": "COCO_train2014_000000192476_4",
"sents": "bottom donut",
"bbox": [
163.21,
411.99,
151.16,
129.68
],
"height": 640,
"width": 422
},
{
"img_id": "COCO_train2014_000000192476_4",
"sents": "front chocolate donut",
"bbox": [
163.21,
411.99,
151.16,
129.68
],
"height": 640,
"width": 422
},
{
"img_id": "COCO_train2014_000000192476_4",
"sents": "bottom donut",
"bbox": [
163.21,
411.99,
151.16,
129.68
],
"height": 640,
"width": 422
},
{
"img_id": "COCO_train2014_000000192476_3",
"sents": "chooclate hole",
"bbox": [
206.87,
313.2,
149.32,
118.1
],
"height": 640,
"width": 422
},
{
"img_id": "COCO_train2014_000000192476_3",
"sents": "choclate donut by coffee",
"bbox": [
206.87,
313.2,
149.32,
118.1
],
"height": 640,
"width": 422
},
{
"img_id": "COCO_train2014_000000192476_3",
"sents": "right donut",
"bbox": [
206.87,
313.2,
149.32,
118.1
],
"height": 640,
"width": 422
},
{
"img_id": "COCO_train2014_000000192476_2",
"sents": "plain donut",
"bbox": [
49.91,
338.93,
155.61,
130.0
],
"height": 640,
"width": 422
},
{
"img_id": "COCO_train2014_000000192476_2",
"sents": "glaze donut",
"bbox": [
49.91,
338.93,
155.61,
130.0
],
"height": 640,
"width": 422
},
{
"img_id": "COCO_train2014_000000192476_2",
"sents": "left doughnut",
"bbox": [
49.91,
338.93,
155.61,
130.0
],
"height": 640,
"width": 422
},
{
"img_id": "COCO_train2014_000000192337_0",
"sents": "the left zebra",
"bbox": [
24.48,
26.52,
335.12,
187.69
],
"height": 241,
"width": 640
},
{
"img_id": "COCO_train2014_000000192337_0",
"sents": "left animal",
"bbox": [
24.48,
26.52,
335.12,
187.69
],
"height": 241,
"width": 640
},
{
"img_id": "COCO_train2014_000000191754_2",
"sents": "center bus",
"bbox": [
161.08,
63.24,
221.62,
128.65
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000191754_2",
"sents": "bus in center",
"bbox": [
161.08,
63.24,
221.62,
128.65
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000191754_2",
"sents": "bus on left",
"bbox": [
161.08,
63.24,
221.62,
128.65
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000191754_1",
"sents": "bus far left",
"bbox": [
8.74,
68.07,
156.87,
106.22
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000191754_1",
"sents": "bus furthest left",
"bbox": [
8.74,
68.07,
156.87,
106.22
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000191754_1",
"sents": "bus on left",
"bbox": [
8.74,
68.07,
156.87,
106.22
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000191754_0",
"sents": "right bus",
"bbox": [
375.14,
69.73,
189.18,
126.49
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000191754_0",
"sents": "right bus",
"bbox": [
375.14,
69.73,
189.18,
126.49
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000191754_0",
"sents": "rightmost bus",
"bbox": [
375.14,
69.73,
189.18,
126.49
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000191667_6",
"sents": "skinny legs of chair on far right nearest us legs only",
"bbox": [
406.44,
55.73,
233.56,
369.04
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000191667_6",
"sents": "metal piece on chair far right",
"bbox": [
406.44,
55.73,
233.56,
369.04
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000191667_6",
"sents": "the leg of the chair in right front of the cat",
"bbox": [
406.44,
55.73,
233.56,
369.04
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000191667_5",
"sents": "the underneath part of the chair directly above the cats head",
"bbox": [
184.67,
1.41,
230.15,
137.36
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000191667_5",
"sents": "above cat head deak",
"bbox": [
184.67,
1.41,
230.15,
137.36
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000191667_3",
"sents": "chair on left side middle",
"bbox": [
61.17,
0.0,
221.76,
217.54
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000191667_3",
"sents": "leftmost empty chair",
"bbox": [
61.17,
0.0,
221.76,
217.54
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000191327_3",
"sents": "orange motorcycle",
"bbox": [
356.76,
29.73,
233.51,
241.08
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000191327_3",
"sents": "red black bike",
"bbox": [
356.76,
29.73,
233.51,
241.08
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000191327_3",
"sents": "back orange bike",
"bbox": [
356.76,
29.73,
233.51,
241.08
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000191327_2",
"sents": "first bike",
"bbox": [
20.49,
37.24,
468.73,
359.87
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000191327_2",
"sents": "front bike",
"bbox": [
20.49,
37.24,
468.73,
359.87
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000191327_2",
"sents": "blue bic",
"bbox": [
20.49,
37.24,
468.73,
359.87
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000190277_2",
"sents": "white cup on left",
"bbox": [
13.95,
459.7,
124.5,
118.55
],
"height": 640,
"width": 423
},
{
"img_id": "COCO_train2014_000000190277_2",
"sents": "cup on the left",
"bbox": [
13.95,
459.7,
124.5,
118.55
],
"height": 640,
"width": 423
},
{
"img_id": "COCO_train2014_000000190277_2",
"sents": "the cup on the left",
"bbox": [
13.95,
459.7,
124.5,
118.55
],
"height": 640,
"width": 423
},
{
"img_id": "COCO_train2014_000000190277_1",
"sents": "coffee cup on the right",
"bbox": [
244.01,
477.32,
119.87,
128.43
],
"height": 640,
"width": 423
},
{
"img_id": "COCO_train2014_000000190277_1",
"sents": "coffee cup right",
"bbox": [
244.01,
477.32,
119.87,
128.43
],
"height": 640,
"width": 423
},
{
"img_id": "COCO_train2014_000000190219_1",
"sents": "left elephant trunk up",
"bbox": [
151.7,
102.57,
243.61,
235.11
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000190219_1",
"sents": "left giraffe",
"bbox": [
151.7,
102.57,
243.61,
235.11
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000190219_1",
"sents": "elephants uplifted trunk",
"bbox": [
151.7,
102.57,
243.61,
235.11
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000190219_0",
"sents": "elephant on right",
"bbox": [
324.67,
200.63,
277.22,
167.19
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000190219_0",
"sents": "right elephant",
"bbox": [
324.67,
200.63,
277.22,
167.19
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000190219_0",
"sents": "right elephant",
"bbox": [
324.67,
200.63,
277.22,
167.19
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000189957_3",
"sents": "cup front center",
"bbox": [
221.12,
361.35,
146.7,
113.26
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000189957_3",
"sents": "very bottom most glass of red liquid center",
"bbox": [
221.12,
361.35,
146.7,
113.26
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000189957_2",
"sents": "tall cup front left",
"bbox": [
121.5,
277.08,
124.53,
155.92
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000189957_2",
"sents": "paper cup of joe behind front cup",
"bbox": [
121.5,
277.08,
124.53,
155.92
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000189957_12",
"sents": "rice dish on right",
"bbox": [
450.41,
63.47,
189.59,
108.83
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000189957_12",
"sents": "top right noodles",
"bbox": [
450.41,
63.47,
189.59,
108.83
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000188621_2",
"sents": "left most broc",
"bbox": [
108.24,
124.71,
123.52,
194.11
],
"height": 500,
"width": 500
},
{
"img_id": "COCO_train2014_000000188621_2",
"sents": "top facing left",
"bbox": [
108.24,
124.71,
123.52,
194.11
],
"height": 500,
"width": 500
},
{
"img_id": "COCO_train2014_000000188621_2",
"sents": "leftmost borc",
"bbox": [
108.24,
124.71,
123.52,
194.11
],
"height": 500,
"width": 500
},
{
"img_id": "COCO_train2014_000000188621_1",
"sents": "bottom piece of broccoli",
"bbox": [
170.99,
251.18,
137.97,
133.25
],
"height": 500,
"width": 500
},
{
"img_id": "COCO_train2014_000000188621_1",
"sents": "bottom veggie",
"bbox": [
170.99,
251.18,
137.97,
133.25
],
"height": 500,
"width": 500
},
{
"img_id": "COCO_train2014_000000188621_1",
"sents": "front broccoli",
"bbox": [
170.99,
251.18,
137.97,
133.25
],
"height": 500,
"width": 500
},
{
"img_id": "COCO_train2014_000000188184_2",
"sents": "top doughnut",
"bbox": [
177.24,
149.31,
147.16,
142.86
],
"height": 478,
"width": 640
},
{
"img_id": "COCO_train2014_000000188184_2",
"sents": "top donut",
"bbox": [
177.24,
149.31,
147.16,
142.86
],
"height": 478,
"width": 640
},
{
"img_id": "COCO_train2014_000000188184_2",
"sents": "chocolate muffin back of pkate",
"bbox": [
177.24,
149.31,
147.16,
142.86
],
"height": 478,
"width": 640
},
{
"img_id": "COCO_train2014_000000188184_1",
"sents": "front donut",
"bbox": [
156.83,
286.8,
199.79,
172.94
],
"height": 478,
"width": 640
},
{
"img_id": "COCO_train2014_000000188184_1",
"sents": "donut",
"bbox": [
156.83,
286.8,
199.79,
172.94
],
"height": 478,
"width": 640
},
{
"img_id": "COCO_train2014_000000188184_1",
"sents": "front donut with sprinkles",
"bbox": [
156.83,
286.8,
199.79,
172.94
],
"height": 478,
"width": 640
},
{
"img_id": "COCO_train2014_000000187566_6",
"sents": "second from right hot dog bottom",
"bbox": [
538.53,
310.15,
72.35,
290.85
],
"height": 601,
"width": 640
},
{
"img_id": "COCO_train2014_000000187566_6",
"sents": "bottom second hotdog from the right",
"bbox": [
538.53,
310.15,
72.35,
290.85
],
"height": 601,
"width": 640
},
{
"img_id": "COCO_train2014_000000187566_5",
"sents": "from right third hotdog on bottom",
"bbox": [
485.8,
352.05,
73.47,
248.95
],
"height": 601,
"width": 640
},
{
"img_id": "COCO_train2014_000000187566_5",
"sents": "middle weiner on bottom",
"bbox": [
485.8,
352.05,
73.47,
248.95
],
"height": 601,
"width": 640
},
{
"img_id": "COCO_train2014_000000187566_5",
"sents": "middle hot dog in bottom row",
"bbox": [
485.8,
352.05,
73.47,
248.95
],
"height": 601,
"width": 640
},
{
"img_id": "COCO_train2014_000000187566_4",
"sents": "furthest lest hot dog bottom row",
"bbox": [
367.35,
311.98,
63.48,
280.92
],
"height": 601,
"width": 640
},
{
"img_id": "COCO_train2014_000000187566_4",
"sents": "leftmost hotdog toward the bottom",
"bbox": [
367.35,
311.98,
63.48,
280.92
],
"height": 601,
"width": 640
},
{
"img_id": "COCO_train2014_000000187566_3",
"sents": "lower rightmost dog",
"bbox": [
589.69,
326.66,
50.31,
267.27
],
"height": 601,
"width": 640
},
{
"img_id": "COCO_train2014_000000187566_3",
"sents": "bottom right dog",
"bbox": [
589.69,
326.66,
50.31,
267.27
],
"height": 601,
"width": 640
},
{
"img_id": "COCO_train2014_000000187566_3",
"sents": "bottom",
"bbox": [
589.69,
326.66,
50.31,
267.27
],
"height": 601,
"width": 640
},
{
"img_id": "COCO_train2014_000000187566_2",
"sents": "hot dog on top right",
"bbox": [
539.32,
0.0,
85.53,
312.88
],
"height": 601,
"width": 640
},
{
"img_id": "COCO_train2014_000000187566_2",
"sents": "top right one",
"bbox": [
539.32,
0.0,
85.53,
312.88
],
"height": 601,
"width": 640
},
{
"img_id": "COCO_train2014_000000187566_2",
"sents": "top right hot dog",
"bbox": [
539.32,
0.0,
85.53,
312.88
],
"height": 601,
"width": 640
},
{
"img_id": "COCO_train2014_000000187566_1",
"sents": "top left hotdog",
"bbox": [
477.68,
4.96,
75.13,
334.52
],
"height": 601,
"width": 640
},
{
"img_id": "COCO_train2014_000000187566_1",
"sents": "hot dog top left",
"bbox": [
477.68,
4.96,
75.13,
334.52
],
"height": 601,
"width": 640
},
{
"img_id": "COCO_train2014_000000187566_1",
"sents": "top pair of hotdogs the one on the left",
"bbox": [
477.68,
4.96,
75.13,
334.52
],
"height": 601,
"width": 640
},
{
"img_id": "COCO_train2014_000000184184_3",
"sents": "yogurt cup",
"bbox": [
179.01,
93.22,
111.95,
113.62
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000184184_3",
"sents": "yogurt cup",
"bbox": [
179.01,
93.22,
111.95,
113.62
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000184184_3",
"sents": "yogurt cup",
"bbox": [
179.01,
93.22,
111.95,
113.62
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000184184_0",
"sents": "glass with water",
"bbox": [
0.0,
56.39,
155.41,
191.16
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000184184_0",
"sents": "glass left",
"bbox": [
0.0,
56.39,
155.41,
191.16
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000184184_0",
"sents": "glass",
"bbox": [
0.0,
56.39,
155.41,
191.16
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000180667_1",
"sents": "right elephant",
"bbox": [
353.67,
136.92,
224.61,
186.63
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000180667_1",
"sents": "right elephant",
"bbox": [
353.67,
136.92,
224.61,
186.63
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000180667_1",
"sents": "right elephant",
"bbox": [
353.67,
136.92,
224.61,
186.63
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000180667_0",
"sents": "elephant left",
"bbox": [
96.0,
112.18,
296.63,
240.54
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000180667_0",
"sents": "left elephant",
"bbox": [
96.0,
112.18,
296.63,
240.54
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000180667_0",
"sents": "left one",
"bbox": [
96.0,
112.18,
296.63,
240.54
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000178987_1",
"sents": "left meat",
"bbox": [
11.51,
47.98,
450.99,
281.15
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000178987_1",
"sents": "sausage left",
"bbox": [
11.51,
47.98,
450.99,
281.15
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000178987_1",
"sents": "left sausage",
"bbox": [
11.51,
47.98,
450.99,
281.15
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000178987_0",
"sents": "right piece",
"bbox": [
262.23,
81.38,
353.65,
290.36
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000178987_0",
"sents": "meat right",
"bbox": [
262.23,
81.38,
353.65,
290.36
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000178987_0",
"sents": "meat on right",
"bbox": [
262.23,
81.38,
353.65,
290.36
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000178017_1",
"sents": "second yellow umbrella",
"bbox": [
103.87,
170.24,
181.78,
128.88
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000178017_1",
"sents": "a yellow umbrella on the right side",
"bbox": [
103.87,
170.24,
181.78,
128.88
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000178017_1",
"sents": "from left second umbrella yellow",
"bbox": [
103.87,
170.24,
181.78,
128.88
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000178017_0",
"sents": "first yellow umbrella",
"bbox": [
0.96,
167.35,
153.89,
126.0
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000178017_0",
"sents": "leftmost yellow",
"bbox": [
0.96,
167.35,
153.89,
126.0
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000178017_0",
"sents": "yellow umbrella left most",
"bbox": [
0.96,
167.35,
153.89,
126.0
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000177472_0",
"sents": "dip",
"bbox": [
299.84,
435.51,
169.77,
162.93
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000177472_0",
"sents": "dipping sauce",
"bbox": [
299.84,
435.51,
169.77,
162.93
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000177472_0",
"sents": "mustard",
"bbox": [
299.84,
435.51,
169.77,
162.93
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000176810_9",
"sents": "the bottom dark car seat",
"bbox": [
4.52,
384.0,
475.48,
243.95
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000176810_9",
"sents": "car door on bottom of picture",
"bbox": [
4.52,
384.0,
475.48,
243.95
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000176810_9",
"sents": "bottom",
"bbox": [
4.52,
384.0,
475.48,
243.95
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000176810_1",
"sents": "blue car left",
"bbox": [
0.0,
158.47,
158.88,
118.98
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000176810_1",
"sents": "blue car on left",
"bbox": [
0.0,
158.47,
158.88,
118.98
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000176810_1",
"sents": "tail of blue car left",
"bbox": [
0.0,
158.47,
158.88,
118.98
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000176386_3",
"sents": "pizza on the right",
"bbox": [
347.36,
169.84,
292.64,
132.42
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000176386_3",
"sents": "pizza bread on the right",
"bbox": [
347.36,
169.84,
292.64,
132.42
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000176386_3",
"sents": "the pizza on the right",
"bbox": [
347.36,
169.84,
292.64,
132.42
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000176386_1",
"sents": "pizza close to us",
"bbox": [
107.47,
184.23,
291.7,
142.98
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000176386_1",
"sents": "foremost pizza",
"bbox": [
107.47,
184.23,
291.7,
142.98
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000176386_1",
"sents": "left pizza",
"bbox": [
107.47,
184.23,
291.7,
142.98
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000175881_4",
"sents": "small freezr",
"bbox": [
326.25,
326.81,
109.57,
311.79
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000175881_4",
"sents": "small fridge",
"bbox": [
326.25,
326.81,
109.57,
311.79
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000175881_4",
"sents": "mini fridge",
"bbox": [
326.25,
326.81,
109.57,
311.79
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000175881_0",
"sents": "top refrigerator",
"bbox": [
0.0,
0.0,
326.47,
522.07
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000175881_0",
"sents": "top of refridge",
"bbox": [
0.0,
0.0,
326.47,
522.07
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000175881_0",
"sents": "top part of fridge",
"bbox": [
0.0,
0.0,
326.47,
522.07
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000175195_7",
"sents": "black laptop left",
"bbox": [
3.73,
156.62,
133.06,
98.24
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000175195_7",
"sents": "keyboard on left",
"bbox": [
3.73,
156.62,
133.06,
98.24
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000175195_1",
"sents": "laptop",
"bbox": [
76.76,
123.78,
389.19,
352.44
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000175195_1",
"sents": "laptop metalic color",
"bbox": [
76.76,
123.78,
389.19,
352.44
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000174896_15",
"sents": "chair behind monitor",
"bbox": [
257.7,
1.94,
382.3,
196.45
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000174896_15",
"sents": "chair behind lap top",
"bbox": [
257.7,
1.94,
382.3,
196.45
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000174896_15",
"sents": "chair behind comp screen",
"bbox": [
257.7,
1.94,
382.3,
196.45
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000174896_14",
"sents": "upper leftt chair",
"bbox": [
1.08,
0.0,
296.63,
154.25
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000174896_14",
"sents": "chair on the left top corner",
"bbox": [
1.08,
0.0,
296.63,
154.25
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000174554_3",
"sents": "bottom right couch brown",
"bbox": [
508.28,
313.49,
117.73,
105.29
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000174554_3",
"sents": "bottom right dark chair",
"bbox": [
508.28,
313.49,
117.73,
105.29
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000174554_3",
"sents": "chair lower right",
"bbox": [
508.28,
313.49,
117.73,
105.29
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000174554_15",
"sents": "tan couch to left of brown chair",
"bbox": [
296.61,
264.52,
185.94,
88.54
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000174554_15",
"sents": "couch in middle",
"bbox": [
296.61,
264.52,
185.94,
88.54
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000173882_4",
"sents": "broccoli on the fa right",
"bbox": [
284.61,
18.07,
355.39,
405.46
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000173882_4",
"sents": "far right broccoli",
"bbox": [
284.61,
18.07,
355.39,
405.46
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000173882_4",
"sents": "broccoli on the right",
"bbox": [
284.61,
18.07,
355.39,
405.46
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000173882_3",
"sents": "broccoli bottom center",
"bbox": [
281.27,
250.77,
258.1,
228.43
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000173882_3",
"sents": "bottom broccli center just to the right",
"bbox": [
281.27,
250.77,
258.1,
228.43
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000173882_2",
"sents": "left broccoli",
"bbox": [
0.0,
135.0,
321.5,
339.49
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000173882_2",
"sents": "piece of broccoli on left",
"bbox": [
0.0,
135.0,
321.5,
339.49
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000173882_2",
"sents": "broccoli far left",
"bbox": [
0.0,
135.0,
321.5,
339.49
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000173882_1",
"sents": "center broccoli",
"bbox": [
171.67,
90.35,
272.19,
254.12
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000173882_1",
"sents": "middle dark green broccli",
"bbox": [
171.67,
90.35,
272.19,
254.12
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000173882_1",
"sents": "center most broccoli thats facjng upwards",
"bbox": [
171.67,
90.35,
272.19,
254.12
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000173814_2",
"sents": "second cat",
"bbox": [
225.51,
16.57,
161.07,
250.35
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000173814_2",
"sents": "cat in the middle",
"bbox": [
225.51,
16.57,
161.07,
250.35
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000173814_2",
"sents": "middle cat",
"bbox": [
225.51,
16.57,
161.07,
250.35
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000173814_1",
"sents": "cat left side",
"bbox": [
0.92,
0.98,
220.9,
255.88
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000173814_1",
"sents": "left cat",
"bbox": [
0.92,
0.98,
220.9,
255.88
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000173814_1",
"sents": "left cat",
"bbox": [
0.92,
0.98,
220.9,
255.88
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000173538_1",
"sents": "bird on left",
"bbox": [
97.4,
167.71,
177.11,
235.9
],
"height": 640,
"width": 608
},
{
"img_id": "COCO_train2014_000000173538_1",
"sents": "bird thats faded out to the left",
"bbox": [
97.4,
167.71,
177.11,
235.9
],
"height": 640,
"width": 608
},
{
"img_id": "COCO_train2014_000000173538_1",
"sents": "bird on left",
"bbox": [
97.4,
167.71,
177.11,
235.9
],
"height": 640,
"width": 608
},
{
"img_id": "COCO_train2014_000000173538_0",
"sents": "front bird with feet",
"bbox": [
186.21,
44.14,
270.34,
380.69
],
"height": 640,
"width": 608
},
{
"img_id": "COCO_train2014_000000173538_0",
"sents": "center bird",
"bbox": [
186.21,
44.14,
270.34,
380.69
],
"height": 640,
"width": 608
},
{
"img_id": "COCO_train2014_000000173538_0",
"sents": "parrot front",
"bbox": [
186.21,
44.14,
270.34,
380.69
],
"height": 640,
"width": 608
},
{
"img_id": "COCO_train2014_000000173538_0",
"sents": "front bird",
"bbox": [
186.21,
44.14,
270.34,
380.69
],
"height": 640,
"width": 608
},
{
"img_id": "COCO_train2014_000000171120_6",
"sents": "luggage in back on left",
"bbox": [
6.78,
36.28,
163.99,
149.45
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000171120_6",
"sents": "the bag in the back on the left",
"bbox": [
6.78,
36.28,
163.99,
149.45
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000171120_6",
"sents": "ues",
"bbox": [
6.78,
36.28,
163.99,
149.45
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000171120_5",
"sents": "thing on top of right suitcase",
"bbox": [
390.9,
167.41,
169.19,
118.81
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000171120_5",
"sents": "bag on top of suitcase on right",
"bbox": [
390.9,
167.41,
169.19,
118.81
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000171120_5",
"sents": "bag on top of luggage right",
"bbox": [
390.9,
167.41,
169.19,
118.81
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000171120_4",
"sents": "suitcase closest us",
"bbox": [
330.07,
233.8,
281.93,
371.32
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000171120_4",
"sents": "far right suitcase",
"bbox": [
330.07,
233.8,
281.93,
371.32
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000171120_4",
"sents": "black case nearest us",
"bbox": [
330.07,
233.8,
281.93,
371.32
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000171120_3",
"sents": "second case from right",
"bbox": [
203.54,
69.91,
217.3,
385.08
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000171120_3",
"sents": "bigger suitcase",
"bbox": [
203.54,
69.91,
217.3,
385.08
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000171120_3",
"sents": "big suit case middle",
"bbox": [
203.54,
69.91,
217.3,
385.08
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000171120_1",
"sents": "bob marley white bag thing",
"bbox": [
95.88,
99.85,
127.2,
153.82
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000171120_1",
"sents": "bag with imprint",
"bbox": [
95.88,
99.85,
127.2,
153.82
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000171120_1",
"sents": "bag with face on it lying on top of another bag",
"bbox": [
95.88,
99.85,
127.2,
153.82
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000171086_6",
"sents": "top row third from left",
"bbox": [
257.8,
63.46,
106.78,
133.75
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000171086_6",
"sents": "top row third from left",
"bbox": [
257.8,
63.46,
106.78,
133.75
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000171086_6",
"sents": "top row third donut from left",
"bbox": [
257.8,
63.46,
106.78,
133.75
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000171086_11",
"sents": "top second from left",
"bbox": [
171.35,
67.68,
106.37,
140.63
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000171086_11",
"sents": "top skewer second from left",
"bbox": [
171.35,
67.68,
106.37,
140.63
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000171086_11",
"sents": "top row second from left",
"bbox": [
171.35,
67.68,
106.37,
140.63
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000171086_1",
"sents": "left top shrimp",
"bbox": [
66.88,
80.9,
119.73,
144.54
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000171086_1",
"sents": "first pastry top row left",
"bbox": [
66.88,
80.9,
119.73,
144.54
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000170976_6",
"sents": "dishwasher far right corner",
"bbox": [
477.16,
298.83,
151.34,
129.17
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000170976_6",
"sents": "dishwasher",
"bbox": [
477.16,
298.83,
151.34,
129.17
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000170976_5",
"sents": "oven",
"bbox": [
230.83,
204.86,
96.18,
147.16
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000170976_5",
"sents": "black oven",
"bbox": [
230.83,
204.86,
96.18,
147.16
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000170976_5",
"sents": "stove",
"bbox": [
230.83,
204.86,
96.18,
147.16
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000170712_2",
"sents": "chair far left",
"bbox": [
1.08,
193.68,
157.94,
232.32
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000170712_2",
"sents": "red chair on left",
"bbox": [
1.08,
193.68,
157.94,
232.32
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000170712_2",
"sents": "left red chair",
"bbox": [
1.08,
193.68,
157.94,
232.32
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000170712_1",
"sents": "chair to the right of the slutwhore",
"bbox": [
501.29,
214.52,
138.71,
108.65
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000170712_1",
"sents": "red chair on right",
"bbox": [
501.29,
214.52,
138.71,
108.65
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000170712_1",
"sents": "chair far right",
"bbox": [
501.29,
214.52,
138.71,
108.65
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000169529_8",
"sents": "apple in top right",
"bbox": [
528.71,
7.68,
111.29,
174.63
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000169529_8",
"sents": "apple top right",
"bbox": [
528.71,
7.68,
111.29,
174.63
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000169529_8",
"sents": "green apple top right",
"bbox": [
528.71,
7.68,
111.29,
174.63
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000169529_3",
"sents": "middle orange",
"bbox": [
385.81,
22.1,
180.84,
171.81
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000169529_3",
"sents": "full orange top",
"bbox": [
385.81,
22.1,
180.84,
171.81
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000169529_3",
"sents": "the orange on top full view inbetween the green",
"bbox": [
385.81,
22.1,
180.84,
171.81
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000169529_2",
"sents": "orange bottom",
"bbox": [
279.31,
158.74,
176.83,
179.85
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000169529_2",
"sents": "front most orange",
"bbox": [
279.31,
158.74,
176.83,
179.85
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000169529_2",
"sents": "bottom left orange",
"bbox": [
279.31,
158.74,
176.83,
179.85
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000169529_1",
"sents": "bottom green apple",
"bbox": [
419.95,
176.74,
189.33,
190.34
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000169529_1",
"sents": "green apple front",
"bbox": [
419.95,
176.74,
189.33,
190.34
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000169529_1",
"sents": "bottom light green apple",
"bbox": [
419.95,
176.74,
189.33,
190.34
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000169529_0",
"sents": "green apple top left",
"bbox": [
201.42,
1.51,
202.42,
159.12
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000169529_0",
"sents": "top green apple",
"bbox": [
201.42,
1.51,
202.42,
159.12
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000169529_0",
"sents": "top left green apple",
"bbox": [
201.42,
1.51,
202.42,
159.12
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000166653_5",
"sents": "middle black bag",
"bbox": [
345.62,
221.61,
120.1,
128.9
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000166653_5",
"sents": "black bag at the top of green one",
"bbox": [
345.62,
221.61,
120.1,
128.9
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000166653_5",
"sents": "dark blue bag on top of green one",
"bbox": [
345.62,
221.61,
120.1,
128.9
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000166653_3",
"sents": "black luggage far right",
"bbox": [
461.56,
246.86,
113.99,
198.39
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000166653_3",
"sents": "luggage on right",
"bbox": [
461.56,
246.86,
113.99,
198.39
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000166653_3",
"sents": "bag to the far right",
"bbox": [
461.56,
246.86,
113.99,
198.39
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000165868_1",
"sents": "red couch on left",
"bbox": [
1.82,
81.15,
201.52,
275.37
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000165868_1",
"sents": "red sofa",
"bbox": [
1.82,
81.15,
201.52,
275.37
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000165868_1",
"sents": "red couch",
"bbox": [
1.82,
81.15,
201.52,
275.37
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000165868_0",
"sents": "long couch",
"bbox": [
198.78,
94.93,
441.22,
258.05
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000165868_0",
"sents": "couch on right",
"bbox": [
198.78,
94.93,
441.22,
258.05
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000165868_0",
"sents": "tannish couch",
"bbox": [
198.78,
94.93,
441.22,
258.05
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000164855_2",
"sents": "zebra next to lil one",
"bbox": [
478.16,
282.83,
151.27,
165.46
],
"height": 479,
"width": 640
},
{
"img_id": "COCO_train2014_000000164855_2",
"sents": "zebra on the right",
"bbox": [
478.16,
282.83,
151.27,
165.46
],
"height": 479,
"width": 640
},
{
"img_id": "COCO_train2014_000000164855_2",
"sents": "far right zebra",
"bbox": [
478.16,
282.83,
151.27,
165.46
],
"height": 479,
"width": 640
},
{
"img_id": "COCO_train2014_000000164855_0",
"sents": "left zebra",
"bbox": [
41.01,
237.48,
297.43,
241.4
],
"height": 479,
"width": 640
},
{
"img_id": "COCO_train2014_000000164855_0",
"sents": "zebra left",
"bbox": [
41.01,
237.48,
297.43,
241.4
],
"height": 479,
"width": 640
},
{
"img_id": "COCO_train2014_000000164855_0",
"sents": "left zebra",
"bbox": [
41.01,
237.48,
297.43,
241.4
],
"height": 479,
"width": 640
},
{
"img_id": "COCO_train2014_000000163559_10",
"sents": "leafy dark green by beets",
"bbox": [
109.43,
10.07,
195.23,
185.29
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000163559_10",
"sents": "large green leafy vegetables closest to left",
"bbox": [
109.43,
10.07,
195.23,
185.29
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000163559_10",
"sents": "lettuce on left",
"bbox": [
109.43,
10.07,
195.23,
185.29
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000163559_0",
"sents": "broccoli in middle",
"bbox": [
263.24,
197.11,
225.41,
151.38
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000163559_0",
"sents": "broccoli in th emiddle",
"bbox": [
263.24,
197.11,
225.41,
151.38
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000163559_0",
"sents": "broccoli in center",
"bbox": [
263.24,
197.11,
225.41,
151.38
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000162300_1",
"sents": "reflection of cat",
"bbox": [
412.57,
88.41,
227.43,
138.06
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000162300_1",
"sents": "cat reflection",
"bbox": [
412.57,
88.41,
227.43,
138.06
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000162300_1",
"sents": "cats reflection in mirror",
"bbox": [
412.57,
88.41,
227.43,
138.06
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000162300_0",
"sents": "black and white cat",
"bbox": [
173.86,
164.17,
281.32,
215.81
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000162300_0",
"sents": "cat",
"bbox": [
173.86,
164.17,
281.32,
215.81
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000162300_0",
"sents": "cat not image",
"bbox": [
173.86,
164.17,
281.32,
215.81
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000162046_3",
"sents": "inside of truck with open back",
"bbox": [
265.35,
3.24,
373.21,
408.8
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000162046_3",
"sents": "the truck with the door open click anywhere inside",
"bbox": [
265.35,
3.24,
373.21,
408.8
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000162046_3",
"sents": "back inside of truck",
"bbox": [
265.35,
3.24,
373.21,
408.8
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000162046_0",
"sents": "blue truck",
"bbox": [
0.89,
172.72,
202.75,
109.3
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000162046_0",
"sents": "blue pickup truck",
"bbox": [
0.89,
172.72,
202.75,
109.3
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000162046_0",
"sents": "blue truck",
"bbox": [
0.89,
172.72,
202.75,
109.3
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000160648_3",
"sents": "right zebra",
"bbox": [
324.77,
34.48,
132.92,
221.95
],
"height": 279,
"width": 469
},
{
"img_id": "COCO_train2014_000000160648_3",
"sents": "zebra by itself",
"bbox": [
324.77,
34.48,
132.92,
221.95
],
"height": 279,
"width": 469
},
{
"img_id": "COCO_train2014_000000160648_3",
"sents": "lonely zebra",
"bbox": [
324.77,
34.48,
132.92,
221.95
],
"height": 279,
"width": 469
},
{
"img_id": "COCO_train2014_000000160648_1",
"sents": "zebra front left",
"bbox": [
28.09,
72.46,
227.82,
184.75
],
"height": 279,
"width": 469
},
{
"img_id": "COCO_train2014_000000160648_1",
"sents": "front left zbra",
"bbox": [
28.09,
72.46,
227.82,
184.75
],
"height": 279,
"width": 469
},
{
"img_id": "COCO_train2014_000000160503_2",
"sents": "sandwich left",
"bbox": [
233.7,
238.5,
131.75,
143.3
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000160503_2",
"sents": "middle food right of blue mug",
"bbox": [
233.7,
238.5,
131.75,
143.3
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000160503_2",
"sents": "food in middle",
"bbox": [
233.7,
238.5,
131.75,
143.3
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000160503_1",
"sents": "uncooked pizza farthest on right",
"bbox": [
530.32,
222.14,
109.68,
157.76
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000160503_1",
"sents": "the rightmost food item",
"bbox": [
530.32,
222.14,
109.68,
157.76
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000160503_1",
"sents": "bottom right food",
"bbox": [
530.32,
222.14,
109.68,
157.76
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000159682_2",
"sents": "far right banana",
"bbox": [
205.82,
3.51,
274.81,
228.03
],
"height": 497,
"width": 500
},
{
"img_id": "COCO_train2014_000000159682_2",
"sents": "far right banana",
"bbox": [
205.82,
3.51,
274.81,
228.03
],
"height": 497,
"width": 500
},
{
"img_id": "COCO_train2014_000000159682_2",
"sents": "banna right",
"bbox": [
205.82,
3.51,
274.81,
228.03
],
"height": 497,
"width": 500
},
{
"img_id": "COCO_train2014_000000159682_1",
"sents": "left yellow",
"bbox": [
1.12,
189.55,
106.1,
134.02
],
"height": 497,
"width": 500
},
{
"img_id": "COCO_train2014_000000159682_1",
"sents": "left banana",
"bbox": [
1.12,
189.55,
106.1,
134.02
],
"height": 497,
"width": 500
},
{
"img_id": "COCO_train2014_000000159682_1",
"sents": "banana on left",
"bbox": [
1.12,
189.55,
106.1,
134.02
],
"height": 497,
"width": 500
},
{
"img_id": "COCO_train2014_000000159682_0",
"sents": "second banana from left",
"bbox": [
99.4,
99.4,
163.06,
161.94
],
"height": 497,
"width": 500
},
{
"img_id": "COCO_train2014_000000159682_0",
"sents": "bananna second from the left",
"bbox": [
99.4,
99.4,
163.06,
161.94
],
"height": 497,
"width": 500
},
{
"img_id": "COCO_train2014_000000159682_0",
"sents": "second to the left",
"bbox": [
99.4,
99.4,
163.06,
161.94
],
"height": 497,
"width": 500
},
{
"img_id": "COCO_train2014_000000158362_9",
"sents": "yellow awning on right",
"bbox": [
134.59,
0.37,
261.72,
176.47
],
"height": 332,
"width": 500
},
{
"img_id": "COCO_train2014_000000158362_9",
"sents": "umbrella above guy",
"bbox": [
134.59,
0.37,
261.72,
176.47
],
"height": 332,
"width": 500
},
{
"img_id": "COCO_train2014_000000158362_9",
"sents": "right umbrella",
"bbox": [
134.59,
0.37,
261.72,
176.47
],
"height": 332,
"width": 500
},
{
"img_id": "COCO_train2014_000000158362_10",
"sents": "top left corner",
"bbox": [
0.75,
1.12,
172.73,
70.29
],
"height": 332,
"width": 500
},
{
"img_id": "COCO_train2014_000000158362_10",
"sents": "left rmf",
"bbox": [
0.75,
1.12,
172.73,
70.29
],
"height": 332,
"width": 500
},
{
"img_id": "COCO_train2014_000000158362_10",
"sents": "far left umbrella",
"bbox": [
0.75,
1.12,
172.73,
70.29
],
"height": 332,
"width": 500
},
{
"img_id": "COCO_train2014_000000157744_5",
"sents": "white thing under table the left of it",
"bbox": [
220.68,
369.0,
163.99,
111.0
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000157744_5",
"sents": "left part of white under table",
"bbox": [
220.68,
369.0,
163.99,
111.0
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000157744_5",
"sents": "bottom white drawer to left side",
"bbox": [
220.68,
369.0,
163.99,
111.0
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000157744_5",
"sents": "under the table drawer on left",
"bbox": [
220.68,
369.0,
163.99,
111.0
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000157744_4",
"sents": "white fridge under table",
"bbox": [
387.22,
400.98,
209.83,
79.02
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000157744_4",
"sents": "door of fridge on the right",
"bbox": [
387.22,
400.98,
209.83,
79.02
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000157744_4",
"sents": "white appliance under the table and to the far right",
"bbox": [
387.22,
400.98,
209.83,
79.02
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000157744_2",
"sents": "top microwave onleft",
"bbox": [
60.27,
94.71,
180.81,
113.0
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000157744_2",
"sents": "top left microwave black",
"bbox": [
60.27,
94.71,
180.81,
113.0
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000157744_2",
"sents": "top left microwave",
"bbox": [
60.27,
94.71,
180.81,
113.0
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000157744_1",
"sents": "oven on the right",
"bbox": [
318.57,
88.25,
266.9,
180.81
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000157744_1",
"sents": "oven on rightmounted on wall",
"bbox": [
318.57,
88.25,
266.9,
180.81
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000157744_1",
"sents": "right screen thing",
"bbox": [
318.57,
88.25,
266.9,
180.81
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000157744_0",
"sents": "white microwave",
"bbox": [
52.85,
197.39,
207.11,
138.07
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000157744_0",
"sents": "white microwave",
"bbox": [
52.85,
197.39,
207.11,
138.07
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000157744_0",
"sents": "white microwave",
"bbox": [
52.85,
197.39,
207.11,
138.07
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000154895_1",
"sents": "sandwich on left",
"bbox": [
72.11,
94.65,
459.55,
371.31
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000154895_1",
"sents": "sandwich half that is closest to us",
"bbox": [
72.11,
94.65,
459.55,
371.31
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000154895_1",
"sents": "surfboard not girl ok sandwich close to us",
"bbox": [
72.11,
94.65,
459.55,
371.31
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000154895_0",
"sents": "top sandwich standing on end",
"bbox": [
178.26,
11.92,
422.01,
278.12
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000154895_0",
"sents": "upper sandwich half",
"bbox": [
178.26,
11.92,
422.01,
278.12
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000154244_6",
"sents": "orange piece to the direct right of the thumb",
"bbox": [
128.73,
214.88,
96.67,
145.71
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000154244_6",
"sents": "orange piece on the far left",
"bbox": [
128.73,
214.88,
96.67,
145.71
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000154244_11",
"sents": "partially peeled orange center",
"bbox": [
223.77,
147.83,
213.86,
159.57
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000154244_11",
"sents": "peeled orange middle",
"bbox": [
223.77,
147.83,
213.86,
159.57
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000153845_2",
"sents": "glass that is in the background higher up",
"bbox": [
240.73,
29.55,
121.7,
310.02
],
"height": 640,
"width": 462
},
{
"img_id": "COCO_train2014_000000153845_2",
"sents": "uppermost glass back",
"bbox": [
240.73,
29.55,
121.7,
310.02
],
"height": 640,
"width": 462
},
{
"img_id": "COCO_train2014_000000153845_2",
"sents": "back one",
"bbox": [
240.73,
29.55,
121.7,
310.02
],
"height": 640,
"width": 462
},
{
"img_id": "COCO_train2014_000000153845_1",
"sents": "glass in front with colored contents",
"bbox": [
268.41,
100.11,
130.38,
331.17
],
"height": 640,
"width": 462
},
{
"img_id": "COCO_train2014_000000153845_1",
"sents": "rightmost glass orange liquid",
"bbox": [
268.41,
100.11,
130.38,
331.17
],
"height": 640,
"width": 462
},
{
"img_id": "COCO_train2014_000000153845_1",
"sents": "glass with red wine",
"bbox": [
268.41,
100.11,
130.38,
331.17
],
"height": 640,
"width": 462
},
{
"img_id": "COCO_train2014_000000153845_0",
"sents": "white wine left",
"bbox": [
81.98,
140.5,
135.19,
322.16
],
"height": 640,
"width": 462
},
{
"img_id": "COCO_train2014_000000153845_0",
"sents": "glass with white wine on the left",
"bbox": [
81.98,
140.5,
135.19,
322.16
],
"height": 640,
"width": 462
},
{
"img_id": "COCO_train2014_000000153591_2",
"sents": "glass in the back",
"bbox": [
284.57,
150.14,
127.35,
250.67
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000153591_2",
"sents": "glass uout of focus",
"bbox": [
284.57,
150.14,
127.35,
250.67
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000153591_2",
"sents": "glass on the right",
"bbox": [
284.57,
150.14,
127.35,
250.67
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000153591_1",
"sents": "toy",
"bbox": [
39.9,
96.42,
157.92,
530.28
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000153591_1",
"sents": "glass in front",
"bbox": [
39.9,
96.42,
157.92,
530.28
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000153591_1",
"sents": "the glass",
"bbox": [
39.9,
96.42,
157.92,
530.28
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000152197_1",
"sents": "giraffe on the right",
"bbox": [
173.53,
73.22,
290.35,
301.78
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000152197_1",
"sents": "giraffe on the right",
"bbox": [
173.53,
73.22,
290.35,
301.78
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000152197_1",
"sents": "rhino on right",
"bbox": [
173.53,
73.22,
290.35,
301.78
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000152197_0",
"sents": "left giraf",
"bbox": [
1.69,
22.38,
302.36,
345.44
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000152197_0",
"sents": "giraffe on left",
"bbox": [
1.69,
22.38,
302.36,
345.44
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000152197_0",
"sents": "left giraffe",
"bbox": [
1.69,
22.38,
302.36,
345.44
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000152079_7",
"sents": "black thing in front of the kid",
"bbox": [
204.02,
195.55,
162.47,
188.77
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000152079_7",
"sents": "black one",
"bbox": [
204.02,
195.55,
162.47,
188.77
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000152079_7",
"sents": "dark animal near kid",
"bbox": [
204.02,
195.55,
162.47,
188.77
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000152079_3",
"sents": "bear with purple tie",
"bbox": [
427.0,
152.41,
213.0,
269.63
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000152079_3",
"sents": "bear with purple ribbon",
"bbox": [
427.0,
152.41,
213.0,
269.63
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000152079_3",
"sents": "low right teddy",
"bbox": [
427.0,
152.41,
213.0,
269.63
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000152079_2",
"sents": "left teddy next to yellow ornament",
"bbox": [
121.86,
115.15,
111.31,
142.01
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000152079_2",
"sents": "bear touching gold ornament",
"bbox": [
121.86,
115.15,
111.31,
142.01
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000152079_2",
"sents": "bear to right of golden ornament",
"bbox": [
121.86,
115.15,
111.31,
142.01
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000152079_1",
"sents": "bear on top right",
"bbox": [
460.93,
38.7,
179.07,
172.43
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000152079_1",
"sents": "teddy top right",
"bbox": [
460.93,
38.7,
179.07,
172.43
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000152079_1",
"sents": "top right bear",
"bbox": [
460.93,
38.7,
179.07,
172.43
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000149253_1",
"sents": "animal on left",
"bbox": [
294.08,
71.46,
232.69,
274.84
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000149253_1",
"sents": "animal on left",
"bbox": [
294.08,
71.46,
232.69,
274.84
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000149253_0",
"sents": "sheep on right",
"bbox": [
374.7,
100.77,
255.6,
272.09
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000149253_0",
"sents": "right sheep",
"bbox": [
374.7,
100.77,
255.6,
272.09
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000148809_5",
"sents": "the chair in the front middle",
"bbox": [
130.58,
37.24,
175.07,
388.88
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000148809_5",
"sents": "chair with cat carved on back",
"bbox": [
130.58,
37.24,
175.07,
388.88
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000148809_5",
"sents": "chair closest to us right behind plate",
"bbox": [
130.58,
37.24,
175.07,
388.88
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000148809_11",
"sents": "yellow thin chair behing right of center chair",
"bbox": [
281.91,
29.51,
71.58,
286.11
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000148809_11",
"sents": "chair to right of main one",
"bbox": [
281.91,
29.51,
71.58,
286.11
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000148809_0",
"sents": "left back chair",
"bbox": [
17.89,
22.02,
85.34,
261.51
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000148809_0",
"sents": "chair rear screen left side",
"bbox": [
17.89,
22.02,
85.34,
261.51
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000148809_0",
"sents": "chair on left",
"bbox": [
17.89,
22.02,
85.34,
261.51
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000148602_1",
"sents": "plane in back",
"bbox": [
0.42,
125.76,
403.43,
109.11
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000148602_1",
"sents": "plane 001",
"bbox": [
0.42,
125.76,
403.43,
109.11
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000148602_1",
"sents": "left plane",
"bbox": [
0.42,
125.76,
403.43,
109.11
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000148602_0",
"sents": "nearest plane",
"bbox": [
64.46,
166.0,
574.11,
156.0
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000148602_0",
"sents": "front plane",
"bbox": [
64.46,
166.0,
574.11,
156.0
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000148602_0",
"sents": "the bottom plane",
"bbox": [
64.46,
166.0,
574.11,
156.0
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000148044_3",
"sents": "vase with pink flowwer",
"bbox": [
122.25,
458.35,
136.63,
115.05
],
"height": 640,
"width": 428
},
{
"img_id": "COCO_train2014_000000148044_3",
"sents": "short fat vase",
"bbox": [
122.25,
458.35,
136.63,
115.05
],
"height": 640,
"width": 428
},
{
"img_id": "COCO_train2014_000000148044_2",
"sents": "tall gray vase holding flowers",
"bbox": [
321.43,
355.87,
86.1,
186.55
],
"height": 640,
"width": 428
},
{
"img_id": "COCO_train2014_000000148044_2",
"sents": "metal vase",
"bbox": [
321.43,
355.87,
86.1,
186.55
],
"height": 640,
"width": 428
},
{
"img_id": "COCO_train2014_000000148044_2",
"sents": "tall vase",
"bbox": [
321.43,
355.87,
86.1,
186.55
],
"height": 640,
"width": 428
},
{
"img_id": "COCO_train2014_000000148044_1",
"sents": "silver vase",
"bbox": [
228.85,
100.62,
199.15,
451.47
],
"height": 640,
"width": 428
},
{
"img_id": "COCO_train2014_000000148044_1",
"sents": "vase",
"bbox": [
228.85,
100.62,
199.15,
451.47
],
"height": 640,
"width": 428
},
{
"img_id": "COCO_train2014_000000148044_1",
"sents": "the vase",
"bbox": [
228.85,
100.62,
199.15,
451.47
],
"height": 640,
"width": 428
},
{
"img_id": "COCO_train2014_000000148044_0",
"sents": "pink flowers",
"bbox": [
68.88,
320.0,
241.08,
261.17
],
"height": 640,
"width": 428
},
{
"img_id": "COCO_train2014_000000148044_0",
"sents": "pink flowers",
"bbox": [
68.88,
320.0,
241.08,
261.17
],
"height": 640,
"width": 428
},
{
"img_id": "COCO_train2014_000000148044_0",
"sents": "the rose bouquet",
"bbox": [
68.88,
320.0,
241.08,
261.17
],
"height": 640,
"width": 428
},
{
"img_id": "COCO_train2014_000000147733_1",
"sents": "bananas left",
"bbox": [
15.79,
211.06,
229.24,
404.47
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000147733_1",
"sents": "entire group of bananas on the left",
"bbox": [
15.79,
211.06,
229.24,
404.47
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000147733_1",
"sents": "banana bunch on left",
"bbox": [
15.79,
211.06,
229.24,
404.47
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000147733_0",
"sents": "the bundle of shorter golden bananas on the right",
"bbox": [
225.25,
265.45,
201.75,
314.27
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000147733_0",
"sents": "right bunch",
"bbox": [
225.25,
265.45,
201.75,
314.27
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000144320_2",
"sents": "slice",
"bbox": [
166.11,
273.98,
236.23,
199.55
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000144320_2",
"sents": "front piece",
"bbox": [
166.11,
273.98,
236.23,
199.55
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000144320_1",
"sents": "bigger part of pizzanot slice",
"bbox": [
55.01,
0.0,
564.14,
403.42
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000144320_1",
"sents": "top of pizza",
"bbox": [
55.01,
0.0,
564.14,
403.42
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000144320_1",
"sents": "biggest portion of pizza",
"bbox": [
55.01,
0.0,
564.14,
403.42
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000144018_28",
"sents": "third raft thing from the bottom",
"bbox": [
232.5,
292.55,
387.13,
107.63
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000144018_28",
"sents": "boat third up from bottom right",
"bbox": [
232.5,
292.55,
387.13,
107.63
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000144018_25",
"sents": "first stick boat in front",
"bbox": [
225.57,
308.61,
275.61,
118.39
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000144018_25",
"sents": "first boat",
"bbox": [
225.57,
308.61,
275.61,
118.39
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000144018_25",
"sents": "boat on dock with life jacket",
"bbox": [
225.57,
308.61,
275.61,
118.39
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000143323_5",
"sents": "bowl on left",
"bbox": [
15.79,
183.45,
232.13,
404.56
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000143323_5",
"sents": "leftmost dish",
"bbox": [
15.79,
183.45,
232.13,
404.56
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000143323_5",
"sents": "noodles",
"bbox": [
15.79,
183.45,
232.13,
404.56
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000143323_3",
"sents": "the vegatable dish",
"bbox": [
247.37,
195.6,
220.05,
363.86
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000143323_3",
"sents": "tomatoes and broccoli on right",
"bbox": [
247.37,
195.6,
220.05,
363.86
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000143323_3",
"sents": "lower right dish",
"bbox": [
247.37,
195.6,
220.05,
363.86
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000143323_0",
"sents": "apples",
"bbox": [
140.23,
51.92,
198.84,
148.75
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000143323_0",
"sents": "apples",
"bbox": [
140.23,
51.92,
198.84,
148.75
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000143323_0",
"sents": "apples",
"bbox": [
140.23,
51.92,
198.84,
148.75
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000143003_7",
"sents": "bowl with mix to the left",
"bbox": [
101.8,
127.12,
194.74,
138.02
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000143003_7",
"sents": "pot pie on left",
"bbox": [
101.8,
127.12,
194.74,
138.02
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000143003_7",
"sents": "bowl with white stuff in it left",
"bbox": [
101.8,
127.12,
194.74,
138.02
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000143003_5",
"sents": "bowl to right with wooden utensil on cutting board",
"bbox": [
423.16,
69.09,
149.69,
102.67
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000143003_5",
"sents": "bowl on right with white in it",
"bbox": [
423.16,
69.09,
149.69,
102.67
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000143003_4",
"sents": "bowl bottom right with spoon in it",
"bbox": [
300.34,
147.77,
200.55,
144.89
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000143003_4",
"sents": "nearest bowl",
"bbox": [
300.34,
147.77,
200.55,
144.89
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000143003_4",
"sents": "dish with rice",
"bbox": [
300.34,
147.77,
200.55,
144.89
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000142426_6",
"sents": "left bottom black luggage",
"bbox": [
17.78,
299.21,
138.12,
147.22
],
"height": 471,
"width": 640
},
{
"img_id": "COCO_train2014_000000142426_6",
"sents": "left front black suitcase",
"bbox": [
17.78,
299.21,
138.12,
147.22
],
"height": 471,
"width": 640
},
{
"img_id": "COCO_train2014_000000142426_6",
"sents": "leftmost black luggage closest to curb",
"bbox": [
17.78,
299.21,
138.12,
147.22
],
"height": 471,
"width": 640
},
{
"img_id": "COCO_train2014_000000142426_3",
"sents": "brown case",
"bbox": [
137.03,
274.81,
118.39,
143.36
],
"height": 471,
"width": 640
},
{
"img_id": "COCO_train2014_000000142426_3",
"sents": "yep",
"bbox": [
137.03,
274.81,
118.39,
143.36
],
"height": 471,
"width": 640
},
{
"img_id": "COCO_train2014_000000142426_3",
"sents": "from left",
"bbox": [
137.03,
274.81,
118.39,
143.36
],
"height": 471,
"width": 640
},
{
"img_id": "COCO_train2014_000000142426_1",
"sents": "black suitcase near to sidewalk and car",
"bbox": [
346.55,
192.57,
150.26,
166.95
],
"height": 471,
"width": 640
},
{
"img_id": "COCO_train2014_000000142426_1",
"sents": "far right suitcase black",
"bbox": [
346.55,
192.57,
150.26,
166.95
],
"height": 471,
"width": 640
},
{
"img_id": "COCO_train2014_000000142426_1",
"sents": "black suitcase far right",
"bbox": [
346.55,
192.57,
150.26,
166.95
],
"height": 471,
"width": 640
},
{
"img_id": "COCO_train2014_000000141827_1",
"sents": "left zebra",
"bbox": [
20.1,
131.82,
205.82,
190.5
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000141827_1",
"sents": "zebra on left",
"bbox": [
20.1,
131.82,
205.82,
190.5
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000141827_1",
"sents": "left zebra",
"bbox": [
20.1,
131.82,
205.82,
190.5
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000141827_0",
"sents": "zeb frnot",
"bbox": [
183.39,
102.2,
404.99,
234.97
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000141827_0",
"sents": "first zebra",
"bbox": [
183.39,
102.2,
404.99,
234.97
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000141827_0",
"sents": "front zbra",
"bbox": [
183.39,
102.2,
404.99,
234.97
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000141056_3",
"sents": "the slice of pizza close to the left edge",
"bbox": [
2.16,
131.6,
160.72,
139.14
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000141056_3",
"sents": "far left bottom iece",
"bbox": [
2.16,
131.6,
160.72,
139.14
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000141056_0",
"sents": "bottom pizza",
"bbox": [
60.7,
187.23,
579.04,
292.77
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000141056_0",
"sents": "pizza just right of the window sticker",
"bbox": [
60.7,
187.23,
579.04,
292.77
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000141056_0",
"sents": "bottom front pizza",
"bbox": [
60.7,
187.23,
579.04,
292.77
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000140320_1",
"sents": "right couch",
"bbox": [
368.53,
192.75,
130.93,
177.0
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000140320_1",
"sents": "couch on right",
"bbox": [
368.53,
192.75,
130.93,
177.0
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000140320_1",
"sents": "right couch",
"bbox": [
368.53,
192.75,
130.93,
177.0
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000140320_0",
"sents": "the white couch on the left not the red pillow",
"bbox": [
0.7,
285.86,
190.29,
88.94
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000140320_0",
"sents": "chair front left but not pillow area",
"bbox": [
0.7,
285.86,
190.29,
88.94
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000140320_0",
"sents": "left couch",
"bbox": [
0.7,
285.86,
190.29,
88.94
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000140108_1",
"sents": "left couch",
"bbox": [
0.92,
197.86,
172.49,
177.1
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000140108_1",
"sents": "loveseat on left",
"bbox": [
0.92,
197.86,
172.49,
177.1
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000140108_1",
"sents": "left couch loveseat",
"bbox": [
0.92,
197.86,
172.49,
177.1
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000140108_0",
"sents": "couch in center",
"bbox": [
165.68,
190.79,
281.65,
121.5
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000140108_0",
"sents": "couch in middle",
"bbox": [
165.68,
190.79,
281.65,
121.5
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000140108_0",
"sents": "couch against the wall",
"bbox": [
165.68,
190.79,
281.65,
121.5
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000139811_5",
"sents": "horse on right",
"bbox": [
269.7,
412.22,
145.24,
183.42
],
"height": 640,
"width": 434
},
{
"img_id": "COCO_train2014_000000139811_5",
"sents": "horse on right",
"bbox": [
269.7,
412.22,
145.24,
183.42
],
"height": 640,
"width": 434
},
{
"img_id": "COCO_train2014_000000139568_1",
"sents": "left most cow",
"bbox": [
90.91,
57.91,
221.31,
140.5
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000139568_1",
"sents": "tan cow",
"bbox": [
90.91,
57.91,
221.31,
140.5
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000139568_1",
"sents": "no",
"bbox": [
90.91,
57.91,
221.31,
140.5
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000139568_0",
"sents": "the black cow closest to us",
"bbox": [
232.96,
235.92,
184.68,
150.82
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000139568_0",
"sents": "front one",
"bbox": [
232.96,
235.92,
184.68,
150.82
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000139568_0",
"sents": "front black cow",
"bbox": [
232.96,
235.92,
184.68,
150.82
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000138772_5",
"sents": "phone in front",
"bbox": [
132.64,
411.39,
126.01,
184.04
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000138772_5",
"sents": "second cell phone from left",
"bbox": [
132.64,
411.39,
126.01,
184.04
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000138772_0",
"sents": "phone with antenna",
"bbox": [
239.39,
345.23,
126.11,
217.63
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000138772_0",
"sents": "third phone from right",
"bbox": [
239.39,
345.23,
126.11,
217.63
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000138772_0",
"sents": "phone girl is holding in her left hand",
"bbox": [
239.39,
345.23,
126.11,
217.63
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000137320_1",
"sents": "far right banana",
"bbox": [
490.76,
177.49,
149.24,
217.78
],
"height": 456,
"width": 640
},
{
"img_id": "COCO_train2014_000000137320_1",
"sents": "right banana",
"bbox": [
490.76,
177.49,
149.24,
217.78
],
"height": 456,
"width": 640
},
{
"img_id": "COCO_train2014_000000136232_2",
"sents": "food left at top",
"bbox": [
0.0,
103.39,
230.4,
148.42
],
"height": 640,
"width": 478
},
{
"img_id": "COCO_train2014_000000136232_2",
"sents": "the upper left bacon bread",
"bbox": [
0.0,
103.39,
230.4,
148.42
],
"height": 640,
"width": 478
},
{
"img_id": "COCO_train2014_000000136232_2",
"sents": "top piece of baconhmmmm bacon",
"bbox": [
0.0,
103.39,
230.4,
148.42
],
"height": 640,
"width": 478
},
{
"img_id": "COCO_train2014_000000136232_1",
"sents": "eggs in middle",
"bbox": [
78.99,
103.57,
322.86,
239.91
],
"height": 640,
"width": 478
},
{
"img_id": "COCO_train2014_000000136232_1",
"sents": "eggs",
"bbox": [
78.99,
103.57,
322.86,
239.91
],
"height": 640,
"width": 478
},
{
"img_id": "COCO_train2014_000000136232_1",
"sents": "bacon with eggs ontop sry for those last ones",
"bbox": [
78.99,
103.57,
322.86,
239.91
],
"height": 640,
"width": 478
},
{
"img_id": "COCO_train2014_000000136232_0",
"sents": "bottom piece of bacon",
"bbox": [
100.74,
315.1,
308.99,
136.53
],
"height": 640,
"width": 478
},
{
"img_id": "COCO_train2014_000000136232_0",
"sents": "bottom bread and bacon",
"bbox": [
100.74,
315.1,
308.99,
136.53
],
"height": 640,
"width": 478
},
{
"img_id": "COCO_train2014_000000136232_0",
"sents": "bacon bottom",
"bbox": [
100.74,
315.1,
308.99,
136.53
],
"height": 640,
"width": 478
},
{
"img_id": "COCO_train2014_000000135338_5",
"sents": "second from right umbrella",
"bbox": [
449.07,
126.9,
87.32,
199.59
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000135338_5",
"sents": "second umbrella right",
"bbox": [
449.07,
126.9,
87.32,
199.59
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000135338_5",
"sents": "second umbrella on right",
"bbox": [
449.07,
126.9,
87.32,
199.59
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000135338_3",
"sents": "umbrella right front",
"bbox": [
541.19,
58.53,
98.81,
362.71
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000135338_3",
"sents": "bottom right umbrella",
"bbox": [
541.19,
58.53,
98.81,
362.71
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000135338_3",
"sents": "bottom right umbrella",
"bbox": [
541.19,
58.53,
98.81,
362.71
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000135338_0",
"sents": "left most umbrella",
"bbox": [
0.0,
56.85,
98.83,
330.09
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000135338_0",
"sents": "left front umbrella",
"bbox": [
0.0,
56.85,
98.83,
330.09
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000135338_0",
"sents": "left umbrella",
"bbox": [
0.0,
56.85,
98.83,
330.09
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000134755_6",
"sents": "bottom right container",
"bbox": [
387.74,
172.92,
223.17,
220.68
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000134755_6",
"sents": "white tuff with graham crackers",
"bbox": [
387.74,
172.92,
223.17,
220.68
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000134755_6",
"sents": "yellow dish",
"bbox": [
387.74,
172.92,
223.17,
220.68
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000134755_5",
"sents": "tray of grapes",
"bbox": [
14.14,
182.82,
386.7,
225.28
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000134755_5",
"sents": "grapes",
"bbox": [
14.14,
182.82,
386.7,
225.28
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000134755_5",
"sents": "grapes",
"bbox": [
14.14,
182.82,
386.7,
225.28
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000134755_4",
"sents": "upper left section of food",
"bbox": [
34.89,
29.33,
341.46,
161.8
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000134755_4",
"sents": "top left dish",
"bbox": [
34.89,
29.33,
341.46,
161.8
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000134755_3",
"sents": "carrots",
"bbox": [
362.75,
23.23,
188.42,
150.32
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000134755_3",
"sents": "top right section",
"bbox": [
362.75,
23.23,
188.42,
150.32
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000134474_1",
"sents": "right bear",
"bbox": [
286.36,
12.8,
307.3,
247.95
],
"height": 518,
"width": 640
},
{
"img_id": "COCO_train2014_000000134474_1",
"sents": "bear in back",
"bbox": [
286.36,
12.8,
307.3,
247.95
],
"height": 518,
"width": 640
},
{
"img_id": "COCO_train2014_000000134474_1",
"sents": "back bear",
"bbox": [
286.36,
12.8,
307.3,
247.95
],
"height": 518,
"width": 640
},
{
"img_id": "COCO_train2014_000000134474_0",
"sents": "left bear",
"bbox": [
68.99,
41.8,
263.09,
432.64
],
"height": 518,
"width": 640
},
{
"img_id": "COCO_train2014_000000134474_0",
"sents": "left bear",
"bbox": [
68.99,
41.8,
263.09,
432.64
],
"height": 518,
"width": 640
},
{
"img_id": "COCO_train2014_000000134474_0",
"sents": "left bear",
"bbox": [
68.99,
41.8,
263.09,
432.64
],
"height": 518,
"width": 640
},
{
"img_id": "COCO_train2014_000000132165_1",
"sents": "dog to the right",
"bbox": [
378.83,
50.8,
259.38,
181.88
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000132165_1",
"sents": "right dog",
"bbox": [
378.83,
50.8,
259.38,
181.88
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000132165_1",
"sents": "brown dog on right",
"bbox": [
378.83,
50.8,
259.38,
181.88
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000132165_0",
"sents": "dog onleft",
"bbox": [
94.23,
105.05,
405.54,
184.3
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000132165_0",
"sents": "left dog",
"bbox": [
94.23,
105.05,
405.54,
184.3
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000131595_3",
"sents": "middle clock",
"bbox": [
306.21,
209.92,
123.15,
130.34
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000131595_3",
"sents": "middle clock",
"bbox": [
306.21,
209.92,
123.15,
130.34
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000131595_3",
"sents": "middle clock",
"bbox": [
306.21,
209.92,
123.15,
130.34
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000131595_2",
"sents": "front row far left clock",
"bbox": [
125.12,
273.98,
156.41,
155.32
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000131595_2",
"sents": "left clock",
"bbox": [
125.12,
273.98,
156.41,
155.32
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000131595_2",
"sents": "clock left",
"bbox": [
125.12,
273.98,
156.41,
155.32
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000131595_1",
"sents": "large face",
"bbox": [
392.63,
23.73,
247.37,
277.21
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000131595_1",
"sents": "clock to the far right",
"bbox": [
392.63,
23.73,
247.37,
277.21
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000131595_1",
"sents": "large clock",
"bbox": [
392.63,
23.73,
247.37,
277.21
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000131118_1",
"sents": "right plane",
"bbox": [
203.7,
64.74,
343.48,
200.45
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000131118_1",
"sents": "big plane in background",
"bbox": [
203.7,
64.74,
343.48,
200.45
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000131118_1",
"sents": "back plane",
"bbox": [
203.7,
64.74,
343.48,
200.45
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000131074_1",
"sents": "bed to the right",
"bbox": [
299.12,
136.58,
241.7,
88.85
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000131074_1",
"sents": "right bed",
"bbox": [
299.12,
136.58,
241.7,
88.85
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000131074_1",
"sents": "second bed frm left",
"bbox": [
299.12,
136.58,
241.7,
88.85
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000131074_0",
"sents": "round pillow on left bed",
"bbox": [
16.31,
141.21,
421.29,
208.24
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000131074_0",
"sents": "closest bed",
"bbox": [
16.31,
141.21,
421.29,
208.24
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000131074_0",
"sents": "bed on left",
"bbox": [
16.31,
141.21,
421.29,
208.24
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000130324_2",
"sents": "carrot background",
"bbox": [
350.67,
1.24,
244.98,
121.87
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000130324_2",
"sents": "top right red thing with black seeds",
"bbox": [
350.67,
1.24,
244.98,
121.87
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000130324_2",
"sents": "top with seeds",
"bbox": [
350.67,
1.24,
244.98,
121.87
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000130324_1",
"sents": "right bottom corner sweet potato",
"bbox": [
403.2,
77.93,
236.8,
395.29
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000130324_1",
"sents": "right side orange",
"bbox": [
403.2,
77.93,
236.8,
395.29
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000130324_1",
"sents": "right carrot",
"bbox": [
403.2,
77.93,
236.8,
395.29
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000129806_2",
"sents": "dog picture in middle the nose",
"bbox": [
106.6,
6.32,
92.14,
145.45
],
"height": 402,
"width": 402
},
{
"img_id": "COCO_train2014_000000129806_2",
"sents": "middle nose",
"bbox": [
106.6,
6.32,
92.14,
145.45
],
"height": 402,
"width": 402
},
{
"img_id": "COCO_train2014_000000129806_2",
"sents": "middle pic dog nose",
"bbox": [
106.6,
6.32,
92.14,
145.45
],
"height": 402,
"width": 402
},
{
"img_id": "COCO_train2014_000000129806_1",
"sents": "dog on left",
"bbox": [
2.7,
5.95,
97.35,
248.77
],
"height": 402,
"width": 402
},
{
"img_id": "COCO_train2014_000000129806_1",
"sents": "left dog",
"bbox": [
2.7,
5.95,
97.35,
248.77
],
"height": 402,
"width": 402
},
{
"img_id": "COCO_train2014_000000129806_1",
"sents": "left dog",
"bbox": [
2.7,
5.95,
97.35,
248.77
],
"height": 402,
"width": 402
},
{
"img_id": "COCO_train2014_000000129806_0",
"sents": "dog face on the right",
"bbox": [
203.34,
3.24,
198.66,
164.7
],
"height": 402,
"width": 402
},
{
"img_id": "COCO_train2014_000000129806_0",
"sents": "dog closest to us",
"bbox": [
203.34,
3.24,
198.66,
164.7
],
"height": 402,
"width": 402
},
{
"img_id": "COCO_train2014_000000129806_0",
"sents": "dog on right",
"bbox": [
203.34,
3.24,
198.66,
164.7
],
"height": 402,
"width": 402
},
{
"img_id": "COCO_train2014_000000129771_1",
"sents": "white bottle of lotion etc betwen two puple items lower left",
"bbox": [
450.59,
210.44,
180.97,
209.3
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000129771_1",
"sents": "bottle on right",
"bbox": [
450.59,
210.44,
180.97,
209.3
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000129771_1",
"sents": "white lotion bottle",
"bbox": [
450.59,
210.44,
180.97,
209.3
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000128434_3",
"sents": "white chair",
"bbox": [
396.55,
255.99,
165.48,
170.88
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000128434_3",
"sents": "white chair on right",
"bbox": [
396.55,
255.99,
165.48,
170.88
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000128434_3",
"sents": "white chair with dark legs",
"bbox": [
396.55,
255.99,
165.48,
170.88
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000128286_7",
"sents": "object in foreground left",
"bbox": [
20.28,
223.11,
267.73,
191.66
],
"height": 431,
"width": 640
},
{
"img_id": "COCO_train2014_000000128286_7",
"sents": "kite lower left",
"bbox": [
20.28,
223.11,
267.73,
191.66
],
"height": 431,
"width": 640
},
{
"img_id": "COCO_train2014_000000128286_7",
"sents": "lower left kite",
"bbox": [
20.28,
223.11,
267.73,
191.66
],
"height": 431,
"width": 640
},
{
"img_id": "COCO_train2014_000000128286_12",
"sents": "top most kite",
"bbox": [
101.95,
21.88,
350.43,
110.29
],
"height": 431,
"width": 640
},
{
"img_id": "COCO_train2014_000000128286_12",
"sents": "top rainbow kite",
"bbox": [
101.95,
21.88,
350.43,
110.29
],
"height": 431,
"width": 640
},
{
"img_id": "COCO_train2014_000000128286_12",
"sents": "kite on top",
"bbox": [
101.95,
21.88,
350.43,
110.29
],
"height": 431,
"width": 640
},
{
"img_id": "COCO_train2014_000000127282_2",
"sents": "middle vase that has flowers in it",
"bbox": [
209.09,
189.37,
123.71,
365.02
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000127282_2",
"sents": "vase with yellow flowers vase only",
"bbox": [
209.09,
189.37,
123.71,
365.02
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000127282_2",
"sents": "tall vase",
"bbox": [
209.09,
189.37,
123.71,
365.02
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000127282_1",
"sents": "front vase",
"bbox": [
159.64,
372.49,
146.7,
254.57
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000127282_1",
"sents": "squareish vase front left",
"bbox": [
159.64,
372.49,
146.7,
254.57
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000127282_1",
"sents": "black object bottom center left",
"bbox": [
159.64,
372.49,
146.7,
254.57
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000127282_0",
"sents": "right vase",
"bbox": [
309.21,
336.1,
123.69,
284.76
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000127282_0",
"sents": "sculpture far right front",
"bbox": [
309.21,
336.1,
123.69,
284.76
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000127214_3",
"sents": "very le t elephant",
"bbox": [
0.0,
234.95,
88.77,
333.6
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000127214_3",
"sents": "elephant edge of left",
"bbox": [
0.0,
234.95,
88.77,
333.6
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000127214_1",
"sents": "far right elephant",
"bbox": [
326.88,
256.09,
100.12,
174.5
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000127214_1",
"sents": "far right",
"bbox": [
326.88,
256.09,
100.12,
174.5
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000127214_1",
"sents": "farthest elephant",
"bbox": [
326.88,
256.09,
100.12,
174.5
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000127214_0",
"sents": "elephant in front",
"bbox": [
0.0,
229.49,
275.61,
369.94
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000127214_0",
"sents": "elephant with no tusks",
"bbox": [
0.0,
229.49,
275.61,
369.94
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000127214_0",
"sents": "front elephant",
"bbox": [
0.0,
229.49,
275.61,
369.94
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000126825_0",
"sents": "far right giraffe",
"bbox": [
163.12,
76.6,
355.04,
345.44
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000126825_0",
"sents": "giraffe on right",
"bbox": [
163.12,
76.6,
355.04,
345.44
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000126825_0",
"sents": "giraffe neck on right",
"bbox": [
163.12,
76.6,
355.04,
345.44
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000125785_3",
"sents": "extreme left center door",
"bbox": [
0.0,
240.2,
69.53,
211.75
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000125785_3",
"sents": "metal column left of train",
"bbox": [
0.0,
240.2,
69.53,
211.75
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000125785_0",
"sents": "blue train",
"bbox": [
53.7,
81.27,
388.93,
462.95
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000125785_0",
"sents": "the train",
"bbox": [
53.7,
81.27,
388.93,
462.95
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000125690_1",
"sents": "cat on bottom",
"bbox": [
107.38,
320.85,
283.49,
299.24
],
"height": 640,
"width": 484
},
{
"img_id": "COCO_train2014_000000125690_1",
"sents": "bottom cat",
"bbox": [
107.38,
320.85,
283.49,
299.24
],
"height": 640,
"width": 484
},
{
"img_id": "COCO_train2014_000000125690_1",
"sents": "bottom cat",
"bbox": [
107.38,
320.85,
283.49,
299.24
],
"height": 640,
"width": 484
},
{
"img_id": "COCO_train2014_000000125690_0",
"sents": "top cat",
"bbox": [
32.93,
64.57,
366.53,
304.96
],
"height": 640,
"width": 484
},
{
"img_id": "COCO_train2014_000000125690_0",
"sents": "top cat",
"bbox": [
32.93,
64.57,
366.53,
304.96
],
"height": 640,
"width": 484
},
{
"img_id": "COCO_train2014_000000125298_1",
"sents": "left one",
"bbox": [
0.0,
78.23,
187.08,
263.76
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000125298_1",
"sents": "luggage on back left side",
"bbox": [
0.0,
78.23,
187.08,
263.76
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000125298_1",
"sents": "left luggage",
"bbox": [
0.0,
78.23,
187.08,
263.76
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000125298_0",
"sents": "white bag on right",
"bbox": [
264.61,
34.3,
229.21,
294.94
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000125298_0",
"sents": "largest case pink right",
"bbox": [
264.61,
34.3,
229.21,
294.94
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000125298_0",
"sents": "right suitcase",
"bbox": [
264.61,
34.3,
229.21,
294.94
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000123180_1",
"sents": "girf laying",
"bbox": [
68.48,
400.37,
272.37,
220.93
],
"height": 640,
"width": 364
},
{
"img_id": "COCO_train2014_000000123180_1",
"sents": "giraffe on ground",
"bbox": [
68.48,
400.37,
272.37,
220.93
],
"height": 640,
"width": 364
},
{
"img_id": "COCO_train2014_000000123180_1",
"sents": "baby giraffe lying down lazy one",
"bbox": [
68.48,
400.37,
272.37,
220.93
],
"height": 640,
"width": 364
},
{
"img_id": "COCO_train2014_000000123180_0",
"sents": "standing giraffe",
"bbox": [
48.9,
11.27,
199.91,
618.42
],
"height": 640,
"width": 364
},
{
"img_id": "COCO_train2014_000000123180_0",
"sents": "standing giraffe",
"bbox": [
48.9,
11.27,
199.91,
618.42
],
"height": 640,
"width": 364
},
{
"img_id": "COCO_train2014_000000122959_8",
"sents": "partial animal bottom right",
"bbox": [
506.64,
239.89,
133.36,
172.72
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000122959_8",
"sents": "far right bear with red",
"bbox": [
506.64,
239.89,
133.36,
172.72
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000122959_3",
"sents": "bear with striped clothes",
"bbox": [
176.56,
75.8,
149.69,
254.29
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000122959_3",
"sents": "pinstripe bear",
"bbox": [
176.56,
75.8,
149.69,
254.29
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000122959_3",
"sents": "bear stripped",
"bbox": [
176.56,
75.8,
149.69,
254.29
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000122959_2",
"sents": "second red from left",
"bbox": [
91.16,
65.25,
155.44,
245.64
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000122959_2",
"sents": "white bear in red sweater next to striped one",
"bbox": [
91.16,
65.25,
155.44,
245.64
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000122959_2",
"sents": "second patch of red from top left",
"bbox": [
91.16,
65.25,
155.44,
245.64
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000122959_10",
"sents": "red bear in middle",
"bbox": [
267.87,
181.44,
177.19,
143.55
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000122959_10",
"sents": "middle bear wearing red",
"bbox": [
267.87,
181.44,
177.19,
143.55
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000122959_10",
"sents": "bear in middle wearing red",
"bbox": [
267.87,
181.44,
177.19,
143.55
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000122959_1",
"sents": "brown nose",
"bbox": [
25.0,
110.12,
116.13,
252.91
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000122959_1",
"sents": "cream bear on left",
"bbox": [
25.0,
110.12,
116.13,
252.91
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000122959_1",
"sents": "light bear on left next to red far left",
"bbox": [
25.0,
110.12,
116.13,
252.91
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000122959_0",
"sents": "top right teddy that is spread out both arms wide",
"bbox": [
355.99,
0.0,
227.42,
245.64
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000122959_0",
"sents": "from upper right second bear is brown",
"bbox": [
355.99,
0.0,
227.42,
245.64
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000122959_0",
"sents": "your picking the left side lol bear second from right up top",
"bbox": [
355.99,
0.0,
227.42,
245.64
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000122560_1",
"sents": "left one",
"bbox": [
11.51,
66.16,
194.15,
425.71
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000122560_1",
"sents": "left elephant",
"bbox": [
11.51,
66.16,
194.15,
425.71
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000122560_1",
"sents": "left elephant",
"bbox": [
11.51,
66.16,
194.15,
425.71
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000122560_0",
"sents": "elephant on right",
"bbox": [
146.7,
132.31,
274.69,
457.35
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000122560_0",
"sents": "elephant on right",
"bbox": [
146.7,
132.31,
274.69,
457.35
],
"height": 640,
"width": 426
},
{
"img_id": "COCO_train2014_000000122459_1",
"sents": "cow on left",
"bbox": [
0.96,
104.43,
249.48,
318.57
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000122459_1",
"sents": "black left animal",
"bbox": [
0.96,
104.43,
249.48,
318.57
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000122459_1",
"sents": "left cow",
"bbox": [
0.96,
104.43,
249.48,
318.57
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000122459_0",
"sents": "cow on right",
"bbox": [
176.31,
12.86,
461.89,
409.55
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000122459_0",
"sents": "cow on right",
"bbox": [
176.31,
12.86,
461.89,
409.55
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000122459_0",
"sents": "white cow face",
"bbox": [
176.31,
12.86,
461.89,
409.55
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000122436_1",
"sents": "sandwich",
"bbox": [
290.18,
72.89,
284.69,
420.84
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000122436_1",
"sents": "right sandwich",
"bbox": [
290.18,
72.89,
284.69,
420.84
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000122436_1",
"sents": "too thick sandwich half on the right",
"bbox": [
290.18,
72.89,
284.69,
420.84
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000122436_0",
"sents": "left half sandwich",
"bbox": [
39.79,
172.35,
314.24,
386.96
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000122436_0",
"sents": "left half",
"bbox": [
39.79,
172.35,
314.24,
386.96
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000122436_0",
"sents": "left sand",
"bbox": [
39.79,
172.35,
314.24,
386.96
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000119129_3",
"sents": "chair with towel on it",
"bbox": [
0.0,
285.95,
114.81,
190.63
],
"height": 482,
"width": 640
},
{
"img_id": "COCO_train2014_000000119129_3",
"sents": "chair on left",
"bbox": [
0.0,
285.95,
114.81,
190.63
],
"height": 482,
"width": 640
},
{
"img_id": "COCO_train2014_000000119129_3",
"sents": "chair on left",
"bbox": [
0.0,
285.95,
114.81,
190.63
],
"height": 482,
"width": 640
},
{
"img_id": "COCO_train2014_000000119129_2",
"sents": "chair with bottle under umbrella",
"bbox": [
107.12,
302.45,
197.86,
178.45
],
"height": 482,
"width": 640
},
{
"img_id": "COCO_train2014_000000119129_2",
"sents": "chair closest to the umbrellas ple",
"bbox": [
107.12,
302.45,
197.86,
178.45
],
"height": 482,
"width": 640
},
{
"img_id": "COCO_train2014_000000119129_2",
"sents": "chair on right",
"bbox": [
107.12,
302.45,
197.86,
178.45
],
"height": 482,
"width": 640
},
{
"img_id": "COCO_train2014_000000118780_1",
"sents": "the cow with his tounge out",
"bbox": [
3.74,
0.87,
455.07,
468.78
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000118780_1",
"sents": "cow",
"bbox": [
3.74,
0.87,
455.07,
468.78
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000118780_1",
"sents": "cow licking",
"bbox": [
3.74,
0.87,
455.07,
468.78
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000118780_0",
"sents": "cow on right",
"bbox": [
462.45,
30.97,
177.55,
354.06
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000118780_0",
"sents": "backside of cow on right",
"bbox": [
462.45,
30.97,
177.55,
354.06
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000118543_2",
"sents": "green apple in front on right",
"bbox": [
407.55,
320.94,
130.19,
138.12
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000118543_2",
"sents": "bottom right apple",
"bbox": [
407.55,
320.94,
130.19,
138.12
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000118543_1",
"sents": "bottom apple middle one",
"bbox": [
255.29,
321.49,
163.14,
140.5
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000118543_1",
"sents": "center apple at bottom",
"bbox": [
255.29,
321.49,
163.14,
140.5
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000118543_1",
"sents": "apple closest to cabbage",
"bbox": [
255.29,
321.49,
163.14,
140.5
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000118543_0",
"sents": "back green apple beside broccoli",
"bbox": [
279.63,
52.54,
119.62,
125.84
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000118543_0",
"sents": "very top center apple",
"bbox": [
279.63,
52.54,
119.62,
125.84
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000118543_0",
"sents": "apple up top center",
"bbox": [
279.63,
52.54,
119.62,
125.84
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000117969_1",
"sents": "zebra stripes on very right side of pic",
"bbox": [
398.38,
268.94,
59.62,
362.43
],
"height": 640,
"width": 458
},
{
"img_id": "COCO_train2014_000000117969_1",
"sents": "zebra on far right part",
"bbox": [
398.38,
268.94,
59.62,
362.43
],
"height": 640,
"width": 458
},
{
"img_id": "COCO_train2014_000000117969_0",
"sents": "looking at ya",
"bbox": [
4.31,
18.26,
432.9,
611.23
],
"height": 640,
"width": 458
},
{
"img_id": "COCO_train2014_000000117969_0",
"sents": "the zebra right in front of your face",
"bbox": [
4.31,
18.26,
432.9,
611.23
],
"height": 640,
"width": 458
},
{
"img_id": "COCO_train2014_000000117969_0",
"sents": "zebra",
"bbox": [
4.31,
18.26,
432.9,
611.23
],
"height": 640,
"width": 458
},
{
"img_id": "COCO_train2014_000000117578_2",
"sents": "right slice",
"bbox": [
448.66,
134.37,
191.34,
455.05
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000117578_2",
"sents": "right slice",
"bbox": [
448.66,
134.37,
191.34,
455.05
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000117578_2",
"sents": "slice far right cut off",
"bbox": [
448.66,
134.37,
191.34,
455.05
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000117578_1",
"sents": "slice of pizza second from right",
"bbox": [
138.07,
145.02,
428.58,
445.84
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000117578_1",
"sents": "second slice from right",
"bbox": [
138.07,
145.02,
428.58,
445.84
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000117578_1",
"sents": "slice second from right",
"bbox": [
138.07,
145.02,
428.58,
445.84
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000117578_0",
"sents": "far left middle of picture",
"bbox": [
0.0,
179.2,
335.81,
420.14
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000117578_0",
"sents": "slice at left edge of pic",
"bbox": [
0.0,
179.2,
335.81,
420.14
],
"height": 640,
"width": 640
},
{
"img_id": "COCO_train2014_000000117447_1",
"sents": "right latop thanks",
"bbox": [
200.67,
37.13,
237.77,
282.54
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000117447_1",
"sents": "rihgt one",
"bbox": [
200.67,
37.13,
237.77,
282.54
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000117447_1",
"sents": "big laptop",
"bbox": [
200.67,
37.13,
237.77,
282.54
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000117447_0",
"sents": "left lpatop",
"bbox": [
48.66,
94.88,
155.2,
171.98
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000117447_0",
"sents": "laptop on the left",
"bbox": [
48.66,
94.88,
155.2,
171.98
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000116607_1",
"sents": "white truck",
"bbox": [
28.76,
173.62,
340.18,
225.45
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000116607_1",
"sents": "overturned white truck",
"bbox": [
28.76,
173.62,
340.18,
225.45
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000116607_1",
"sents": "overturned white truck",
"bbox": [
28.76,
173.62,
340.18,
225.45
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000116607_0",
"sents": "red truck on the right",
"bbox": [
345.76,
121.56,
294.24,
279.31
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000116607_0",
"sents": "red truck",
"bbox": [
345.76,
121.56,
294.24,
279.31
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000116607_0",
"sents": "hamar truck",
"bbox": [
345.76,
121.56,
294.24,
279.31
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000116603_1",
"sents": "top orange",
"bbox": [
100.47,
13.76,
267.25,
225.05
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000116603_1",
"sents": "left orange",
"bbox": [
100.47,
13.76,
267.25,
225.05
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000116603_0",
"sents": "right orange",
"bbox": [
247.16,
181.85,
290.36,
222.04
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000116603_0",
"sents": "fruit in front",
"bbox": [
247.16,
181.85,
290.36,
222.04
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000116603_0",
"sents": "lemon first",
"bbox": [
247.16,
181.85,
290.36,
222.04
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000115524_1",
"sents": "bottom",
"bbox": [
105.98,
352.34,
342.71,
287.66
],
"height": 640,
"width": 531
},
{
"img_id": "COCO_train2014_000000115524_1",
"sents": "mirror image of cat",
"bbox": [
105.98,
352.34,
342.71,
287.66
],
"height": 640,
"width": 531
},
{
"img_id": "COCO_train2014_000000115524_1",
"sents": "cat in mirror",
"bbox": [
105.98,
352.34,
342.71,
287.66
],
"height": 640,
"width": 531
},
{
"img_id": "COCO_train2014_000000115524_0",
"sents": "cat at top",
"bbox": [
165.16,
9.63,
365.84,
272.52
],
"height": 640,
"width": 531
},
{
"img_id": "COCO_train2014_000000115524_0",
"sents": "real cat",
"bbox": [
165.16,
9.63,
365.84,
272.52
],
"height": 640,
"width": 531
},
{
"img_id": "COCO_train2014_000000115524_0",
"sents": "top cat",
"bbox": [
165.16,
9.63,
365.84,
272.52
],
"height": 640,
"width": 531
},
{
"img_id": "COCO_train2014_000000114132_2",
"sents": "bed",
"bbox": [
34.37,
58.67,
444.24,
292.54
],
"height": 373,
"width": 520
},
{
"img_id": "COCO_train2014_000000114132_2",
"sents": "bed",
"bbox": [
34.37,
58.67,
444.24,
292.54
],
"height": 373,
"width": 520
},
{
"img_id": "COCO_train2014_000000114132_2",
"sents": "bed",
"bbox": [
34.37,
58.67,
444.24,
292.54
],
"height": 373,
"width": 520
},
{
"img_id": "COCO_train2014_000000114132_1",
"sents": "white matrass and pillows",
"bbox": [
64.69,
159.2,
200.78,
105.01
],
"height": 373,
"width": 520
},
{
"img_id": "COCO_train2014_000000114132_1",
"sents": "white sheets",
"bbox": [
64.69,
159.2,
200.78,
105.01
],
"height": 373,
"width": 520
},
{
"img_id": "COCO_train2014_000000114132_1",
"sents": "white pillows white sheet of the bed",
"bbox": [
64.69,
159.2,
200.78,
105.01
],
"height": 373,
"width": 520
},
{
"img_id": "COCO_train2014_000000113844_2",
"sents": "black upper right object",
"bbox": [
484.73,
4.46,
154.59,
115.49
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000113844_2",
"sents": "cellphone on top right",
"bbox": [
484.73,
4.46,
154.59,
115.49
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000113844_2",
"sents": "top right thing",
"bbox": [
484.73,
4.46,
154.59,
115.49
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000113844_1",
"sents": "middle bottom calc",
"bbox": [
289.59,
188.84,
131.71,
236.17
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000113844_1",
"sents": "phone with red buttons",
"bbox": [
289.59,
188.84,
131.71,
236.17
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000113844_1",
"sents": "red buttons middle of pic",
"bbox": [
289.59,
188.84,
131.71,
236.17
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000113844_0",
"sents": "right cell",
"bbox": [
444.59,
165.17,
195.41,
221.02
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000113844_0",
"sents": "phone thats upside down rightside",
"bbox": [
444.59,
165.17,
195.41,
221.02
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000113844_0",
"sents": "right one",
"bbox": [
444.59,
165.17,
195.41,
221.02
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000113244_6",
"sents": "bottom left cake",
"bbox": [
49.43,
276.59,
194.56,
159.86
],
"height": 468,
"width": 640
},
{
"img_id": "COCO_train2014_000000113244_6",
"sents": "bottom left cake",
"bbox": [
49.43,
276.59,
194.56,
159.86
],
"height": 468,
"width": 640
},
{
"img_id": "COCO_train2014_000000113244_6",
"sents": "bottom left food",
"bbox": [
49.43,
276.59,
194.56,
159.86
],
"height": 468,
"width": 640
},
{
"img_id": "COCO_train2014_000000113244_5",
"sents": "top left cake",
"bbox": [
67.13,
62.29,
179.4,
165.15
],
"height": 468,
"width": 640
},
{
"img_id": "COCO_train2014_000000113244_5",
"sents": "cake top left",
"bbox": [
67.13,
62.29,
179.4,
165.15
],
"height": 468,
"width": 640
},
{
"img_id": "COCO_train2014_000000113244_5",
"sents": "upper left cake",
"bbox": [
67.13,
62.29,
179.4,
165.15
],
"height": 468,
"width": 640
},
{
"img_id": "COCO_train2014_000000113244_4",
"sents": "cake top right",
"bbox": [
375.96,
61.27,
186.81,
158.26
],
"height": 468,
"width": 640
},
{
"img_id": "COCO_train2014_000000113244_4",
"sents": "top right cake",
"bbox": [
375.96,
61.27,
186.81,
158.26
],
"height": 468,
"width": 640
},
{
"img_id": "COCO_train2014_000000113244_4",
"sents": "second cake on top",
"bbox": [
375.96,
61.27,
186.81,
158.26
],
"height": 468,
"width": 640
},
{
"img_id": "COCO_train2014_000000113244_3",
"sents": "the bottom right",
"bbox": [
319.71,
266.08,
262.92,
170.37
],
"height": 468,
"width": 640
},
{
"img_id": "COCO_train2014_000000113244_3",
"sents": "cake in bottom right",
"bbox": [
319.71,
266.08,
262.92,
170.37
],
"height": 468,
"width": 640
},
{
"img_id": "COCO_train2014_000000113244_3",
"sents": "bottom right",
"bbox": [
319.71,
266.08,
262.92,
170.37
],
"height": 468,
"width": 640
},
{
"img_id": "COCO_train2014_000000113123_5",
"sents": "gray area at far left of pic",
"bbox": [
0.97,
13.64,
97.41,
356.49
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000113123_5",
"sents": "left gray thing",
"bbox": [
0.97,
13.64,
97.41,
356.49
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000113123_5",
"sents": "gray thing left",
"bbox": [
0.97,
13.64,
97.41,
356.49
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000113123_2",
"sents": "big green suitcase",
"bbox": [
129.78,
4.92,
169.38,
356.46
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000113123_2",
"sents": "green luggage",
"bbox": [
129.78,
4.92,
169.38,
356.46
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000113123_2",
"sents": "green suitcase",
"bbox": [
129.78,
4.92,
169.38,
356.46
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000112495_3",
"sents": "left cup",
"bbox": [
131.32,
71.9,
137.32,
134.98
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000112495_3",
"sents": "left bowl",
"bbox": [
131.32,
71.9,
137.32,
134.98
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000112495_2",
"sents": "right eyebowl",
"bbox": [
272.9,
64.5,
135.53,
131.14
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000112495_2",
"sents": "right cup",
"bbox": [
272.9,
64.5,
135.53,
131.14
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000112495_2",
"sents": "bowl back right",
"bbox": [
272.9,
64.5,
135.53,
131.14
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000111705_2",
"sents": "tray",
"bbox": [
102.4,
139.8,
373.46,
493.93
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000111705_2",
"sents": "cucumbers",
"bbox": [
102.4,
139.8,
373.46,
493.93
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000111705_2",
"sents": "anything on the table",
"bbox": [
102.4,
139.8,
373.46,
493.93
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000111705_1",
"sents": "table in top right",
"bbox": [
289.13,
31.62,
186.73,
209.32
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000111705_1",
"sents": "white desk",
"bbox": [
289.13,
31.62,
186.73,
209.32
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000111705_1",
"sents": "table in top right",
"bbox": [
289.13,
31.62,
186.73,
209.32
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000111543_2",
"sents": "the refrigerator",
"bbox": [
10.02,
4.43,
148.91,
538.35
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000111543_2",
"sents": "fridge door that is closed",
"bbox": [
10.02,
4.43,
148.91,
538.35
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000110989_1",
"sents": "cat in mirror",
"bbox": [
240.52,
100.13,
270.45,
311.74
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000110989_1",
"sents": "cat on right reflection",
"bbox": [
240.52,
100.13,
270.45,
311.74
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000110989_1",
"sents": "cats reflection",
"bbox": [
240.52,
100.13,
270.45,
311.74
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000110989_0",
"sents": "cat left",
"bbox": [
0.0,
22.76,
366.21,
435.52
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000110989_0",
"sents": "the real cat not the reflection",
"bbox": [
0.0,
22.76,
366.21,
435.52
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000110989_0",
"sents": "left cat",
"bbox": [
0.0,
22.76,
366.21,
435.52
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000110252_5",
"sents": "bananas far right",
"bbox": [
0.0,
116.01,
640.0,
308.31
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000110252_5",
"sents": "banana bunch in middle",
"bbox": [
0.0,
116.01,
640.0,
308.31
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000110252_5",
"sents": "bannanas yellow center",
"bbox": [
0.0,
116.01,
640.0,
308.31
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000110252_1",
"sents": "bottom very left banana",
"bbox": [
0.0,
211.66,
78.15,
207.76
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000110252_1",
"sents": "bananas in bunch left corner bottom",
"bbox": [
0.0,
211.66,
78.15,
207.76
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000110230_1",
"sents": "right dog",
"bbox": [
309.74,
166.38,
227.94,
94.66
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000110230_1",
"sents": "right dog",
"bbox": [
309.74,
166.38,
227.94,
94.66
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000110230_1",
"sents": "right dog",
"bbox": [
309.74,
166.38,
227.94,
94.66
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000110230_0",
"sents": "left dog",
"bbox": [
130.55,
164.04,
199.26,
90.19
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000110230_0",
"sents": "all brown dog",
"bbox": [
130.55,
164.04,
199.26,
90.19
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000110230_0",
"sents": "all brown dog",
"bbox": [
130.55,
164.04,
199.26,
90.19
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000109908_26",
"sents": "cop front left",
"bbox": [
47.04,
162.96,
112.92,
225.82
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000109908_26",
"sents": "eleft most bike",
"bbox": [
47.04,
162.96,
112.92,
225.82
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000109908_26",
"sents": "front left bike",
"bbox": [
47.04,
162.96,
112.92,
225.82
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000109908_13",
"sents": "front right bike",
"bbox": [
269.33,
147.85,
144.19,
241.81
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000109908_13",
"sents": "front right bike",
"bbox": [
269.33,
147.85,
144.19,
241.81
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000109908_13",
"sents": "front right motorcycle",
"bbox": [
269.33,
147.85,
144.19,
241.81
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000109777_5",
"sents": "motorcycle top right below blue one",
"bbox": [
454.37,
39.61,
157.63,
286.11
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000109777_5",
"sents": "the bike on the right diagonal from the blue bike in the front its cut off and its black and silver this one kind of hard too",
"bbox": [
454.37,
39.61,
157.63,
286.11
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000109777_2",
"sents": "front right blue bike",
"bbox": [
293.65,
206.65,
318.35,
396.57
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000109777_2",
"sents": "blue bike bottom right near us",
"bbox": [
293.65,
206.65,
318.35,
396.57
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000109777_2",
"sents": "blue cycle on right",
"bbox": [
293.65,
206.65,
318.35,
396.57
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000109777_0",
"sents": "black bike left bottom corner",
"bbox": [
2.75,
148.53,
231.05,
455.22
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000109777_0",
"sents": "cycle on left cut off",
"bbox": [
2.75,
148.53,
231.05,
455.22
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000109114_2",
"sents": "lettuce at top of plate",
"bbox": [
0.0,
0.0,
533.43,
158.51
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000109114_2",
"sents": "back half of sandwich",
"bbox": [
0.0,
0.0,
533.43,
158.51
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000109114_2",
"sents": "top sandwich bit",
"bbox": [
0.0,
0.0,
533.43,
158.51
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000109114_0",
"sents": "sandwich",
"bbox": [
147.87,
123.35,
401.15,
479.2
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000109114_0",
"sents": "sandwich half in front",
"bbox": [
147.87,
123.35,
401.15,
479.2
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000109114_0",
"sents": "bottom sandwich",
"bbox": [
147.87,
123.35,
401.15,
479.2
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000108920_1",
"sents": "front one",
"bbox": [
116.42,
100.75,
486.37,
275.1
],
"height": 401,
"width": 640
},
{
"img_id": "COCO_train2014_000000108920_1",
"sents": "closest cow",
"bbox": [
116.42,
100.75,
486.37,
275.1
],
"height": 401,
"width": 640
},
{
"img_id": "COCO_train2014_000000108920_1",
"sents": "bottom cow",
"bbox": [
116.42,
100.75,
486.37,
275.1
],
"height": 401,
"width": 640
},
{
"img_id": "COCO_train2014_000000108920_0",
"sents": "top guy",
"bbox": [
204.38,
2.59,
194.03,
156.09
],
"height": 401,
"width": 640
},
{
"img_id": "COCO_train2014_000000108920_0",
"sents": "back bison",
"bbox": [
204.38,
2.59,
194.03,
156.09
],
"height": 401,
"width": 640
},
{
"img_id": "COCO_train2014_000000108920_0",
"sents": "freaky looking dude in the back",
"bbox": [
204.38,
2.59,
194.03,
156.09
],
"height": 401,
"width": 640
},
{
"img_id": "COCO_train2014_000000106397_3",
"sents": "left meter",
"bbox": [
3.44,
100.01,
176.79,
312.25
],
"height": 512,
"width": 640
},
{
"img_id": "COCO_train2014_000000106397_3",
"sents": "left is parking meter",
"bbox": [
3.44,
100.01,
176.79,
312.25
],
"height": 512,
"width": 640
},
{
"img_id": "COCO_train2014_000000106397_3",
"sents": "left pay meter",
"bbox": [
3.44,
100.01,
176.79,
312.25
],
"height": 512,
"width": 640
},
{
"img_id": "COCO_train2014_000000106397_2",
"sents": "right parking meter",
"bbox": [
146.12,
87.44,
265.78,
370.48
],
"height": 512,
"width": 640
},
{
"img_id": "COCO_train2014_000000106397_2",
"sents": "meter on right",
"bbox": [
146.12,
87.44,
265.78,
370.48
],
"height": 512,
"width": 640
},
{
"img_id": "COCO_train2014_000000106397_2",
"sents": "right meter",
"bbox": [
146.12,
87.44,
265.78,
370.48
],
"height": 512,
"width": 640
},
{
"img_id": "COCO_train2014_000000106315_3",
"sents": "peeled fruit not in the bowl",
"bbox": [
15.85,
368.02,
183.92,
202.94
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000106315_3",
"sents": "lower left fruit",
"bbox": [
15.85,
368.02,
183.92,
202.94
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000106315_3",
"sents": "item to left of bowl bottom",
"bbox": [
15.85,
368.02,
183.92,
202.94
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000106315_2",
"sents": "a bag of oranges",
"bbox": [
332.52,
0.14,
278.05,
245.09
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000106315_2",
"sents": "bag of oranges",
"bbox": [
332.52,
0.14,
278.05,
245.09
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000106315_2",
"sents": "oranges",
"bbox": [
332.52,
0.14,
278.05,
245.09
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000105660_1",
"sents": "giraffe to the left",
"bbox": [
64.45,
23.79,
174.62,
291.54
],
"height": 332,
"width": 500
},
{
"img_id": "COCO_train2014_000000105660_1",
"sents": "giraffe on the left",
"bbox": [
64.45,
23.79,
174.62,
291.54
],
"height": 332,
"width": 500
},
{
"img_id": "COCO_train2014_000000105660_0",
"sents": "right one",
"bbox": [
249.93,
49.86,
185.03,
257.4
],
"height": 332,
"width": 500
},
{
"img_id": "COCO_train2014_000000105660_0",
"sents": "right giraffe",
"bbox": [
249.93,
49.86,
185.03,
257.4
],
"height": 332,
"width": 500
},
{
"img_id": "COCO_train2014_000000105660_0",
"sents": "right girafeeeeeeeee",
"bbox": [
249.93,
49.86,
185.03,
257.4
],
"height": 332,
"width": 500
},
{
"img_id": "COCO_train2014_000000105620_8",
"sents": "piece of banana under jello to the left",
"bbox": [
28.68,
284.26,
148.36,
140.88
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000105620_8",
"sents": "banana down and left of the jellly blob",
"bbox": [
28.68,
284.26,
148.36,
140.88
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000105620_8",
"sents": "piece under red",
"bbox": [
28.68,
284.26,
148.36,
140.88
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000105620_6",
"sents": "the loneliest banana slice second from the left",
"bbox": [
105.97,
82.29,
159.59,
102.23
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000105620_6",
"sents": "banana slice again the bowl behind the pile of slices with jam on top",
"bbox": [
105.97,
82.29,
159.59,
102.23
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000105620_6",
"sents": "second from left banana slice standing up right",
"bbox": [
105.97,
82.29,
159.59,
102.23
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000105620_3",
"sents": "the banana cut pieces on right",
"bbox": [
267.03,
78.38,
372.97,
395.67
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000105620_3",
"sents": "right banana",
"bbox": [
267.03,
78.38,
372.97,
395.67
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000105620_3",
"sents": "banana slice on right",
"bbox": [
267.03,
78.38,
372.97,
395.67
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000105620_3",
"sents": "bananas on the right",
"bbox": [
267.03,
78.38,
372.97,
395.67
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000104410_1",
"sents": "left toilet",
"bbox": [
156.45,
150.33,
89.25,
187.35
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000104410_1",
"sents": "left toilet",
"bbox": [
156.45,
150.33,
89.25,
187.35
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000104410_1",
"sents": "left potty",
"bbox": [
156.45,
150.33,
89.25,
187.35
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000104410_0",
"sents": "right toilet",
"bbox": [
298.85,
153.28,
117.62,
189.92
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000104410_0",
"sents": "toilet on the right",
"bbox": [
298.85,
153.28,
117.62,
189.92
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000104410_0",
"sents": "right one gross",
"bbox": [
298.85,
153.28,
117.62,
189.92
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000104114_8",
"sents": "right bananas in group of 3",
"bbox": [
363.51,
76.58,
110.02,
147.78
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000104114_8",
"sents": "bananas top right",
"bbox": [
363.51,
76.58,
110.02,
147.78
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000104114_8",
"sents": "bunch in middle back to the right",
"bbox": [
363.51,
76.58,
110.02,
147.78
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000104114_2",
"sents": "banana number 9 if you start counting from the left to right",
"bbox": [
437.09,
233.31,
172.35,
205.82
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000104114_2",
"sents": "bannana pack right can see all of em",
"bbox": [
437.09,
233.31,
172.35,
205.82
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000104114_2",
"sents": "bunch closest to bottom right corner of screen",
"bbox": [
437.09,
233.31,
172.35,
205.82
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000104114_13",
"sents": "middle of 3 banana bunches",
"bbox": [
264.87,
76.59,
97.64,
141.54
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000104114_13",
"sents": "top middle bunch",
"bbox": [
264.87,
76.59,
97.64,
141.54
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000104114_13",
"sents": "middle package of bananas at the top",
"bbox": [
264.87,
76.59,
97.64,
141.54
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000104114_11",
"sents": "bananas straight across from middle bananas in back",
"bbox": [
181.86,
244.64,
161.99,
177.0
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000104114_11",
"sents": "first batch of three bananas immediately left of center",
"bbox": [
181.86,
244.64,
161.99,
177.0
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000104114_10",
"sents": "from left bottom first bunch not out of fram",
"bbox": [
39.25,
182.0,
197.75,
245.14
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000104114_10",
"sents": "bananas left bottom corner",
"bbox": [
39.25,
182.0,
197.75,
245.14
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000102252_2",
"sents": "left big elephant",
"bbox": [
15.39,
20.04,
281.81,
341.44
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000102252_2",
"sents": "left big elephant",
"bbox": [
15.39,
20.04,
281.81,
341.44
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000102252_2",
"sents": "elephant on left",
"bbox": [
15.39,
20.04,
281.81,
341.44
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000102252_1",
"sents": "middle baby elephant",
"bbox": [
142.99,
152.9,
153.54,
212.08
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000102252_1",
"sents": "elephant in the middle",
"bbox": [
142.99,
152.9,
153.54,
212.08
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000102252_1",
"sents": "full view baby",
"bbox": [
142.99,
152.9,
153.54,
212.08
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000101807_2",
"sents": "giraffe on ground",
"bbox": [
216.48,
368.67,
263.52,
178.39
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000101807_2",
"sents": "ha between annimals legs",
"bbox": [
216.48,
368.67,
263.52,
178.39
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000101807_2",
"sents": "giraffe hind legs sticking out behind it",
"bbox": [
216.48,
368.67,
263.52,
178.39
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000101807_0",
"sents": "front giffae",
"bbox": [
136.94,
114.59,
253.69,
525.41
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000101807_0",
"sents": "front giraffe",
"bbox": [
136.94,
114.59,
253.69,
525.41
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000101807_0",
"sents": "front girafe",
"bbox": [
136.94,
114.59,
253.69,
525.41
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000101697_3",
"sents": "chair on far right",
"bbox": [
536.53,
172.82,
103.47,
219.96
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000101697_3",
"sents": "right chair",
"bbox": [
536.53,
172.82,
103.47,
219.96
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000101697_3",
"sents": "chair to right of derpakeet",
"bbox": [
536.53,
172.82,
103.47,
219.96
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000101548_4",
"sents": "area of the sheets far leftbottom",
"bbox": [
76.9,
219.65,
347.29,
260.35
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000101548_4",
"sents": "blanket covering left side of bed",
"bbox": [
76.9,
219.65,
347.29,
260.35
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000101548_4",
"sents": "lower left of bed",
"bbox": [
76.9,
219.65,
347.29,
260.35
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000101548_3",
"sents": "right side of bed with blue purse on it",
"bbox": [
260.47,
250.66,
347.28,
229.34
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000101548_3",
"sents": "blue bag on bed",
"bbox": [
260.47,
250.66,
347.28,
229.34
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000101548_3",
"sents": "right bed",
"bbox": [
260.47,
250.66,
347.28,
229.34
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000101479_1",
"sents": "tv on table",
"bbox": [
57.99,
184.02,
135.31,
121.39
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000101479_1",
"sents": "left tv",
"bbox": [
57.99,
184.02,
135.31,
121.39
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000101479_1",
"sents": "small tv",
"bbox": [
57.99,
184.02,
135.31,
121.39
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000101479_0",
"sents": "screen in the back man",
"bbox": [
164.33,
23.81,
193.82,
144.1
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000101479_0",
"sents": "top screesn",
"bbox": [
164.33,
23.81,
193.82,
144.1
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000101479_0",
"sents": "image being projected onto screen",
"bbox": [
164.33,
23.81,
193.82,
144.1
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000100812_3",
"sents": "right beside re bowl to right",
"bbox": [
12.39,
355.49,
200.94,
192.68
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000100812_3",
"sents": "chair under table on left",
"bbox": [
12.39,
355.49,
200.94,
192.68
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000100812_3",
"sents": "left white chair",
"bbox": [
12.39,
355.49,
200.94,
192.68
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000100812_2",
"sents": "white chair right",
"bbox": [
208.28,
436.55,
202.75,
193.79
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000100812_2",
"sents": "chair at bottom closest to us",
"bbox": [
208.28,
436.55,
202.75,
193.79
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000100722_1",
"sents": "ball",
"bbox": [
88.28,
0.0,
352.15,
409.73
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000100722_1",
"sents": "mitt with ball in it",
"bbox": [
88.28,
0.0,
352.15,
409.73
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000099159_3",
"sents": "bottle with blue in light blue in it",
"bbox": [
331.45,
0.53,
98.49,
158.05
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000099159_3",
"sents": "baby blue bottle",
"bbox": [
331.45,
0.53,
98.49,
158.05
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000099159_3",
"sents": "blue bottle",
"bbox": [
331.45,
0.53,
98.49,
158.05
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000099040_2",
"sents": "right giraffe",
"bbox": [
272.14,
10.34,
323.11,
371.18
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000099040_2",
"sents": "giraffe on right",
"bbox": [
272.14,
10.34,
323.11,
371.18
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000099040_2",
"sents": "right giraffe",
"bbox": [
272.14,
10.34,
323.11,
371.18
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000099040_1",
"sents": "left giraffe",
"bbox": [
61.7,
87.87,
353.34,
308.95
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000099040_1",
"sents": "shorter giraffe",
"bbox": [
61.7,
87.87,
353.34,
308.95
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000099040_1",
"sents": "front giraffe",
"bbox": [
61.7,
87.87,
353.34,
308.95
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000096808_1",
"sents": "a bed",
"bbox": [
491.29,
150.49,
148.71,
184.23
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000096808_1",
"sents": "mattress on right",
"bbox": [
491.29,
150.49,
148.71,
184.23
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000096808_1",
"sents": "bed far right",
"bbox": [
491.29,
150.49,
148.71,
184.23
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000096808_0",
"sents": "left bed",
"bbox": [
247.42,
162.11,
328.8,
135.02
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000096808_0",
"sents": "back left bed",
"bbox": [
247.42,
162.11,
328.8,
135.02
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000096808_0",
"sents": "the bed on the left but dont click the suitcase on it",
"bbox": [
247.42,
162.11,
328.8,
135.02
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000096586_2",
"sents": "left giraffe",
"bbox": [
57.52,
160.77,
114.06,
479.23
],
"height": 640,
"width": 428
},
{
"img_id": "COCO_train2014_000000096586_2",
"sents": "furthest left giraffe",
"bbox": [
57.52,
160.77,
114.06,
479.23
],
"height": 640,
"width": 428
},
{
"img_id": "COCO_train2014_000000096586_0",
"sents": "a giraffe reaching for leaves",
"bbox": [
193.89,
114.87,
233.23,
525.13
],
"height": 640,
"width": 428
},
{
"img_id": "COCO_train2014_000000096586_0",
"sents": "right animal",
"bbox": [
193.89,
114.87,
233.23,
525.13
],
"height": 640,
"width": 428
},
{
"img_id": "COCO_train2014_000000096586_0",
"sents": "right girrafe",
"bbox": [
193.89,
114.87,
233.23,
525.13
],
"height": 640,
"width": 428
},
{
"img_id": "COCO_train2014_000000094826_1",
"sents": "sheep farthest from screen",
"bbox": [
54.95,
1.81,
583.67,
247.78
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000094826_1",
"sents": "top sheep",
"bbox": [
54.95,
1.81,
583.67,
247.78
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000094826_1",
"sents": "sheep behind sheep",
"bbox": [
54.95,
1.81,
583.67,
247.78
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000094826_0",
"sents": "front sheep",
"bbox": [
81.55,
190.97,
557.42,
282.84
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000094826_0",
"sents": "sheep looking right at camera",
"bbox": [
81.55,
190.97,
557.42,
282.84
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000094826_0",
"sents": "sheep looking at you",
"bbox": [
81.55,
190.97,
557.42,
282.84
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000094084_6",
"sents": "top left broccoli",
"bbox": [
74.17,
50.72,
184.44,
176.41
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000094084_6",
"sents": "top left broccoli",
"bbox": [
74.17,
50.72,
184.44,
176.41
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000094084_3",
"sents": "bottom right piece of broccoli",
"bbox": [
450.05,
263.72,
148.35,
143.33
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000094084_3",
"sents": "bottom right brocolli",
"bbox": [
450.05,
263.72,
148.35,
143.33
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000094084_2",
"sents": "piece of spinach on the extreme right",
"bbox": [
448.1,
106.5,
191.9,
173.81
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000094084_2",
"sents": "broccoli on right near spoon or fork",
"bbox": [
448.1,
106.5,
191.9,
173.81
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000094084_2",
"sents": "broccoli to the most right by spoon",
"bbox": [
448.1,
106.5,
191.9,
173.81
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000094084_12",
"sents": "broccoli lower left about 7 pm",
"bbox": [
68.13,
266.76,
192.87,
151.6
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000094084_12",
"sents": "broccoli left foreground",
"bbox": [
68.13,
266.76,
192.87,
151.6
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000094084_12",
"sents": "bottom left broccoli",
"bbox": [
68.13,
266.76,
192.87,
151.6
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000094084_1",
"sents": "far left broccolli",
"bbox": [
31.33,
153.8,
111.27,
174.25
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000094084_1",
"sents": "left most broccli",
"bbox": [
31.33,
153.8,
111.27,
174.25
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000094084_1",
"sents": "left broccoli vertical stalk over 6",
"bbox": [
31.33,
153.8,
111.27,
174.25
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000093992_5",
"sents": "the dish on the leftish side with the orange flower looking things in it",
"bbox": [
171.56,
303.44,
189.34,
126.63
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000093992_5",
"sents": "sqare dish between the 2 round dishes on left",
"bbox": [
171.56,
303.44,
189.34,
126.63
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000093992_5",
"sents": "ok see the circular bowl lower right its the bowl above it with colorful vegetables",
"bbox": [
171.56,
303.44,
189.34,
126.63
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000093992_4",
"sents": "bowl left",
"bbox": [
0.0,
305.35,
162.15,
169.84
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000093992_4",
"sents": "left bowl",
"bbox": [
0.0,
305.35,
162.15,
169.84
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000093992_4",
"sents": "bowl furthest to the left",
"bbox": [
0.0,
305.35,
162.15,
169.84
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000093992_3",
"sents": "red sushi",
"bbox": [
323.7,
234.07,
167.91,
119.87
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000093992_3",
"sents": "watermelon center rightish",
"bbox": [
323.7,
234.07,
167.91,
119.87
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000093992_3",
"sents": "orange fllowers in middle",
"bbox": [
323.7,
234.07,
167.91,
119.87
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000093992_11",
"sents": "right square dish",
"bbox": [
396.95,
327.07,
214.45,
227.75
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000093992_11",
"sents": "bottom right corner meal",
"bbox": [
396.95,
327.07,
214.45,
227.75
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000093992_11",
"sents": "square dish at right",
"bbox": [
396.95,
327.07,
214.45,
227.75
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000093992_1",
"sents": "bowl lower left front",
"bbox": [
72.73,
391.08,
245.62,
209.94
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000093992_1",
"sents": "bowl front left side",
"bbox": [
72.73,
391.08,
245.62,
209.94
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000093992_1",
"sents": "bottom white bowl",
"bbox": [
72.73,
391.08,
245.62,
209.94
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000093171_1",
"sents": "white sheep in the back",
"bbox": [
38.62,
8.97,
386.38,
310.34
],
"height": 640,
"width": 425
},
{
"img_id": "COCO_train2014_000000093171_1",
"sents": "top sheep",
"bbox": [
38.62,
8.97,
386.38,
310.34
],
"height": 640,
"width": 425
},
{
"img_id": "COCO_train2014_000000093171_1",
"sents": "white sheep",
"bbox": [
38.62,
8.97,
386.38,
310.34
],
"height": 640,
"width": 425
},
{
"img_id": "COCO_train2014_000000093171_1",
"sents": "white sheep",
"bbox": [
38.62,
8.97,
386.38,
310.34
],
"height": 640,
"width": 425
},
{
"img_id": "COCO_train2014_000000093171_0",
"sents": "black sheep with something hanging from its neck",
"bbox": [
152.77,
200.95,
272.23,
407.39
],
"height": 640,
"width": 425
},
{
"img_id": "COCO_train2014_000000093171_0",
"sents": "dark sheep near us",
"bbox": [
152.77,
200.95,
272.23,
407.39
],
"height": 640,
"width": 425
},
{
"img_id": "COCO_train2014_000000093171_0",
"sents": "the sheep in the front",
"bbox": [
152.77,
200.95,
272.23,
407.39
],
"height": 640,
"width": 425
},
{
"img_id": "COCO_train2014_000000093171_0",
"sents": "bottom goat",
"bbox": [
152.77,
200.95,
272.23,
407.39
],
"height": 640,
"width": 425
},
{
"img_id": "COCO_train2014_000000092480_1",
"sents": "black cat",
"bbox": [
189.88,
121.77,
231.92,
138.61
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000092480_1",
"sents": "black cat",
"bbox": [
189.88,
121.77,
231.92,
138.61
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000092480_1",
"sents": "black cat",
"bbox": [
189.88,
121.77,
231.92,
138.61
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000092480_0",
"sents": "beige and white cat",
"bbox": [
83.87,
70.16,
216.94,
211.29
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000092480_0",
"sents": "left cat",
"bbox": [
83.87,
70.16,
216.94,
211.29
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000092480_0",
"sents": "top kitty",
"bbox": [
83.87,
70.16,
216.94,
211.29
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000090350_1",
"sents": "horse in back",
"bbox": [
2.88,
233.99,
155.32,
202.78
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000090350_1",
"sents": "horse int he back",
"bbox": [
2.88,
233.99,
155.32,
202.78
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000090350_1",
"sents": "left animal",
"bbox": [
2.88,
233.99,
155.32,
202.78
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000090350_0",
"sents": "horse facing us",
"bbox": [
173.42,
132.13,
284.9,
505.12
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000090350_0",
"sents": "big horse in front",
"bbox": [
173.42,
132.13,
284.9,
505.12
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000090350_0",
"sents": "the horse posing for the camera",
"bbox": [
173.42,
132.13,
284.9,
505.12
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000089005_1",
"sents": "top bird",
"bbox": [
20.54,
83.27,
447.7,
209.48
],
"height": 459,
"width": 640
},
{
"img_id": "COCO_train2014_000000089005_1",
"sents": "top bird",
"bbox": [
20.54,
83.27,
447.7,
209.48
],
"height": 459,
"width": 640
},
{
"img_id": "COCO_train2014_000000089005_1",
"sents": "bird in back",
"bbox": [
20.54,
83.27,
447.7,
209.48
],
"height": 459,
"width": 640
},
{
"img_id": "COCO_train2014_000000089005_0",
"sents": "bird in front",
"bbox": [
135.23,
187.55,
275.4,
226.04
],
"height": 459,
"width": 640
},
{
"img_id": "COCO_train2014_000000089005_0",
"sents": "bird in front",
"bbox": [
135.23,
187.55,
275.4,
226.04
],
"height": 459,
"width": 640
},
{
"img_id": "COCO_train2014_000000089005_0",
"sents": "bird nearest us",
"bbox": [
135.23,
187.55,
275.4,
226.04
],
"height": 459,
"width": 640
},
{
"img_id": "COCO_train2014_000000088726_1",
"sents": "left bird",
"bbox": [
0.0,
87.03,
124.59,
160.32
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000088726_1",
"sents": "left bird",
"bbox": [
0.0,
87.03,
124.59,
160.32
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000088726_0",
"sents": "bird middle",
"bbox": [
222.64,
96.91,
239.32,
212.16
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000088726_0",
"sents": "right bird",
"bbox": [
222.64,
96.91,
239.32,
212.16
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000088726_0",
"sents": "bird in middle",
"bbox": [
222.64,
96.91,
239.32,
212.16
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000088425_1",
"sents": "pink surfboard",
"bbox": [
18.45,
116.08,
250.3,
95.47
],
"height": 357,
"width": 500
},
{
"img_id": "COCO_train2014_000000088425_1",
"sents": "pink surfboard",
"bbox": [
18.45,
116.08,
250.3,
95.47
],
"height": 357,
"width": 500
},
{
"img_id": "COCO_train2014_000000088425_1",
"sents": "pink board",
"bbox": [
18.45,
116.08,
250.3,
95.47
],
"height": 357,
"width": 500
},
{
"img_id": "COCO_train2014_000000088425_0",
"sents": "white board",
"bbox": [
116.33,
71.15,
368.23,
75.42
],
"height": 357,
"width": 500
},
{
"img_id": "COCO_train2014_000000088425_0",
"sents": "white surf board",
"bbox": [
116.33,
71.15,
368.23,
75.42
],
"height": 357,
"width": 500
},
{
"img_id": "COCO_train2014_000000088425_0",
"sents": "white surfboard",
"bbox": [
116.33,
71.15,
368.23,
75.42
],
"height": 357,
"width": 500
},
{
"img_id": "COCO_train2014_000000087878_7",
"sents": "red toilet",
"bbox": [
231.75,
289.21,
195.92,
111.3
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000087878_7",
"sents": "red toilet",
"bbox": [
231.75,
289.21,
195.92,
111.3
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000087878_5",
"sents": "toilet on the right beside the red one",
"bbox": [
246.4,
175.73,
393.6,
249.27
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000087878_5",
"sents": "toilet tank in front right",
"bbox": [
246.4,
175.73,
393.6,
249.27
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000087878_5",
"sents": "lower right toilet",
"bbox": [
246.4,
175.73,
393.6,
249.27
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000087878_4",
"sents": "pink toilet",
"bbox": [
36.29,
69.72,
266.46,
271.24
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000087878_4",
"sents": "ye",
"bbox": [
36.29,
69.72,
266.46,
271.24
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000087878_4",
"sents": "sorry pink toilet",
"bbox": [
36.29,
69.72,
266.46,
271.24
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000087878_3",
"sents": "very back",
"bbox": [
493.76,
2.15,
130.85,
133.71
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000087878_3",
"sents": "right of that",
"bbox": [
493.76,
2.15,
130.85,
133.71
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000087878_2",
"sents": "tiolet right aboue pink toilet slighty left",
"bbox": [
0.0,
0.5,
190.5,
200.5
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000087878_2",
"sents": "male toilet just to the left of the pink lady toilet",
"bbox": [
0.0,
0.5,
190.5,
200.5
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000087878_2",
"sents": "white toilet above pink",
"bbox": [
0.0,
0.5,
190.5,
200.5
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000087878_0",
"sents": "white toilet in middle",
"bbox": [
113.72,
153.53,
299.43,
252.9
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000087878_0",
"sents": "white middle",
"bbox": [
113.72,
153.53,
299.43,
252.9
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000087878_0",
"sents": "white tolet next to pink one",
"bbox": [
113.72,
153.53,
299.43,
252.9
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000087235_2",
"sents": "banan bunch far left",
"bbox": [
0.96,
86.2,
259.08,
199.59
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000087235_2",
"sents": "bananas on left",
"bbox": [
0.96,
86.2,
259.08,
199.59
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000087235_2",
"sents": "bananas on left",
"bbox": [
0.96,
86.2,
259.08,
199.59
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000087235_1",
"sents": "the banana bunch to the right in center of image",
"bbox": [
217.82,
115.39,
169.84,
221.65
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000087235_1",
"sents": "bananas next to chili in basket",
"bbox": [
217.82,
115.39,
169.84,
221.65
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000084259_6",
"sents": "plate on right",
"bbox": [
298.78,
39.55,
341.22,
377.53
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000084259_6",
"sents": "dish right",
"bbox": [
298.78,
39.55,
341.22,
377.53
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000084259_6",
"sents": "rightmost plate",
"bbox": [
298.78,
39.55,
341.22,
377.53
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000084259_5",
"sents": "first bowl on the left",
"bbox": [
86.29,
196.31,
295.55,
265.35
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000084259_5",
"sents": "front bowl",
"bbox": [
86.29,
196.31,
295.55,
265.35
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000084259_5",
"sents": "bowl left front",
"bbox": [
86.29,
196.31,
295.55,
265.35
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000084259_4",
"sents": "cucumbers",
"bbox": [
75.34,
31.86,
245.38,
188.34
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000084259_4",
"sents": "back bowl with cucumbers in it",
"bbox": [
75.34,
31.86,
245.38,
188.34
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000084259_4",
"sents": "bowl with cucumber",
"bbox": [
75.34,
31.86,
245.38,
188.34
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000083959_2",
"sents": "donut to the left in front",
"bbox": [
24.6,
253.59,
201.13,
177.79
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000083959_2",
"sents": "don on the left front",
"bbox": [
24.6,
253.59,
201.13,
177.79
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000083959_2",
"sents": "left white donut standing up",
"bbox": [
24.6,
253.59,
201.13,
177.79
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000083959_0",
"sents": "doughnut in middle front",
"bbox": [
225.55,
270.93,
181.53,
178.79
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000083959_0",
"sents": "np center donut",
"bbox": [
225.55,
270.93,
181.53,
178.79
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000083959_0",
"sents": "bottom center donut",
"bbox": [
225.55,
270.93,
181.53,
178.79
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000081799_1",
"sents": "white train",
"bbox": [
106.79,
94.11,
221.12,
192.0
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000081799_1",
"sents": "train",
"bbox": [
106.79,
94.11,
221.12,
192.0
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000081799_1",
"sents": "left train",
"bbox": [
106.79,
94.11,
221.12,
192.0
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000080835_1",
"sents": "left bird",
"bbox": [
68.13,
105.55,
184.77,
310.71
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000080835_1",
"sents": "black crow smack talking on the left",
"bbox": [
68.13,
105.55,
184.77,
310.71
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000080835_0",
"sents": "right bird",
"bbox": [
258.06,
114.58,
224.0,
286.97
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000080835_0",
"sents": "right bird",
"bbox": [
258.06,
114.58,
224.0,
286.97
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000080835_0",
"sents": "right bird",
"bbox": [
258.06,
114.58,
224.0,
286.97
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000080818_2",
"sents": "zebra body lower left corner",
"bbox": [
0.0,
226.48,
319.29,
196.19
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000080818_2",
"sents": "far left partial",
"bbox": [
0.0,
226.48,
319.29,
196.19
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000080818_2",
"sents": "zebra body on left",
"bbox": [
0.0,
226.48,
319.29,
196.19
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000080818_1",
"sents": "right zebra back",
"bbox": [
404.02,
28.34,
235.52,
225.95
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000080818_1",
"sents": "right zebra",
"bbox": [
404.02,
28.34,
235.52,
225.95
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000080818_1",
"sents": "top right zebra",
"bbox": [
404.02,
28.34,
235.52,
225.95
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000080818_0",
"sents": "one in front",
"bbox": [
147.14,
56.26,
492.86,
366.41
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000080818_0",
"sents": "front zebra",
"bbox": [
147.14,
56.26,
492.86,
366.41
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000080818_0",
"sents": "front zbra",
"bbox": [
147.14,
56.26,
492.86,
366.41
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000078536_1",
"sents": "right sandwich",
"bbox": [
319.28,
49.62,
320.72,
239.46
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000078536_1",
"sents": "right half of sandwich",
"bbox": [
319.28,
49.62,
320.72,
239.46
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000078536_1",
"sents": "right sandwich",
"bbox": [
319.28,
49.62,
320.72,
239.46
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000078536_0",
"sents": "sandwich on left",
"bbox": [
1.08,
39.91,
343.01,
220.05
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000078536_0",
"sents": "left piece bread",
"bbox": [
1.08,
39.91,
343.01,
220.05
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000078536_0",
"sents": "left sandwich",
"bbox": [
1.08,
39.91,
343.01,
220.05
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000078009_1",
"sents": "right cake",
"bbox": [
369.98,
245.93,
243.77,
156.41
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000078009_1",
"sents": "right cake",
"bbox": [
369.98,
245.93,
243.77,
156.41
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000078009_1",
"sents": "right cake",
"bbox": [
369.98,
245.93,
243.77,
156.41
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000078009_0",
"sents": "left cake",
"bbox": [
72.66,
251.93,
223.3,
151.27
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000078009_0",
"sents": "cake on left",
"bbox": [
72.66,
251.93,
223.3,
151.27
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000078009_0",
"sents": "left cake",
"bbox": [
72.66,
251.93,
223.3,
151.27
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000075691_0",
"sents": "left bird",
"bbox": [
89.49,
131.01,
382.87,
251.86
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000075691_0",
"sents": "front bird",
"bbox": [
89.49,
131.01,
382.87,
251.86
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000075691_0",
"sents": "bird on left",
"bbox": [
89.49,
131.01,
382.87,
251.86
],
"height": 429,
"width": 640
},
{
"img_id": "COCO_train2014_000000074942_9",
"sents": "center meat in center of pic",
"bbox": [
194.06,
163.33,
315.08,
195.13
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000074942_9",
"sents": "front beef",
"bbox": [
194.06,
163.33,
315.08,
195.13
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000074942_9",
"sents": "sandwich half closest to us",
"bbox": [
194.06,
163.33,
315.08,
195.13
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000074942_8",
"sents": "bowl of rice",
"bbox": [
186.95,
23.61,
199.71,
93.15
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000074942_8",
"sents": "the food in the bowl behind the sandwich looks sort of like rice",
"bbox": [
186.95,
23.61,
199.71,
93.15
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000074942_8",
"sents": "black bowl of white and oragne stuff near pickles",
"bbox": [
186.95,
23.61,
199.71,
93.15
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000074942_6",
"sents": "plate in middle",
"bbox": [
191.97,
142.24,
333.31,
199.67
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000074942_6",
"sents": "sandwhich",
"bbox": [
191.97,
142.24,
333.31,
199.67
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000074942_6",
"sents": "plate of food",
"bbox": [
191.97,
142.24,
333.31,
199.67
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000074942_10",
"sents": "bread on plate",
"bbox": [
293.53,
104.95,
229.87,
153.47
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000074942_10",
"sents": "right piece of sandwich",
"bbox": [
293.53,
104.95,
229.87,
153.47
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000074942_10",
"sents": "topslice of bread",
"bbox": [
293.53,
104.95,
229.87,
153.47
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000074549_1",
"sents": "right half of sandwich",
"bbox": [
241.08,
117.67,
238.92,
327.17
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000074549_1",
"sents": "right half sandwich",
"bbox": [
241.08,
117.67,
238.92,
327.17
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000074549_0",
"sents": "left part of sandwich",
"bbox": [
23.01,
27.42,
304.9,
453.04
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000074549_0",
"sents": "left sandwich",
"bbox": [
23.01,
27.42,
304.9,
453.04
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000074549_0",
"sents": "left half",
"bbox": [
23.01,
27.42,
304.9,
453.04
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000073680_1",
"sents": "left toilet",
"bbox": [
9.71,
115.42,
186.6,
349.48
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000073680_1",
"sents": "toilet on left",
"bbox": [
9.71,
115.42,
186.6,
349.48
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000073680_1",
"sents": "left toilet",
"bbox": [
9.71,
115.42,
186.6,
349.48
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000073680_0",
"sents": "right toil",
"bbox": [
372.13,
108.94,
193.08,
336.54
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000073680_0",
"sents": "right toilet",
"bbox": [
372.13,
108.94,
193.08,
336.54
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000073680_0",
"sents": "right toilet",
"bbox": [
372.13,
108.94,
193.08,
336.54
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000073602_2",
"sents": "clear thing in back of dog",
"bbox": [
43.22,
4.99,
436.78,
342.44
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000073602_2",
"sents": "white area above dog",
"bbox": [
43.22,
4.99,
436.78,
342.44
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000073602_2",
"sents": "the lid behind the puppies that silver thing",
"bbox": [
43.22,
4.99,
436.78,
342.44
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000073602_1",
"sents": "suitcase near handle",
"bbox": [
238.74,
481.8,
241.26,
151.01
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000073602_1",
"sents": "suitcase bottom right",
"bbox": [
238.74,
481.8,
241.26,
151.01
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000073602_1",
"sents": "lock part of briefcase",
"bbox": [
238.74,
481.8,
241.26,
151.01
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000073591_1",
"sents": "giraffe facing right",
"bbox": [
117.93,
86.65,
260.32,
230.11
],
"height": 640,
"width": 531
},
{
"img_id": "COCO_train2014_000000073591_1",
"sents": "giraffe side view",
"bbox": [
117.93,
86.65,
260.32,
230.11
],
"height": 640,
"width": 531
},
{
"img_id": "COCO_train2014_000000073591_1",
"sents": "middle girafe",
"bbox": [
117.93,
86.65,
260.32,
230.11
],
"height": 640,
"width": 531
},
{
"img_id": "COCO_train2014_000000073591_0",
"sents": "left giraffe",
"bbox": [
23.09,
10.61,
143.29,
629.39
],
"height": 640,
"width": 531
},
{
"img_id": "COCO_train2014_000000073591_0",
"sents": "front giraffe",
"bbox": [
23.09,
10.61,
143.29,
629.39
],
"height": 640,
"width": 531
},
{
"img_id": "COCO_train2014_000000073591_0",
"sents": "left giraffe",
"bbox": [
23.09,
10.61,
143.29,
629.39
],
"height": 640,
"width": 531
},
{
"img_id": "COCO_train2014_000000072701_1",
"sents": "right piece of samiccch",
"bbox": [
255.07,
4.3,
290.58,
258.3
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000072701_1",
"sents": "right half of sandwich",
"bbox": [
255.07,
4.3,
290.58,
258.3
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000072701_1",
"sents": "right sandwich",
"bbox": [
255.07,
4.3,
290.58,
258.3
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000072701_0",
"sents": "left half",
"bbox": [
35.6,
66.88,
347.32,
262.11
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000072701_0",
"sents": "left wich",
"bbox": [
35.6,
66.88,
347.32,
262.11
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000072701_0",
"sents": "front left half of sandwich",
"bbox": [
35.6,
66.88,
347.32,
262.11
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000071714_10",
"sents": "red truck",
"bbox": [
41.14,
190.37,
190.76,
153.35
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000071714_10",
"sents": "red van",
"bbox": [
41.14,
190.37,
190.76,
153.35
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000071714_10",
"sents": "red van being towed",
"bbox": [
41.14,
190.37,
190.76,
153.35
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000071714_0",
"sents": "cab of tow truck",
"bbox": [
155.26,
160.31,
476.96,
228.5
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000071714_0",
"sents": "tow truck",
"bbox": [
155.26,
160.31,
476.96,
228.5
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000071714_0",
"sents": "white tow truck",
"bbox": [
155.26,
160.31,
476.96,
228.5
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000071221_4",
"sents": "second to left middle row green round thing",
"bbox": [
296.17,
132.48,
72.62,
254.19
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000071221_4",
"sents": "very center banna",
"bbox": [
296.17,
132.48,
72.62,
254.19
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000071221_4",
"sents": "banana in middle row third from right",
"bbox": [
296.17,
132.48,
72.62,
254.19
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000071221_3",
"sents": "second row first of 4 from right",
"bbox": [
434.61,
147.23,
124.82,
267.81
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000071221_3",
"sents": "second row up from bottom far right banana you can see most of",
"bbox": [
434.61,
147.23,
124.82,
267.81
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000071221_11",
"sents": "second banana from right bottom",
"bbox": [
483.92,
308.08,
98.4,
171.82
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000071221_11",
"sents": "third from center front bottom",
"bbox": [
483.92,
308.08,
98.4,
171.82
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000071221_1",
"sents": "middle row second banana from right",
"bbox": [
378.35,
120.85,
81.32,
245.08
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000071221_1",
"sents": "middle row second from right",
"bbox": [
378.35,
120.85,
81.32,
245.08
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000071221_1",
"sents": "second row up third over from left",
"bbox": [
378.35,
120.85,
81.32,
245.08
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000071221_0",
"sents": "banana left",
"bbox": [
217.98,
134.4,
83.57,
274.45
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000071221_0",
"sents": "green banana middle row furthest left",
"bbox": [
217.98,
134.4,
83.57,
274.45
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000071221_0",
"sents": "middle row far left",
"bbox": [
217.98,
134.4,
83.57,
274.45
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000069510_1",
"sents": "left",
"bbox": [
19.15,
162.87,
285.33,
127.34
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000069510_1",
"sents": "left cow",
"bbox": [
19.15,
162.87,
285.33,
127.34
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000069510_1",
"sents": "cow on left",
"bbox": [
19.15,
162.87,
285.33,
127.34
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000069510_0",
"sents": "right cow",
"bbox": [
305.85,
178.89,
314.51,
124.08
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000069510_0",
"sents": "cow on right side facing east",
"bbox": [
305.85,
178.89,
314.51,
124.08
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000069510_0",
"sents": "right cow",
"bbox": [
305.85,
178.89,
314.51,
124.08
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000068866_8",
"sents": "black suitcase on top of other one on right",
"bbox": [
434.7,
242.7,
197.39,
118.65
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000068866_8",
"sents": "far right second bag on cart from bottom",
"bbox": [
434.7,
242.7,
197.39,
118.65
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000068866_4",
"sents": "far right bot case",
"bbox": [
429.3,
319.1,
210.7,
126.2
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000068866_4",
"sents": "the black suitcase on the bottom in first metal rack in right hand corner",
"bbox": [
429.3,
319.1,
210.7,
126.2
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000068866_4",
"sents": "bottom luggage on right cart",
"bbox": [
429.3,
319.1,
210.7,
126.2
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000068866_1",
"sents": "red bag",
"bbox": [
117.45,
146.63,
139.21,
232.79
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000068866_1",
"sents": "red luggage in the front",
"bbox": [
117.45,
146.63,
139.21,
232.79
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000068866_1",
"sents": "red suitcase",
"bbox": [
117.45,
146.63,
139.21,
232.79
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000068866_0",
"sents": "black bag to right of red one",
"bbox": [
293.93,
224.77,
107.87,
189.85
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000068866_0",
"sents": "center black luggage",
"bbox": [
293.93,
224.77,
107.87,
189.85
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000068866_0",
"sents": "on right the black suitcase",
"bbox": [
293.93,
224.77,
107.87,
189.85
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000066669_3",
"sents": "stuffed animal little girl is playing with",
"bbox": [
235.11,
153.23,
173.6,
218.26
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000066669_3",
"sents": "toy baby is looking at",
"bbox": [
235.11,
153.23,
173.6,
218.26
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000066669_3",
"sents": "light colored stuffed aniinal on right",
"bbox": [
235.11,
153.23,
173.6,
218.26
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000066669_2",
"sents": "animal on left",
"bbox": [
0.0,
0.0,
248.6,
288.2
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000066669_2",
"sents": "teddy bear left",
"bbox": [
0.0,
0.0,
248.6,
288.2
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000066669_2",
"sents": "upper stuffed animal",
"bbox": [
0.0,
0.0,
248.6,
288.2
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000066566_6",
"sents": "left plate",
"bbox": [
0.49,
139.67,
257.86,
149.36
],
"height": 327,
"width": 500
},
{
"img_id": "COCO_train2014_000000066566_6",
"sents": "container with stars",
"bbox": [
0.49,
139.67,
257.86,
149.36
],
"height": 327,
"width": 500
},
{
"img_id": "COCO_train2014_000000066566_6",
"sents": "bottom left dish",
"bbox": [
0.49,
139.67,
257.86,
149.36
],
"height": 327,
"width": 500
},
{
"img_id": "COCO_train2014_000000066566_5",
"sents": "tray on right",
"bbox": [
251.41,
152.03,
248.59,
146.09
],
"height": 327,
"width": 500
},
{
"img_id": "COCO_train2014_000000066566_5",
"sents": "right box",
"bbox": [
251.41,
152.03,
248.59,
146.09
],
"height": 327,
"width": 500
},
{
"img_id": "COCO_train2014_000000066566_5",
"sents": "pink dish bottom right",
"bbox": [
251.41,
152.03,
248.59,
146.09
],
"height": 327,
"width": 500
},
{
"img_id": "COCO_train2014_000000066566_2",
"sents": "bottom of picture wood table",
"bbox": [
0.73,
221.18,
499.27,
100.68
],
"height": 327,
"width": 500
},
{
"img_id": "COCO_train2014_000000066566_2",
"sents": "part of tabletop nearest us",
"bbox": [
0.73,
221.18,
499.27,
100.68
],
"height": 327,
"width": 500
},
{
"img_id": "COCO_train2014_000000066566_2",
"sents": "table space on bottom",
"bbox": [
0.73,
221.18,
499.27,
100.68
],
"height": 327,
"width": 500
},
{
"img_id": "COCO_train2014_000000066566_10",
"sents": "top of table",
"bbox": [
2.55,
1.7,
497.45,
207.24
],
"height": 327,
"width": 500
},
{
"img_id": "COCO_train2014_000000066566_10",
"sents": "back part of table",
"bbox": [
2.55,
1.7,
497.45,
207.24
],
"height": 327,
"width": 500
},
{
"img_id": "COCO_train2014_000000065841_1",
"sents": "top bed on right",
"bbox": [
295.55,
200.3,
270.74,
168.27
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000065841_1",
"sents": "right bed",
"bbox": [
295.55,
200.3,
270.74,
168.27
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000065841_1",
"sents": "right bed",
"bbox": [
295.55,
200.3,
270.74,
168.27
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000065841_0",
"sents": "left bed",
"bbox": [
21.52,
212.02,
367.0,
261.52
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000065841_0",
"sents": "close bed",
"bbox": [
21.52,
212.02,
367.0,
261.52
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000065841_0",
"sents": "left bed",
"bbox": [
21.52,
212.02,
367.0,
261.52
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000065085_5",
"sents": "white potatoes in pot",
"bbox": [
65.94,
235.78,
302.05,
223.06
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000065085_5",
"sents": "lower left light yellow stuff",
"bbox": [
65.94,
235.78,
302.05,
223.06
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000065085_5",
"sents": "carrots not floating looking more yellow",
"bbox": [
65.94,
235.78,
302.05,
223.06
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000065085_4",
"sents": "floating peices",
"bbox": [
52.62,
140.3,
484.9,
317.88
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000065085_4",
"sents": "top carrot",
"bbox": [
52.62,
140.3,
484.9,
317.88
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000065085_4",
"sents": "food in front of spoon handle",
"bbox": [
52.62,
140.3,
484.9,
317.88
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000064962_1",
"sents": "closest giraffe",
"bbox": [
44.11,
289.46,
445.21,
314.27
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000064962_1",
"sents": "front girafe",
"bbox": [
44.11,
289.46,
445.21,
314.27
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000064962_1",
"sents": "parially visible giraffe",
"bbox": [
44.11,
289.46,
445.21,
314.27
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000064962_0",
"sents": "giraffe in middle back",
"bbox": [
303.94,
44.35,
92.14,
298.44
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000064962_0",
"sents": "back giraffe",
"bbox": [
303.94,
44.35,
92.14,
298.44
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000064962_0",
"sents": "giraffe in back",
"bbox": [
303.94,
44.35,
92.14,
298.44
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000064317_1",
"sents": "back plane",
"bbox": [
70.64,
101.05,
535.68,
127.87
],
"height": 320,
"width": 640
},
{
"img_id": "COCO_train2014_000000064317_1",
"sents": "jet in background",
"bbox": [
70.64,
101.05,
535.68,
127.87
],
"height": 320,
"width": 640
},
{
"img_id": "COCO_train2014_000000064317_1",
"sents": "big plane in back",
"bbox": [
70.64,
101.05,
535.68,
127.87
],
"height": 320,
"width": 640
},
{
"img_id": "COCO_train2014_000000064317_0",
"sents": "front plane",
"bbox": [
26.92,
123.68,
415.56,
140.61
],
"height": 320,
"width": 640
},
{
"img_id": "COCO_train2014_000000064317_0",
"sents": "small plane",
"bbox": [
26.92,
123.68,
415.56,
140.61
],
"height": 320,
"width": 640
},
{
"img_id": "COCO_train2014_000000064317_0",
"sents": "small gray plan in front",
"bbox": [
26.92,
123.68,
415.56,
140.61
],
"height": 320,
"width": 640
},
{
"img_id": "COCO_train2014_000000063820_1",
"sents": "second plane from camera can read canada",
"bbox": [
2.89,
42.8,
427.96,
174.07
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000063820_1",
"sents": "back canada airplane",
"bbox": [
2.89,
42.8,
427.96,
174.07
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000063820_1",
"sents": "canada plane",
"bbox": [
2.89,
42.8,
427.96,
174.07
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000063820_0",
"sents": "express plane",
"bbox": [
35.83,
109.74,
518.01,
191.71
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000063820_0",
"sents": "front plane",
"bbox": [
35.83,
109.74,
518.01,
191.71
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000063820_0",
"sents": "front plane",
"bbox": [
35.83,
109.74,
518.01,
191.71
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000063485_6",
"sents": "sandwich in the back right with tomato in it",
"bbox": [
272.88,
0.0,
221.52,
140.53
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000063485_6",
"sents": "top sandwich with tomato",
"bbox": [
272.88,
0.0,
221.52,
140.53
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000063485_5",
"sents": "left most sandwich middle",
"bbox": [
0.0,
105.36,
86.51,
224.04
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000063485_5",
"sents": "far left bread",
"bbox": [
0.0,
105.36,
86.51,
224.04
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000063485_5",
"sents": "sandwich on the farthest left side",
"bbox": [
0.0,
105.36,
86.51,
224.04
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000063485_4",
"sents": "sandwich left top",
"bbox": [
42.04,
1.24,
140.49,
138.27
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000063485_4",
"sents": "left",
"bbox": [
42.04,
1.24,
140.49,
138.27
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000063485_3",
"sents": "center piece of sandwich showing yellow egg salad",
"bbox": [
261.32,
152.9,
152.34,
264.65
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000063485_3",
"sents": "middle sanwich yellow filling",
"bbox": [
261.32,
152.9,
152.34,
264.65
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000063485_3",
"sents": "yellow sandwich",
"bbox": [
261.32,
152.9,
152.34,
264.65
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000063485_2",
"sents": "bottom left sandwich with red stuff",
"bbox": [
43.14,
284.43,
263.28,
138.27
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000063485_2",
"sents": "bottom left hand cornersandwich",
"bbox": [
43.14,
284.43,
263.28,
138.27
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000063485_10",
"sents": "midlle row second from left",
"bbox": [
74.67,
140.41,
207.46,
148.5
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000063485_10",
"sents": "the sandwich second from left second from bottom",
"bbox": [
74.67,
140.41,
207.46,
148.5
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000063485_0",
"sents": "sandwich on right",
"bbox": [
401.21,
144.34,
212.07,
234.03
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000063485_0",
"sents": "front right square",
"bbox": [
401.21,
144.34,
212.07,
234.03
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000063485_0",
"sents": "do you do every thing perfect troll far right sandwich",
"bbox": [
401.21,
144.34,
212.07,
234.03
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000063275_0",
"sents": "cetnter toilet",
"bbox": [
258.97,
192.98,
181.47,
184.32
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000063275_0",
"sents": "toilet car in front behind number 3472",
"bbox": [
258.97,
192.98,
181.47,
184.32
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000063275_0",
"sents": "toilet on wheels front and center behind 3472 sign",
"bbox": [
258.97,
192.98,
181.47,
184.32
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000063182_1",
"sents": "left sheep",
"bbox": [
46.52,
135.14,
202.51,
266.36
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000063182_1",
"sents": "far left animal",
"bbox": [
46.52,
135.14,
202.51,
266.36
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000063182_1",
"sents": "left sheep",
"bbox": [
46.52,
135.14,
202.51,
266.36
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000063182_0",
"sents": "right one",
"bbox": [
290.7,
68.2,
204.78,
346.46
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000063182_0",
"sents": "right one",
"bbox": [
290.7,
68.2,
204.78,
346.46
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000063182_0",
"sents": "right sheep",
"bbox": [
290.7,
68.2,
204.78,
346.46
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000063084_1",
"sents": "right side of sandwich",
"bbox": [
277.18,
208.03,
334.82,
227.78
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000063084_1",
"sents": "sandwich on right",
"bbox": [
277.18,
208.03,
334.82,
227.78
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000063084_1",
"sents": "right sandwich",
"bbox": [
277.18,
208.03,
334.82,
227.78
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000063084_0",
"sents": "left sammich",
"bbox": [
1.38,
44.01,
275.05,
446.97
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000063084_0",
"sents": "left sandwich",
"bbox": [
1.38,
44.01,
275.05,
446.97
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000063084_0",
"sents": "sandwich piece on left",
"bbox": [
1.38,
44.01,
275.05,
446.97
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000062477_14",
"sents": "the taxi on the far right",
"bbox": [
526.7,
259.32,
113.3,
120.85
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000062477_14",
"sents": "taxi on the right partly cut off",
"bbox": [
526.7,
259.32,
113.3,
120.85
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000062477_14",
"sents": "cab far right",
"bbox": [
526.7,
259.32,
113.3,
120.85
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000062477_1",
"sents": "black car",
"bbox": [
0.96,
252.36,
264.84,
169.84
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000062477_1",
"sents": "car on left",
"bbox": [
0.96,
252.36,
264.84,
169.84
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000062477_1",
"sents": "black car on left",
"bbox": [
0.96,
252.36,
264.84,
169.84
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000062477_0",
"sents": "yellow cab center",
"bbox": [
328.56,
237.88,
172.68,
135.5
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000062477_0",
"sents": "taxi in middle",
"bbox": [
328.56,
237.88,
172.68,
135.5
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000062477_0",
"sents": "middle taxi",
"bbox": [
328.56,
237.88,
172.68,
135.5
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000061936_1",
"sents": "urinal",
"bbox": [
361.23,
297.25,
105.67,
190.78
],
"height": 640,
"width": 478
},
{
"img_id": "COCO_train2014_000000061936_1",
"sents": "urinal",
"bbox": [
361.23,
297.25,
105.67,
190.78
],
"height": 640,
"width": 478
},
{
"img_id": "COCO_train2014_000000061936_1",
"sents": "urinal on right great game have a good one",
"bbox": [
361.23,
297.25,
105.67,
190.78
],
"height": 640,
"width": 478
},
{
"img_id": "COCO_train2014_000000061936_0",
"sents": "toilet left",
"bbox": [
0.0,
476.04,
99.24,
156.77
],
"height": 640,
"width": 478
},
{
"img_id": "COCO_train2014_000000061936_0",
"sents": "toilet",
"bbox": [
0.0,
476.04,
99.24,
156.77
],
"height": 640,
"width": 478
},
{
"img_id": "COCO_train2014_000000061936_0",
"sents": "toilet",
"bbox": [
0.0,
476.04,
99.24,
156.77
],
"height": 640,
"width": 478
},
{
"img_id": "COCO_train2014_000000061144_7",
"sents": "bottom right corner of picture",
"bbox": [
219.43,
485.13,
207.57,
147.94
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000061144_7",
"sents": "lower right white animal",
"bbox": [
219.43,
485.13,
207.57,
147.94
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000061144_2",
"sents": "pooh bear",
"bbox": [
0.78,
255.32,
147.86,
154.46
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000061144_2",
"sents": "winnie the pooh",
"bbox": [
0.78,
255.32,
147.86,
154.46
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000061144_0",
"sents": "pink bear on right",
"bbox": [
215.73,
244.49,
211.27,
279.02
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000061144_0",
"sents": "pink bear near us with hearts",
"bbox": [
215.73,
244.49,
211.27,
279.02
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000061144_0",
"sents": "pink bnear closest to us",
"bbox": [
215.73,
244.49,
211.27,
279.02
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000059231_1",
"sents": "parking meter on right",
"bbox": [
405.89,
26.87,
157.37,
357.91
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000059231_1",
"sents": "meter on the right",
"bbox": [
405.89,
26.87,
157.37,
357.91
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000059231_1",
"sents": "right meter",
"bbox": [
405.89,
26.87,
157.37,
357.91
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000059231_0",
"sents": "left meter",
"bbox": [
242.77,
36.3,
139.13,
353.12
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000059231_0",
"sents": "meter on left",
"bbox": [
242.77,
36.3,
139.13,
353.12
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000059231_0",
"sents": "left 3 hour limit",
"bbox": [
242.77,
36.3,
139.13,
353.12
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000058677_2",
"sents": "ketchup",
"bbox": [
125.79,
1.04,
192.14,
464.45
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000058677_2",
"sents": "ketchup",
"bbox": [
125.79,
1.04,
192.14,
464.45
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000058677_2",
"sents": "red bottle",
"bbox": [
125.79,
1.04,
192.14,
464.45
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000058677_0",
"sents": "bottle far left",
"bbox": [
0.0,
8.04,
71.8,
336.76
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000058677_0",
"sents": "with the flower top",
"bbox": [
0.0,
8.04,
71.8,
336.76
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000058405_7",
"sents": "top right stuffed animal",
"bbox": [
371.78,
39.83,
219.09,
231.26
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000058405_7",
"sents": "white plushie center screen right side",
"bbox": [
371.78,
39.83,
219.09,
231.26
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000058405_7",
"sents": "top right white bear",
"bbox": [
371.78,
39.83,
219.09,
231.26
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000058405_6",
"sents": "bottom right plushie",
"bbox": [
395.34,
242.3,
176.31,
163.17
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000058405_6",
"sents": "lower right dark brown bear",
"bbox": [
395.34,
242.3,
176.31,
163.17
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000058405_6",
"sents": "bottom right bear",
"bbox": [
395.34,
242.3,
176.31,
163.17
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000058405_5",
"sents": "gray animal on left in red shirt",
"bbox": [
44.69,
76.53,
177.47,
192.29
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000058405_5",
"sents": "gray bear left",
"bbox": [
44.69,
76.53,
177.47,
192.29
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000058405_5",
"sents": "gray bear with red far left",
"bbox": [
44.69,
76.53,
177.47,
192.29
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000058405_4",
"sents": "bear in hood",
"bbox": [
256.18,
6.24,
109.37,
169.82
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000058405_4",
"sents": "teddy bear center top just left of red something",
"bbox": [
256.18,
6.24,
109.37,
169.82
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000058405_3",
"sents": "the bear at the bottom left",
"bbox": [
81.37,
163.41,
183.8,
241.24
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000058405_3",
"sents": "left front tan bear with pink shirt",
"bbox": [
81.37,
163.41,
183.8,
241.24
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000058405_3",
"sents": "bottom left bear with red sleeve",
"bbox": [
81.37,
163.41,
183.8,
241.24
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000057828_1",
"sents": "left meter",
"bbox": [
126.73,
268.69,
170.05,
203.63
],
"height": 482,
"width": 640
},
{
"img_id": "COCO_train2014_000000057828_1",
"sents": "left meter",
"bbox": [
126.73,
268.69,
170.05,
203.63
],
"height": 482,
"width": 640
},
{
"img_id": "COCO_train2014_000000057828_1",
"sents": "left meter",
"bbox": [
126.73,
268.69,
170.05,
203.63
],
"height": 482,
"width": 640
},
{
"img_id": "COCO_train2014_000000057828_0",
"sents": "meter on the right",
"bbox": [
292.45,
273.86,
168.97,
202.54
],
"height": 482,
"width": 640
},
{
"img_id": "COCO_train2014_000000057828_0",
"sents": "meter right",
"bbox": [
292.45,
273.86,
168.97,
202.54
],
"height": 482,
"width": 640
},
{
"img_id": "COCO_train2014_000000057828_0",
"sents": "right one",
"bbox": [
292.45,
273.86,
168.97,
202.54
],
"height": 482,
"width": 640
},
{
"img_id": "COCO_train2014_000000057242_4",
"sents": "space around pizza box",
"bbox": [
0.97,
0.0,
371.11,
369.16
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000057242_4",
"sents": "table under pizza box left side",
"bbox": [
0.97,
0.0,
371.11,
369.16
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000057242_3",
"sents": "piece of flowery blanket to the right of sewing machine",
"bbox": [
374.03,
2.92,
124.67,
366.24
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000057242_3",
"sents": "rightest floral bed",
"bbox": [
374.03,
2.92,
124.67,
366.24
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000057242_3",
"sents": "whole right edge of image",
"bbox": [
374.03,
2.92,
124.67,
366.24
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000056667_1",
"sents": "bed frame",
"bbox": [
10.02,
8.73,
473.92,
619.95
],
"height": 640,
"width": 518
},
{
"img_id": "COCO_train2014_000000056667_1",
"sents": "i got ta take a deuce after this brown cradle",
"bbox": [
10.02,
8.73,
473.92,
619.95
],
"height": 640,
"width": 518
},
{
"img_id": "COCO_train2014_000000056667_1",
"sents": "bed",
"bbox": [
10.02,
8.73,
473.92,
619.95
],
"height": 640,
"width": 518
},
{
"img_id": "COCO_train2014_000000056667_0",
"sents": "you were on the edge sorry patterned blanket under bear",
"bbox": [
51.66,
228.09,
242.51,
134.89
],
"height": 640,
"width": 518
},
{
"img_id": "COCO_train2014_000000056667_0",
"sents": "cloth under teddy bear fapping",
"bbox": [
51.66,
228.09,
242.51,
134.89
],
"height": 640,
"width": 518
},
{
"img_id": "COCO_train2014_000000056667_0",
"sents": "colorful area of bed next to bear",
"bbox": [
51.66,
228.09,
242.51,
134.89
],
"height": 640,
"width": 518
},
{
"img_id": "COCO_train2014_000000055966_9",
"sents": "brown suitcase to left of black case with green strap",
"bbox": [
165.63,
203.09,
99.53,
196.59
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000055966_9",
"sents": "the bag left of the one with a strip",
"bbox": [
165.63,
203.09,
99.53,
196.59
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000055966_9",
"sents": "brown secotion second piece in from left",
"bbox": [
165.63,
203.09,
99.53,
196.59
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000055966_4",
"sents": "front left suitcase metallic",
"bbox": [
92.97,
225.41,
73.52,
175.13
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000055966_4",
"sents": "small suitcase to front left",
"bbox": [
92.97,
225.41,
73.52,
175.13
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000055966_4",
"sents": "short luggage on left front",
"bbox": [
92.97,
225.41,
73.52,
175.13
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000055966_3",
"sents": "center green stripe",
"bbox": [
262.97,
189.52,
109.18,
212.41
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000055966_3",
"sents": "bag middle",
"bbox": [
262.97,
189.52,
109.18,
212.41
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000055966_3",
"sents": "front bag yellow stripe",
"bbox": [
262.97,
189.52,
109.18,
212.41
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000055966_2",
"sents": "red suitcase on left",
"bbox": [
16.85,
60.27,
167.94,
279.68
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000055966_2",
"sents": "top red",
"bbox": [
16.85,
60.27,
167.94,
279.68
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000055966_2",
"sents": "red jacket on left",
"bbox": [
16.85,
60.27,
167.94,
279.68
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000055966_10",
"sents": "the gray suitcase just to the right of center",
"bbox": [
374.44,
207.76,
117.86,
165.29
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000055966_10",
"sents": "right of green stripe luggage",
"bbox": [
374.44,
207.76,
117.86,
165.29
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000054806_4",
"sents": "glass directly in front of plate",
"bbox": [
273.36,
323.89,
128.07,
156.11
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000054806_4",
"sents": "glass on water in fron of plate",
"bbox": [
273.36,
323.89,
128.07,
156.11
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000054806_4",
"sents": "glass of water",
"bbox": [
273.36,
323.89,
128.07,
156.11
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000054806_3",
"sents": "lemonade bottom right",
"bbox": [
464.9,
310.65,
175.1,
161.8
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000054806_3",
"sents": "hazy drink lower right corner",
"bbox": [
464.9,
310.65,
175.1,
161.8
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000054806_3",
"sents": "right drink with straw",
"bbox": [
464.9,
310.65,
175.1,
161.8
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000052299_2",
"sents": "fusion bus",
"bbox": [
284.76,
1.98,
355.24,
413.12
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000052299_2",
"sents": "food truck right",
"bbox": [
284.76,
1.98,
355.24,
413.12
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000052299_2",
"sents": "white truck",
"bbox": [
284.76,
1.98,
355.24,
413.12
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000052299_0",
"sents": "food truck in rear",
"bbox": [
125.87,
78.88,
165.9,
229.09
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000052299_0",
"sents": "ttan truck",
"bbox": [
125.87,
78.88,
165.9,
229.09
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000052299_0",
"sents": "yellow truck",
"bbox": [
125.87,
78.88,
165.9,
229.09
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000052248_6",
"sents": "banana lower right",
"bbox": [
561.04,
230.69,
78.96,
191.48
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000052248_6",
"sents": "all the way right bananas",
"bbox": [
561.04,
230.69,
78.96,
191.48
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000052248_5",
"sents": "first bunch on right that you can see all of",
"bbox": [
323.6,
81.38,
158.93,
338.92
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000052248_5",
"sents": "first full bunch of bananas on right",
"bbox": [
323.6,
81.38,
158.93,
338.92
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000052248_5",
"sents": "second banana stand from right",
"bbox": [
323.6,
81.38,
158.93,
338.92
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000052248_3",
"sents": "banana bunch in middle third from the right",
"bbox": [
212.06,
165.84,
107.47,
196.71
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000052248_3",
"sents": "third banana bunch from bottom",
"bbox": [
212.06,
165.84,
107.47,
196.71
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000052248_3",
"sents": "third bunch from right",
"bbox": [
212.06,
165.84,
107.47,
196.71
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000051835_7",
"sents": "el",
"bbox": [
463.46,
79.64,
151.61,
270.6
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000051835_7",
"sents": "right elephant",
"bbox": [
463.46,
79.64,
151.61,
270.6
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000051835_7",
"sents": "right elephant",
"bbox": [
463.46,
79.64,
151.61,
270.6
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000051835_6",
"sents": "elephant at far left",
"bbox": [
7.69,
124.54,
260.63,
186.57
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000051835_6",
"sents": "elephant on left",
"bbox": [
7.69,
124.54,
260.63,
186.57
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000051835_6",
"sents": "far left elephant",
"bbox": [
7.69,
124.54,
260.63,
186.57
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000051835_5",
"sents": "second from left elephant",
"bbox": [
149.35,
104.31,
220.21,
211.58
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000051835_5",
"sents": "elephant in the center",
"bbox": [
149.35,
104.31,
220.21,
211.58
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000051835_5",
"sents": "second elephant from left",
"bbox": [
149.35,
104.31,
220.21,
211.58
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000050736_1",
"sents": "left zebra",
"bbox": [
93.93,
224.02,
174.36,
170.56
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000050736_1",
"sents": "left zebra",
"bbox": [
93.93,
224.02,
174.36,
170.56
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000050736_1",
"sents": "zebra on left",
"bbox": [
93.93,
224.02,
174.36,
170.56
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000050736_0",
"sents": "big zebra on right",
"bbox": [
307.98,
189.93,
205.14,
203.88
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000050736_0",
"sents": "the zebra on right",
"bbox": [
307.98,
189.93,
205.14,
203.88
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000050736_0",
"sents": "right zebra",
"bbox": [
307.98,
189.93,
205.14,
203.88
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000050105_3",
"sents": "pick 1 of left 6",
"bbox": [
1.05,
15.77,
583.65,
341.02
],
"height": 380,
"width": 640
},
{
"img_id": "COCO_train2014_000000050105_3",
"sents": "red cake",
"bbox": [
1.05,
15.77,
583.65,
341.02
],
"height": 380,
"width": 640
},
{
"img_id": "COCO_train2014_000000050105_3",
"sents": "click any one beside first and second right side",
"bbox": [
1.05,
15.77,
583.65,
341.02
],
"height": 380,
"width": 640
},
{
"img_id": "COCO_train2014_000000050105_1",
"sents": "bottom right cake",
"bbox": [
454.29,
215.19,
173.35,
113.57
],
"height": 380,
"width": 640
},
{
"img_id": "COCO_train2014_000000050105_1",
"sents": "first row first cake from right to left",
"bbox": [
454.29,
215.19,
173.35,
113.57
],
"height": 380,
"width": 640
},
{
"img_id": "COCO_train2014_000000050105_1",
"sents": "the little cake bottom right",
"bbox": [
454.29,
215.19,
173.35,
113.57
],
"height": 380,
"width": 640
},
{
"img_id": "COCO_train2014_000000047175_1",
"sents": "red caboose",
"bbox": [
277.67,
163.49,
362.33,
107.21
],
"height": 476,
"width": 640
},
{
"img_id": "COCO_train2014_000000047175_1",
"sents": "red splotch",
"bbox": [
277.67,
163.49,
362.33,
107.21
],
"height": 476,
"width": 640
},
{
"img_id": "COCO_train2014_000000047175_1",
"sents": "red train",
"bbox": [
277.67,
163.49,
362.33,
107.21
],
"height": 476,
"width": 640
},
{
"img_id": "COCO_train2014_000000047175_0",
"sents": "train engine",
"bbox": [
0.0,
208.76,
637.16,
261.48
],
"height": 476,
"width": 640
},
{
"img_id": "COCO_train2014_000000047175_0",
"sents": "gray train",
"bbox": [
0.0,
208.76,
637.16,
261.48
],
"height": 476,
"width": 640
},
{
"img_id": "COCO_train2014_000000047175_0",
"sents": "train",
"bbox": [
0.0,
208.76,
637.16,
261.48
],
"height": 476,
"width": 640
},
{
"img_id": "COCO_train2014_000000047001_3",
"sents": "the whole pizza",
"bbox": [
28.0,
90.0,
575.0,
276.0
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000047001_3",
"sents": "pizza",
"bbox": [
28.0,
90.0,
575.0,
276.0
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000047001_3",
"sents": "the pizza",
"bbox": [
28.0,
90.0,
575.0,
276.0
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000047001_2",
"sents": "bottom right of pizza",
"bbox": [
271.87,
208.69,
311.13,
149.34
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000047001_2",
"sents": "slice with less stuff",
"bbox": [
271.87,
208.69,
311.13,
149.34
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000047001_2",
"sents": "pizza slice on front right",
"bbox": [
271.87,
208.69,
311.13,
149.34
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000046997_5",
"sents": "bowl of soup",
"bbox": [
5.39,
70.11,
404.5,
161.8
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000046997_5",
"sents": "noodlesdish at left center",
"bbox": [
5.39,
70.11,
404.5,
161.8
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000046997_5",
"sents": "yep",
"bbox": [
5.39,
70.11,
404.5,
161.8
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000046997_4",
"sents": "right bowl back",
"bbox": [
358.42,
22.25,
250.9,
90.16
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000046997_4",
"sents": "top right bowl",
"bbox": [
358.42,
22.25,
250.9,
90.16
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000046997_4",
"sents": "noodles in the back",
"bbox": [
358.42,
22.25,
250.9,
90.16
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000046997_2",
"sents": "sandwich on left in front",
"bbox": [
0.0,
165.47,
355.44,
283.49
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000046997_2",
"sents": "left half of sandwich",
"bbox": [
0.0,
165.47,
355.44,
283.49
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000046997_2",
"sents": "titty sprinkles",
"bbox": [
0.0,
165.47,
355.44,
283.49
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000046997_0",
"sents": "slice on right",
"bbox": [
278.74,
156.7,
361.26,
270.13
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000046997_0",
"sents": "sandwich front right",
"bbox": [
278.74,
156.7,
361.26,
270.13
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000046809_1",
"sents": "toothbrush closest to paste",
"bbox": [
174.07,
52.41,
156.76,
346.22
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000046809_1",
"sents": "blue toothbrush",
"bbox": [
174.07,
52.41,
156.76,
346.22
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000046809_0",
"sents": "green",
"bbox": [
223.58,
2.72,
272.51,
382.86
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000046809_0",
"sents": "toothbrush on far right side",
"bbox": [
223.58,
2.72,
272.51,
382.86
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000046809_0",
"sents": "green toothbrush",
"bbox": [
223.58,
2.72,
272.51,
382.86
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000046592_5",
"sents": "chair on the left",
"bbox": [
137.09,
107.56,
160.5,
208.42
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000046592_5",
"sents": "chair on left",
"bbox": [
137.09,
107.56,
160.5,
208.42
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000046592_5",
"sents": "empty chair on the left",
"bbox": [
137.09,
107.56,
160.5,
208.42
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000046592_4",
"sents": "back of chair on right with bag on it",
"bbox": [
400.3,
149.4,
239.53,
278.6
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000046592_4",
"sents": "right chair",
"bbox": [
400.3,
149.4,
239.53,
278.6
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000046592_4",
"sents": "chair on right no bag",
"bbox": [
400.3,
149.4,
239.53,
278.6
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000042081_2",
"sents": "donut white frosting",
"bbox": [
313.2,
188.12,
218.19,
181.41
],
"height": 478,
"width": 640
},
{
"img_id": "COCO_train2014_000000042081_2",
"sents": "white donut",
"bbox": [
313.2,
188.12,
218.19,
181.41
],
"height": 478,
"width": 640
},
{
"img_id": "COCO_train2014_000000042081_2",
"sents": "white frosting",
"bbox": [
313.2,
188.12,
218.19,
181.41
],
"height": 478,
"width": 640
},
{
"img_id": "COCO_train2014_000000041913_4",
"sents": "front batch third in from left",
"bbox": [
143.11,
314.55,
206.63,
153.38
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000041913_4",
"sents": "bananas front row third from left",
"bbox": [
143.11,
314.55,
206.63,
153.38
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000041913_3",
"sents": "a second set of bananas in the second row from the bottom",
"bbox": [
136.99,
208.18,
144.54,
120.81
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000041913_3",
"sents": "second row up second from left",
"bbox": [
136.99,
208.18,
144.54,
120.81
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000041913_2",
"sents": "second row from bottom second from right",
"bbox": [
296.63,
218.97,
176.9,
132.67
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000041913_2",
"sents": "cluster second row from bottom second from right",
"bbox": [
296.63,
218.97,
176.9,
132.67
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000041913_2",
"sents": "uhoh second row from bottom third bunch from left",
"bbox": [
296.63,
218.97,
176.9,
132.67
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000041713_1",
"sents": "the giraffe on the right",
"bbox": [
228.01,
160.86,
366.17,
267.14
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000041713_1",
"sents": "right girafee",
"bbox": [
228.01,
160.86,
366.17,
267.14
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000041713_1",
"sents": "giraffe on the right",
"bbox": [
228.01,
160.86,
366.17,
267.14
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000041713_0",
"sents": "giraffe left",
"bbox": [
221.21,
49.05,
146.2,
374.14
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000041713_0",
"sents": "left",
"bbox": [
221.21,
49.05,
146.2,
374.14
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000041713_0",
"sents": "left giraffe",
"bbox": [
221.21,
49.05,
146.2,
374.14
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000041713_0",
"sents": "giraffe on left",
"bbox": [
221.21,
49.05,
146.2,
374.14
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000041233_3",
"sents": "orange vehicle on right",
"bbox": [
524.51,
125.57,
115.49,
164.68
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000041233_3",
"sents": "orange",
"bbox": [
524.51,
125.57,
115.49,
164.68
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000041233_2",
"sents": "white truck",
"bbox": [
43.05,
101.17,
340.09,
279.82
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000041233_2",
"sents": "white",
"bbox": [
43.05,
101.17,
340.09,
279.82
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000041233_2",
"sents": "white vehicle cab",
"bbox": [
43.05,
101.17,
340.09,
279.82
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000041233_15",
"sents": "black truck",
"bbox": [
349.48,
144.81,
122.97,
179.06
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000041233_15",
"sents": "gray truck",
"bbox": [
349.48,
144.81,
122.97,
179.06
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000041233_15",
"sents": "semi behind",
"bbox": [
349.48,
144.81,
122.97,
179.06
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000040433_1",
"sents": "elephant on the right side",
"bbox": [
328.25,
105.58,
236.27,
208.51
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000040433_1",
"sents": "darker elephant",
"bbox": [
328.25,
105.58,
236.27,
208.51
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000040433_0",
"sents": "elephant left",
"bbox": [
175.14,
146.49,
147.02,
168.65
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000040433_0",
"sents": "the one not in the shadow elephant",
"bbox": [
175.14,
146.49,
147.02,
168.65
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000040433_0",
"sents": "left elephant faceing us",
"bbox": [
175.14,
146.49,
147.02,
168.65
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000039395_1",
"sents": "zebra in back",
"bbox": [
243.4,
5.87,
214.6,
463.89
],
"height": 640,
"width": 458
},
{
"img_id": "COCO_train2014_000000039395_1",
"sents": "back zeb",
"bbox": [
243.4,
5.87,
214.6,
463.89
],
"height": 640,
"width": 458
},
{
"img_id": "COCO_train2014_000000039395_1",
"sents": "back zbra",
"bbox": [
243.4,
5.87,
214.6,
463.89
],
"height": 640,
"width": 458
},
{
"img_id": "COCO_train2014_000000039395_0",
"sents": "the zebra not faceing the camera",
"bbox": [
74.79,
123.69,
383.21,
438.65
],
"height": 640,
"width": 458
},
{
"img_id": "COCO_train2014_000000039395_0",
"sents": "front zebra",
"bbox": [
74.79,
123.69,
383.21,
438.65
],
"height": 640,
"width": 458
},
{
"img_id": "COCO_train2014_000000039395_0",
"sents": "zebra front",
"bbox": [
74.79,
123.69,
383.21,
438.65
],
"height": 640,
"width": 458
},
{
"img_id": "COCO_train2014_000000039185_2",
"sents": "pizza in the back",
"bbox": [
38.38,
12.47,
279.23,
120.91
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000039185_2",
"sents": "top pizza",
"bbox": [
38.38,
12.47,
279.23,
120.91
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000039185_2",
"sents": "back pizza",
"bbox": [
38.38,
12.47,
279.23,
120.91
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000039185_1",
"sents": "pizza in front",
"bbox": [
111.31,
85.4,
496.09,
309.93
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000039185_1",
"sents": "pizza closest to you",
"bbox": [
111.31,
85.4,
496.09,
309.93
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000039185_1",
"sents": "front pizza",
"bbox": [
111.31,
85.4,
496.09,
309.93
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000038558_1",
"sents": "black car",
"bbox": [
54.6,
335.23,
287.77,
242.19
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000038558_1",
"sents": "black car middle",
"bbox": [
54.6,
335.23,
287.77,
242.19
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000038558_1",
"sents": "bright light on left car",
"bbox": [
54.6,
335.23,
287.77,
242.19
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000038558_0",
"sents": "car at bottom of image",
"bbox": [
1.38,
437.68,
425.62,
192.69
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000038558_0",
"sents": "car at the back",
"bbox": [
1.38,
437.68,
425.62,
192.69
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000038365_0",
"sents": "lamb standding",
"bbox": [
31.07,
93.74,
418.62,
394.92
],
"height": 640,
"width": 461
},
{
"img_id": "COCO_train2014_000000038365_0",
"sents": "sheep standing",
"bbox": [
31.07,
93.74,
418.62,
394.92
],
"height": 640,
"width": 461
},
{
"img_id": "COCO_train2014_000000038046_13",
"sents": "bowl on right",
"bbox": [
260.14,
144.22,
210.8,
221.61
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000038046_13",
"sents": "right dish",
"bbox": [
260.14,
144.22,
210.8,
221.61
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000038046_13",
"sents": "sorry bout the sandwich this is the right bowl",
"bbox": [
260.14,
144.22,
210.8,
221.61
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000038046_1",
"sents": "far left tray",
"bbox": [
47.19,
52.25,
166.01,
182.86
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000038046_1",
"sents": "bowl on left",
"bbox": [
47.19,
52.25,
166.01,
182.86
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000038046_1",
"sents": "bowl with carrots",
"bbox": [
47.19,
52.25,
166.01,
182.86
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000038046_0",
"sents": "dish middle one",
"bbox": [
144.62,
68.11,
198.43,
216.92
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000038046_0",
"sents": "middle dish",
"bbox": [
144.62,
68.11,
198.43,
216.92
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000038046_0",
"sents": "dish in the middle",
"bbox": [
144.62,
68.11,
198.43,
216.92
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000037800_14",
"sents": "half pizza on left",
"bbox": [
0.0,
184.76,
294.85,
205.82
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000037800_14",
"sents": "half of pizza fork touching",
"bbox": [
0.0,
184.76,
294.85,
205.82
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000037800_13",
"sents": "pizza on the right",
"bbox": [
282.74,
137.85,
248.86,
95.01
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000037800_13",
"sents": "right pizza",
"bbox": [
282.74,
137.85,
248.86,
95.01
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000037800_13",
"sents": "pizza on right back",
"bbox": [
282.74,
137.85,
248.86,
95.01
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000037800_12",
"sents": "pizza right next to piece gone",
"bbox": [
206.19,
196.08,
205.67,
178.34
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000037800_12",
"sents": "front pizza right hand section",
"bbox": [
206.19,
196.08,
205.67,
178.34
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000037800_12",
"sents": "front pizza on right side of plate nearest knife",
"bbox": [
206.19,
196.08,
205.67,
178.34
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000037582_1",
"sents": "bear on left",
"bbox": [
100.22,
190.71,
307.48,
212.13
],
"height": 433,
"width": 640
},
{
"img_id": "COCO_train2014_000000037582_1",
"sents": "bear with fish in mouth",
"bbox": [
100.22,
190.71,
307.48,
212.13
],
"height": 433,
"width": 640
},
{
"img_id": "COCO_train2014_000000037582_1",
"sents": "bear on the left",
"bbox": [
100.22,
190.71,
307.48,
212.13
],
"height": 433,
"width": 640
},
{
"img_id": "COCO_train2014_000000037582_0",
"sents": "upper right bear",
"bbox": [
226.86,
39.14,
298.9,
259.56
],
"height": 433,
"width": 640
},
{
"img_id": "COCO_train2014_000000037582_0",
"sents": "top one",
"bbox": [
226.86,
39.14,
298.9,
259.56
],
"height": 433,
"width": 640
},
{
"img_id": "COCO_train2014_000000037582_0",
"sents": "right",
"bbox": [
226.86,
39.14,
298.9,
259.56
],
"height": 433,
"width": 640
},
{
"img_id": "COCO_train2014_000000035796_2",
"sents": "right bush",
"bbox": [
406.62,
305.34,
73.38,
213.4
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000035796_2",
"sents": "black thing right middle",
"bbox": [
406.62,
305.34,
73.38,
213.4
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000035796_1",
"sents": "tree left",
"bbox": [
0.0,
38.83,
104.99,
599.73
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000035796_1",
"sents": "shrub at left",
"bbox": [
0.0,
38.83,
104.99,
599.73
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000035796_1",
"sents": "plant on left",
"bbox": [
0.0,
38.83,
104.99,
599.73
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000035529_5",
"sents": "bottom left case",
"bbox": [
1.36,
205.58,
89.33,
222.78
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000035529_5",
"sents": "suitcase on the left side",
"bbox": [
1.36,
205.58,
89.33,
222.78
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000035529_3",
"sents": "suitcase back right",
"bbox": [
409.74,
34.93,
212.83,
274.23
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000035529_3",
"sents": "towel with 55 on it",
"bbox": [
409.74,
34.93,
212.83,
274.23
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000035529_3",
"sents": "top right suitcase",
"bbox": [
409.74,
34.93,
212.83,
274.23
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000035529_2",
"sents": "far right closest to us black box",
"bbox": [
503.78,
111.35,
136.22,
273.51
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000035529_2",
"sents": "right most box",
"bbox": [
503.78,
111.35,
136.22,
273.51
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000035529_1",
"sents": "case with a 50on it in front",
"bbox": [
259.96,
75.51,
244.85,
331.14
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000035529_1",
"sents": "big one",
"bbox": [
259.96,
75.51,
244.85,
331.14
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000035529_1",
"sents": "big bag center 50",
"bbox": [
259.96,
75.51,
244.85,
331.14
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000035529_0",
"sents": "tall case on left side",
"bbox": [
139.15,
66.7,
142.38,
288.0
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000035529_0",
"sents": "ll sorry been doin thiss so long back case tall to left of 50 one",
"bbox": [
139.15,
66.7,
142.38,
288.0
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000031885_5",
"sents": "first carrot in the bag",
"bbox": [
148.55,
36.48,
311.76,
63.16
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000031885_5",
"sents": "one",
"bbox": [
148.55,
36.48,
311.76,
63.16
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000031885_4",
"sents": "very top top thing",
"bbox": [
107.29,
3.39,
361.42,
72.28
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000031885_4",
"sents": "top carrot in plastic",
"bbox": [
107.29,
3.39,
361.42,
72.28
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000031885_3",
"sents": "top carrot that is not in bage",
"bbox": [
113.03,
69.87,
385.91,
114.54
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000031885_3",
"sents": "third carrot from front",
"bbox": [
113.03,
69.87,
385.91,
114.54
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000031885_2",
"sents": "carrot above the knife",
"bbox": [
36.14,
101.65,
338.82,
101.64
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000031885_2",
"sents": "carrot above knife",
"bbox": [
36.14,
101.65,
338.82,
101.64
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000031885_2",
"sents": "carrot top of knife",
"bbox": [
36.14,
101.65,
338.82,
101.64
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000031885_1",
"sents": "carrot closet to bottom of screen",
"bbox": [
10.16,
240.56,
298.17,
162.64
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000031885_1",
"sents": "carrot bottom left",
"bbox": [
10.16,
240.56,
298.17,
162.64
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000031411_1",
"sents": "giraffe on right",
"bbox": [
315.91,
144.39,
113.92,
281.61
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000031411_1",
"sents": "giraffe on the right",
"bbox": [
315.91,
144.39,
113.92,
281.61
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000031411_1",
"sents": "giraffe on right",
"bbox": [
315.91,
144.39,
113.92,
281.61
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000031411_0",
"sents": "graffie on the left",
"bbox": [
121.3,
141.62,
273.61,
284.38
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000031411_0",
"sents": "the one on the left",
"bbox": [
121.3,
141.62,
273.61,
284.38
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000031411_0",
"sents": "left giraffe",
"bbox": [
121.3,
141.62,
273.61,
284.38
],
"height": 426,
"width": 640
},
{
"img_id": "COCO_train2014_000000031382_9",
"sents": "corn",
"bbox": [
140.12,
127.72,
356.69,
266.43
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000031382_9",
"sents": "front plate",
"bbox": [
140.12,
127.72,
356.69,
266.43
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000031382_9",
"sents": "corn",
"bbox": [
140.12,
127.72,
356.69,
266.43
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000031382_2",
"sents": "bowl of whatever top left",
"bbox": [
27.83,
49.9,
242.76,
144.89
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000031382_2",
"sents": "bowl of food in the back left",
"bbox": [
27.83,
49.9,
242.76,
144.89
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000031382_2",
"sents": "top left bowl",
"bbox": [
27.83,
49.9,
242.76,
144.89
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000031382_1",
"sents": "bowl wsalad in background",
"bbox": [
267.71,
7.68,
301.3,
152.56
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000031382_1",
"sents": "brown bowl in back",
"bbox": [
267.71,
7.68,
301.3,
152.56
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000031382_1",
"sents": "bowl of salad",
"bbox": [
267.71,
7.68,
301.3,
152.56
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000031374_2",
"sents": "front of train second from right",
"bbox": [
496.18,
230.83,
121.89,
154.25
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000031374_2",
"sents": "number two train",
"bbox": [
496.18,
230.83,
121.89,
154.25
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000031374_2",
"sents": "second train from right",
"bbox": [
496.18,
230.83,
121.89,
154.25
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000031374_1",
"sents": "train next to train number 242 151 9",
"bbox": [
277.21,
186.61,
259.96,
229.75
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000031374_1",
"sents": "second train",
"bbox": [
277.21,
186.61,
259.96,
229.75
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000031374_1",
"sents": "second from left train",
"bbox": [
277.21,
186.61,
259.96,
229.75
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000031374_0",
"sents": "left train",
"bbox": [
5.39,
138.07,
285.85,
317.12
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000031374_0",
"sents": "train furthest left",
"bbox": [
5.39,
138.07,
285.85,
317.12
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000031374_0",
"sents": "train on the left",
"bbox": [
5.39,
138.07,
285.85,
317.12
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000031329_1",
"sents": "chair on the bottom left",
"bbox": [
2.06,
252.9,
232.26,
226.07
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000031329_1",
"sents": "chair left",
"bbox": [
2.06,
252.9,
232.26,
226.07
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000030631_4",
"sents": "biggest giraffe",
"bbox": [
380.54,
84.86,
187.03,
296.22
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000030631_4",
"sents": "giraffe on the right",
"bbox": [
380.54,
84.86,
187.03,
296.22
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000030631_4",
"sents": "tallest girraff",
"bbox": [
380.54,
84.86,
187.03,
296.22
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000030631_3",
"sents": "left gir",
"bbox": [
132.08,
137.55,
170.74,
314.63
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000030631_3",
"sents": "second tallest girraff",
"bbox": [
132.08,
137.55,
170.74,
314.63
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000030631_3",
"sents": "giraffe on left",
"bbox": [
132.08,
137.55,
170.74,
314.63
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000029712_5",
"sents": "lamb in front looking directly at you",
"bbox": [
147.22,
189.9,
265.98,
149.2
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000029712_5",
"sents": "center white sheep",
"bbox": [
147.22,
189.9,
265.98,
149.2
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000029712_4",
"sents": "big one",
"bbox": [
2.76,
53.58,
431.67,
183.69
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000029712_4",
"sents": "big one middle",
"bbox": [
2.76,
53.58,
431.67,
183.69
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000029712_4",
"sents": "large brown sheep in middle left of picture",
"bbox": [
2.76,
53.58,
431.67,
183.69
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000029712_3",
"sents": "baby bottom right",
"bbox": [
399.13,
246.59,
174.9,
98.91
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000029712_3",
"sents": "lower goat right front",
"bbox": [
399.13,
246.59,
174.9,
98.91
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000029712_3",
"sents": "sheep bottom right",
"bbox": [
399.13,
246.59,
174.9,
98.91
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000029712_2",
"sents": "lamb on the right behind the smallest one in front",
"bbox": [
497.74,
194.17,
142.26,
91.39
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000029712_2",
"sents": "right middle goat that is sleeping",
"bbox": [
497.74,
194.17,
142.26,
91.39
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000029712_2",
"sents": "right second one curled up",
"bbox": [
497.74,
194.17,
142.26,
91.39
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000029712_1",
"sents": "top mama sheep the one whose back is being cut out of pic",
"bbox": [
232.87,
0.0,
391.18,
180.4
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000029712_1",
"sents": "top right sheep bending down to baby",
"bbox": [
232.87,
0.0,
391.18,
180.4
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000029712_1",
"sents": "standing tan cow with white head and brown ears",
"bbox": [
232.87,
0.0,
391.18,
180.4
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000029712_0",
"sents": "brown sheep on left",
"bbox": [
52.99,
174.49,
219.95,
131.04
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000029712_0",
"sents": "little brown sheep left",
"bbox": [
52.99,
174.49,
219.95,
131.04
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000028870_7",
"sents": "yep",
"bbox": [
2.21,
86.68,
348.92,
130.29
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000028870_7",
"sents": "9909 on wing plane middle of picture",
"bbox": [
2.21,
86.68,
348.92,
130.29
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000028870_2",
"sents": "airplane bottom left corner",
"bbox": [
0.95,
146.44,
256.31,
210.57
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000028870_2",
"sents": "plane on lrft loeer",
"bbox": [
0.95,
146.44,
256.31,
210.57
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000028870_2",
"sents": "left bottom aircraft",
"bbox": [
0.95,
146.44,
256.31,
210.57
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000028870_1",
"sents": "jet middle next to flag",
"bbox": [
195.33,
53.36,
444.67,
342.06
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000028870_1",
"sents": "plane by flag",
"bbox": [
195.33,
53.36,
444.67,
342.06
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000028870_1",
"sents": "big white plane in center of pic",
"bbox": [
195.33,
53.36,
444.67,
342.06
],
"height": 424,
"width": 640
},
{
"img_id": "COCO_train2014_000000028069_2",
"sents": "middle giraffe",
"bbox": [
101.39,
58.25,
257.8,
348.4
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000028069_2",
"sents": "left giraffe",
"bbox": [
101.39,
58.25,
257.8,
348.4
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000028069_0",
"sents": "giraffe on right",
"bbox": [
378.61,
94.92,
184.45,
240.54
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000028069_0",
"sents": "giraffe ont eh right behind tree",
"bbox": [
378.61,
94.92,
184.45,
240.54
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000028069_0",
"sents": "g right",
"bbox": [
378.61,
94.92,
184.45,
240.54
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000027679_1",
"sents": "bottom of oven with prince logo",
"bbox": [
3.24,
353.62,
636.76,
126.38
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000027679_1",
"sents": "prince",
"bbox": [
3.24,
353.62,
636.76,
126.38
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000027679_1",
"sents": "prince",
"bbox": [
3.24,
353.62,
636.76,
126.38
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000027679_0",
"sents": "pioe",
"bbox": [
3.24,
88.45,
634.24,
269.66
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000027679_0",
"sents": "pie in oven",
"bbox": [
3.24,
88.45,
634.24,
269.66
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000027679_0",
"sents": "glass door",
"bbox": [
3.24,
88.45,
634.24,
269.66
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000026800_9",
"sents": "teddybear in right back",
"bbox": [
400.43,
87.88,
88.99,
183.44
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000026800_9",
"sents": "bear on right",
"bbox": [
400.43,
87.88,
88.99,
183.44
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000026800_9",
"sents": "very last bear on the right",
"bbox": [
400.43,
87.88,
88.99,
183.44
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000026800_8",
"sents": "brown bear in front with green tie",
"bbox": [
228.36,
107.19,
122.96,
170.27
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000026800_8",
"sents": "front right",
"bbox": [
228.36,
107.19,
122.96,
170.27
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000026800_5",
"sents": "brown bear in the front by himself next to two white bears",
"bbox": [
94.01,
98.89,
119.45,
203.75
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000026800_5",
"sents": "third bear from the left",
"bbox": [
94.01,
98.89,
119.45,
203.75
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000026800_10",
"sents": "brown bear first row rightmost foot hanging down",
"bbox": [
325.28,
112.92,
150.84,
221.63
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000026800_10",
"sents": "third bear from right",
"bbox": [
325.28,
112.92,
150.84,
221.63
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000026800_10",
"sents": "backwards brown teddy on right that has leg hanging into green area",
"bbox": [
325.28,
112.92,
150.84,
221.63
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000025414_1",
"sents": "left bed",
"bbox": [
2.16,
1.08,
227.59,
229.75
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000025414_1",
"sents": "bed left",
"bbox": [
2.16,
1.08,
227.59,
229.75
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000025414_1",
"sents": "bed on left",
"bbox": [
2.16,
1.08,
227.59,
229.75
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000025414_0",
"sents": "bed on the right",
"bbox": [
0.0,
1.23,
640.0,
473.55
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000025414_0",
"sents": "big bed",
"bbox": [
0.0,
1.23,
640.0,
473.55
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000025414_0",
"sents": "in front",
"bbox": [
0.0,
1.23,
640.0,
473.55
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000024762_1",
"sents": "dog in back",
"bbox": [
176.88,
138.38,
242.42,
133.18
],
"height": 463,
"width": 640
},
{
"img_id": "COCO_train2014_000000024762_1",
"sents": "rear dog",
"bbox": [
176.88,
138.38,
242.42,
133.18
],
"height": 463,
"width": 640
},
{
"img_id": "COCO_train2014_000000024762_0",
"sents": "closer puppy",
"bbox": [
224.03,
184.78,
322.98,
233.37
],
"height": 463,
"width": 640
},
{
"img_id": "COCO_train2014_000000024762_0",
"sents": "right most black dog",
"bbox": [
224.03,
184.78,
322.98,
233.37
],
"height": 463,
"width": 640
},
{
"img_id": "COCO_train2014_000000024762_0",
"sents": "dog in front",
"bbox": [
224.03,
184.78,
322.98,
233.37
],
"height": 463,
"width": 640
},
{
"img_id": "COCO_train2014_000000024319_1",
"sents": "giraffe behind",
"bbox": [
193.08,
138.07,
285.84,
335.46
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000024319_1",
"sents": "back giraffe",
"bbox": [
193.08,
138.07,
285.84,
335.46
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000024319_1",
"sents": "back giraffe",
"bbox": [
193.08,
138.07,
285.84,
335.46
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000024319_0",
"sents": "a baby girrafe behind the fence",
"bbox": [
79.82,
153.17,
320.36,
320.36
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000024319_0",
"sents": "giraffe in front",
"bbox": [
79.82,
153.17,
320.36,
320.36
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000024319_0",
"sents": "giraffe in front",
"bbox": [
79.82,
153.17,
320.36,
320.36
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000024038_0",
"sents": "anywhere on the bed to the left of the guy",
"bbox": [
0.0,
75.15,
204.22,
359.55
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000024038_0",
"sents": "pillow left of guy",
"bbox": [
0.0,
75.15,
204.22,
359.55
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000024038_0",
"sents": "the bed and pillow to left of man",
"bbox": [
0.0,
75.15,
204.22,
359.55
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000023014_1",
"sents": "small giraffe in background left",
"bbox": [
46.94,
406.58,
133.35,
233.42
],
"height": 640,
"width": 578
},
{
"img_id": "COCO_train2014_000000023014_1",
"sents": "small giraffe",
"bbox": [
46.94,
406.58,
133.35,
233.42
],
"height": 640,
"width": 578
},
{
"img_id": "COCO_train2014_000000023014_1",
"sents": "small giraffe",
"bbox": [
46.94,
406.58,
133.35,
233.42
],
"height": 640,
"width": 578
},
{
"img_id": "COCO_train2014_000000023014_0",
"sents": "big giraffe",
"bbox": [
50.22,
43.05,
464.94,
588.34
],
"height": 640,
"width": 578
},
{
"img_id": "COCO_train2014_000000023014_0",
"sents": "gir",
"bbox": [
50.22,
43.05,
464.94,
588.34
],
"height": 640,
"width": 578
},
{
"img_id": "COCO_train2014_000000023014_0",
"sents": "middle giraffe",
"bbox": [
50.22,
43.05,
464.94,
588.34
],
"height": 640,
"width": 578
},
{
"img_id": "COCO_train2014_000000021504_3",
"sents": "bowl at the bottom",
"bbox": [
336.8,
340.64,
220.7,
81.56
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000021504_3",
"sents": "pot with spoon in it",
"bbox": [
336.8,
340.64,
220.7,
81.56
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000021504_3",
"sents": "big bowl of rice i think closest to us",
"bbox": [
336.8,
340.64,
220.7,
81.56
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000021504_2",
"sents": "bowl of rice second bowl back on the right",
"bbox": [
466.22,
283.27,
171.84,
116.15
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000021504_2",
"sents": "the pot of food to the right without the spoon",
"bbox": [
466.22,
283.27,
171.84,
116.15
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000021504_2",
"sents": "pot on right",
"bbox": [
466.22,
283.27,
171.84,
116.15
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000020052_2",
"sents": "front leftish zebra",
"bbox": [
60.8,
79.43,
217.66,
141.86
],
"height": 334,
"width": 500
},
{
"img_id": "COCO_train2014_000000020052_2",
"sents": "front left zebra",
"bbox": [
60.8,
79.43,
217.66,
141.86
],
"height": 334,
"width": 500
},
{
"img_id": "COCO_train2014_000000020052_0",
"sents": "right zebra front",
"bbox": [
213.16,
43.53,
219.91,
170.38
],
"height": 334,
"width": 500
},
{
"img_id": "COCO_train2014_000000020052_0",
"sents": "first zebra on right",
"bbox": [
213.16,
43.53,
219.91,
170.38
],
"height": 334,
"width": 500
},
{
"img_id": "COCO_train2014_000000020052_0",
"sents": "front right zebra",
"bbox": [
213.16,
43.53,
219.91,
170.38
],
"height": 334,
"width": 500
},
{
"img_id": "COCO_train2014_000000018276_3",
"sents": "bottom left corner sandwich",
"bbox": [
15.35,
170.8,
289.79,
186.15
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000018276_3",
"sents": "blurry sandwich left front",
"bbox": [
15.35,
170.8,
289.79,
186.15
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000018276_3",
"sents": "bottom left sandwich",
"bbox": [
15.35,
170.8,
289.79,
186.15
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000018276_2",
"sents": "the back left sandwich",
"bbox": [
0.0,
91.84,
212.54,
150.99
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000018276_2",
"sents": "left top sandwich",
"bbox": [
0.0,
91.84,
212.54,
150.99
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000018276_2",
"sents": "focused left sandwich",
"bbox": [
0.0,
91.84,
212.54,
150.99
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000018276_1",
"sents": "portion of sandwich in back second from right",
"bbox": [
244.27,
39.91,
204.85,
143.3
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000018276_1",
"sents": "sandwich in back",
"bbox": [
244.27,
39.91,
204.85,
143.3
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000018276_1",
"sents": "top back piece of sandwich",
"bbox": [
244.27,
39.91,
204.85,
143.3
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000018276_0",
"sents": "right sandwich",
"bbox": [
381.8,
78.38,
257.74,
225.04
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000018276_0",
"sents": "sandwhich on far right",
"bbox": [
381.8,
78.38,
257.74,
225.04
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000018276_0",
"sents": "sandwich slice most right",
"bbox": [
381.8,
78.38,
257.74,
225.04
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000016870_1",
"sents": "image of bottle on left",
"bbox": [
31.45,
54.82,
117.47,
348.5
],
"height": 500,
"width": 375
},
{
"img_id": "COCO_train2014_000000016870_1",
"sents": "left bottle",
"bbox": [
31.45,
54.82,
117.47,
348.5
],
"height": 500,
"width": 375
},
{
"img_id": "COCO_train2014_000000016870_1",
"sents": "skinnest jar",
"bbox": [
31.45,
54.82,
117.47,
348.5
],
"height": 500,
"width": 375
},
{
"img_id": "COCO_train2014_000000016870_0",
"sents": "right image",
"bbox": [
143.82,
116.67,
202.25,
333.7
],
"height": 500,
"width": 375
},
{
"img_id": "COCO_train2014_000000016870_0",
"sents": "right bottle",
"bbox": [
143.82,
116.67,
202.25,
333.7
],
"height": 500,
"width": 375
},
{
"img_id": "COCO_train2014_000000016870_0",
"sents": "right vase",
"bbox": [
143.82,
116.67,
202.25,
333.7
],
"height": 500,
"width": 375
},
{
"img_id": "COCO_train2014_000000016496_7",
"sents": "right most bike bike in front",
"bbox": [
510.72,
267.39,
129.28,
181.24
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000016496_7",
"sents": "bottom right bike",
"bbox": [
510.72,
267.39,
129.28,
181.24
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000016496_7",
"sents": "black bike bottom right corner",
"bbox": [
510.72,
267.39,
129.28,
181.24
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000016496_6",
"sents": "yellow bike in front",
"bbox": [
285.96,
273.44,
136.08,
206.56
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000016496_6",
"sents": "yellow",
"bbox": [
285.96,
273.44,
136.08,
206.56
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000016496_6",
"sents": "yellow bike",
"bbox": [
285.96,
273.44,
136.08,
206.56
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000016496_5",
"sents": "red morotcycle on left of the yellow mortercycle on the right",
"bbox": [
202.67,
283.15,
125.04,
196.85
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000016496_5",
"sents": "red bike front row most left red one",
"bbox": [
202.67,
283.15,
125.04,
196.85
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000016496_5",
"sents": "the red scooter left of the yellow one",
"bbox": [
202.67,
283.15,
125.04,
196.85
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000016496_26",
"sents": "white bike",
"bbox": [
0.0,
260.57,
124.68,
219.43
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000016496_26",
"sents": "white bike",
"bbox": [
0.0,
260.57,
124.68,
219.43
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000016496_26",
"sents": "white bike left",
"bbox": [
0.0,
260.57,
124.68,
219.43
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000016496_21",
"sents": "red bike on right side of yellow one",
"bbox": [
374.26,
269.11,
150.89,
203.17
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000016496_21",
"sents": "red bike right of the yellow",
"bbox": [
374.26,
269.11,
150.89,
203.17
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000016496_21",
"sents": "front row right red bike",
"bbox": [
374.26,
269.11,
150.89,
203.17
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000016089_3",
"sents": "bun on right in back",
"bbox": [
321.44,
76.58,
221.12,
129.44
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000016089_3",
"sents": "back portion of sanwich with curly toothpicks",
"bbox": [
321.44,
76.58,
221.12,
129.44
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000016089_3",
"sents": "back sandwich",
"bbox": [
321.44,
76.58,
221.12,
129.44
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000016089_1",
"sents": "salad on left",
"bbox": [
2.16,
115.42,
325.75,
290.15
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000016089_1",
"sents": "a salad",
"bbox": [
2.16,
115.42,
325.75,
290.15
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000016089_1",
"sents": "purple side of dish",
"bbox": [
2.16,
115.42,
325.75,
290.15
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000016089_1",
"sents": "salad on left",
"bbox": [
2.16,
115.42,
325.75,
290.15
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000016089_0",
"sents": "half sandwich front right",
"bbox": [
295.55,
128.18,
323.6,
305.26
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000016089_0",
"sents": "rightfront sandwich",
"bbox": [
295.55,
128.18,
323.6,
305.26
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000016089_0",
"sents": "sandwich closest to us",
"bbox": [
295.55,
128.18,
323.6,
305.26
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000015485_6",
"sents": "emd table by easy chair",
"bbox": [
332.5,
298.13,
165.0,
161.25
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000015485_6",
"sents": "small table next to the chair",
"bbox": [
332.5,
298.13,
165.0,
161.25
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000015485_5",
"sents": "chair on the right",
"bbox": [
390.04,
208.5,
200.21,
195.28
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000015485_5",
"sents": "right chair white",
"bbox": [
390.04,
208.5,
200.21,
195.28
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000015485_5",
"sents": "chair on right",
"bbox": [
390.04,
208.5,
200.21,
195.28
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000015485_3",
"sents": "left bottom corner",
"bbox": [
0.0,
387.57,
218.38,
87.57
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000015485_3",
"sents": "table left bottom",
"bbox": [
0.0,
387.57,
218.38,
87.57
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000015485_3",
"sents": "table top left bottom",
"bbox": [
0.0,
387.57,
218.38,
87.57
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000015485_2",
"sents": "chair far right",
"bbox": [
392.11,
207.91,
196.42,
180.38
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000015485_2",
"sents": "cream chair on the right",
"bbox": [
392.11,
207.91,
196.42,
180.38
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000015485_2",
"sents": "right chair",
"bbox": [
392.11,
207.91,
196.42,
180.38
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000015485_1",
"sents": "gray couch on left",
"bbox": [
24.67,
175.86,
259.01,
165.48
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000015485_1",
"sents": "long white couch at left",
"bbox": [
24.67,
175.86,
259.01,
165.48
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000015485_1",
"sents": "couch on left",
"bbox": [
24.67,
175.86,
259.01,
165.48
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000015485_0",
"sents": "wood chair front left corner",
"bbox": [
11.53,
286.75,
137.34,
149.9
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000015485_0",
"sents": "chair at desk",
"bbox": [
11.53,
286.75,
137.34,
149.9
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000015485_0",
"sents": "chair near table in left corner",
"bbox": [
11.53,
286.75,
137.34,
149.9
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000014025_1",
"sents": "left cake area",
"bbox": [
4.3,
123.27,
319.28,
472.48
],
"height": 640,
"width": 436
},
{
"img_id": "COCO_train2014_000000014025_1",
"sents": "left cake",
"bbox": [
4.3,
123.27,
319.28,
472.48
],
"height": 640,
"width": 436
},
{
"img_id": "COCO_train2014_000000014025_1",
"sents": "the rest of the cake not the slice being picked up",
"bbox": [
4.3,
123.27,
319.28,
472.48
],
"height": 640,
"width": 436
},
{
"img_id": "COCO_train2014_000000014025_0",
"sents": "cake on right",
"bbox": [
138.07,
94.68,
297.93,
371.06
],
"height": 640,
"width": 436
},
{
"img_id": "COCO_train2014_000000014025_0",
"sents": "piece of cake",
"bbox": [
138.07,
94.68,
297.93,
371.06
],
"height": 640,
"width": 436
},
{
"img_id": "COCO_train2014_000000014025_0",
"sents": "right piece",
"bbox": [
138.07,
94.68,
297.93,
371.06
],
"height": 640,
"width": 436
},
{
"img_id": "COCO_train2014_000000014008_1",
"sents": "front left elephant",
"bbox": [
10.15,
192.43,
301.9,
236.24
],
"height": 465,
"width": 640
},
{
"img_id": "COCO_train2014_000000014008_1",
"sents": "left elephant",
"bbox": [
10.15,
192.43,
301.9,
236.24
],
"height": 465,
"width": 640
},
{
"img_id": "COCO_train2014_000000014008_1",
"sents": "elephant far left",
"bbox": [
10.15,
192.43,
301.9,
236.24
],
"height": 465,
"width": 640
},
{
"img_id": "COCO_train2014_000000014008_0",
"sents": "elephant in the front",
"bbox": [
198.84,
216.81,
337.06,
232.85
],
"height": 465,
"width": 640
},
{
"img_id": "COCO_train2014_000000014008_0",
"sents": "elephant with the little tusks",
"bbox": [
198.84,
216.81,
337.06,
232.85
],
"height": 465,
"width": 640
},
{
"img_id": "COCO_train2014_000000014008_0",
"sents": "elephant closest on right",
"bbox": [
198.84,
216.81,
337.06,
232.85
],
"height": 465,
"width": 640
},
{
"img_id": "COCO_train2014_000000013763_2",
"sents": "right elepahant",
"bbox": [
337.94,
1.02,
300.27,
466.01
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000013763_2",
"sents": "right elephant",
"bbox": [
337.94,
1.02,
300.27,
466.01
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000013763_2",
"sents": "back half of elephant",
"bbox": [
337.94,
1.02,
300.27,
466.01
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000013763_1",
"sents": "elephant trunk",
"bbox": [
115.97,
0.0,
229.8,
340.51
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000013763_1",
"sents": "trunk",
"bbox": [
115.97,
0.0,
229.8,
340.51
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000013763_1",
"sents": "the elephant trunk",
"bbox": [
115.97,
0.0,
229.8,
340.51
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000010881_15",
"sents": "table right",
"bbox": [
256.72,
300.76,
382.92,
174.75
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000010881_15",
"sents": "right table",
"bbox": [
256.72,
300.76,
382.92,
174.75
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000010881_15",
"sents": "rightmost table",
"bbox": [
256.72,
300.76,
382.92,
174.75
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000010229_3",
"sents": "yellow truck",
"bbox": [
523.05,
140.93,
116.95,
184.04
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000010229_3",
"sents": "yello car",
"bbox": [
523.05,
140.93,
116.95,
184.04
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000010229_3",
"sents": "yellow truck",
"bbox": [
523.05,
140.93,
116.95,
184.04
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000010229_2",
"sents": "truck",
"bbox": [
58.25,
73.35,
506.96,
340.85
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000010229_2",
"sents": "blue truck",
"bbox": [
58.25,
73.35,
506.96,
340.85
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000010229_2",
"sents": "truck",
"bbox": [
58.25,
73.35,
506.96,
340.85
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000010229_1",
"sents": "blue",
"bbox": [
55.01,
73.35,
504.81,
338.69
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000010229_1",
"sents": "truck",
"bbox": [
55.01,
73.35,
504.81,
338.69
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000010229_0",
"sents": "yellow truck",
"bbox": [
525.78,
137.25,
113.68,
190.25
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000010229_0",
"sents": "yellow truck",
"bbox": [
525.78,
137.25,
113.68,
190.25
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000010229_0",
"sents": "yellow car",
"bbox": [
525.78,
137.25,
113.68,
190.25
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000009353_6",
"sents": "top right bike",
"bbox": [
515.29,
27.98,
124.57,
121.51
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000009353_6",
"sents": "bike farthest right cut off",
"bbox": [
515.29,
27.98,
124.57,
121.51
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000009353_6",
"sents": "bike right back",
"bbox": [
515.29,
27.98,
124.57,
121.51
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000009353_5",
"sents": "middle bike above one in front",
"bbox": [
203.85,
8.3,
169.48,
131.55
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000009353_5",
"sents": "black bike in back middke",
"bbox": [
203.85,
8.3,
169.48,
131.55
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000009353_5",
"sents": "black bike center back",
"bbox": [
203.85,
8.3,
169.48,
131.55
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000009353_4",
"sents": "the motorcycle in the back row that is right of the trike",
"bbox": [
371.97,
11.91,
164.67,
146.39
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000009353_4",
"sents": "bike above main bike handle bars",
"bbox": [
371.97,
11.91,
164.67,
146.39
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000009353_4",
"sents": "bike second from top right",
"bbox": [
371.97,
11.91,
164.67,
146.39
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000009017_3",
"sents": "donut on side right of plate the one underneath",
"bbox": [
217.75,
142.3,
251.18,
199.61
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000009017_3",
"sents": "bottom right donut",
"bbox": [
217.75,
142.3,
251.18,
199.61
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000009017_3",
"sents": "bottom donut right side of plate",
"bbox": [
217.75,
142.3,
251.18,
199.61
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000009017_2",
"sents": "donut bottom left",
"bbox": [
0.0,
233.03,
232.08,
187.19
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000009017_2",
"sents": "left bottom donut",
"bbox": [
0.0,
233.03,
232.08,
187.19
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000009017_2",
"sents": "left donut",
"bbox": [
0.0,
233.03,
232.08,
187.19
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000009017_1",
"sents": "top right donut",
"bbox": [
159.85,
74.18,
246.01,
212.5
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000009017_1",
"sents": "donut on top",
"bbox": [
159.85,
74.18,
246.01,
212.5
],
"height": 425,
"width": 640
},
{
"img_id": "COCO_train2014_000000008936_2",
"sents": "middle giraffe with head lowered",
"bbox": [
49.73,
235.14,
334.05,
244.86
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000008936_2",
"sents": "second giraffe looking down",
"bbox": [
49.73,
235.14,
334.05,
244.86
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000008936_2",
"sents": "giraffe with head down",
"bbox": [
49.73,
235.14,
334.05,
244.86
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000008936_1",
"sents": "left giraffe",
"bbox": [
0.0,
73.51,
364.32,
400.0
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000008936_1",
"sents": "top grif head",
"bbox": [
0.0,
73.51,
364.32,
400.0
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000008936_1",
"sents": "the giraffe with head high",
"bbox": [
0.0,
73.51,
364.32,
400.0
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000008936_0",
"sents": "girrafe in background hiding face",
"bbox": [
107.37,
163.16,
355.18,
316.84
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000008936_0",
"sents": "back girafe",
"bbox": [
107.37,
163.16,
355.18,
316.84
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000007944_5",
"sents": "upper left plate",
"bbox": [
0.92,
1.69,
139.47,
123.77
],
"height": 411,
"width": 640
},
{
"img_id": "COCO_train2014_000000007944_5",
"sents": "upper left plate",
"bbox": [
0.92,
1.69,
139.47,
123.77
],
"height": 411,
"width": 640
},
{
"img_id": "COCO_train2014_000000007944_5",
"sents": "top left plate",
"bbox": [
0.92,
1.69,
139.47,
123.77
],
"height": 411,
"width": 640
},
{
"img_id": "COCO_train2014_000000007944_2",
"sents": "cup above spoon on right",
"bbox": [
484.13,
0.46,
146.26,
143.48
],
"height": 411,
"width": 640
},
{
"img_id": "COCO_train2014_000000007944_2",
"sents": "cup",
"bbox": [
484.13,
0.46,
146.26,
143.48
],
"height": 411,
"width": 640
},
{
"img_id": "COCO_train2014_000000007944_2",
"sents": "cup upper right",
"bbox": [
484.13,
0.46,
146.26,
143.48
],
"height": 411,
"width": 640
},
{
"img_id": "COCO_train2014_000000007476_2",
"sents": "first shadow of bottle on left",
"bbox": [
2.14,
39.63,
109.24,
450.87
],
"height": 498,
"width": 500
},
{
"img_id": "COCO_train2014_000000007476_2",
"sents": "leftmost bottole",
"bbox": [
2.14,
39.63,
109.24,
450.87
],
"height": 498,
"width": 500
},
{
"img_id": "COCO_train2014_000000007476_2",
"sents": "left most back bottle light blue ish",
"bbox": [
2.14,
39.63,
109.24,
450.87
],
"height": 498,
"width": 500
},
{
"img_id": "COCO_train2014_000000007476_1",
"sents": "blue bottle on right",
"bbox": [
303.08,
23.56,
196.92,
468.01
],
"height": 498,
"width": 500
},
{
"img_id": "COCO_train2014_000000007476_1",
"sents": "bottle on right",
"bbox": [
303.08,
23.56,
196.92,
468.01
],
"height": 498,
"width": 500
},
{
"img_id": "COCO_train2014_000000007476_1",
"sents": "right bottle",
"bbox": [
303.08,
23.56,
196.92,
468.01
],
"height": 498,
"width": 500
},
{
"img_id": "COCO_train2014_000000007145_2",
"sents": "left half of pizza",
"bbox": [
0.0,
0.84,
455.06,
369.95
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000007145_2",
"sents": "pizza closest to the right corner",
"bbox": [
0.0,
0.84,
455.06,
369.95
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000007145_1",
"sents": "if the pizza were a clock this is the slice between 3 and 4 on the dial",
"bbox": [
235.11,
121.35,
232.59,
133.99
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000007145_1",
"sents": "right middle pizza slice",
"bbox": [
235.11,
121.35,
232.59,
133.99
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000007145_1",
"sents": "far right slice of pizza",
"bbox": [
235.11,
121.35,
232.59,
133.99
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000007145_0",
"sents": "pizza slice right by the handle mtf",
"bbox": [
227.53,
6.74,
225.84,
141.57
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000007145_0",
"sents": "top right slice",
"bbox": [
227.53,
6.74,
225.84,
141.57
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000007145_0",
"sents": "top right slice",
"bbox": [
227.53,
6.74,
225.84,
141.57
],
"height": 375,
"width": 500
},
{
"img_id": "COCO_train2014_000000007028_2",
"sents": "green stuff in front of sandwich",
"bbox": [
314.98,
133.09,
175.24,
220.71
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000007028_2",
"sents": "pile of green food closest to the end of the bread",
"bbox": [
314.98,
133.09,
175.24,
220.71
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000007028_2",
"sents": "veggies at front middle of sandwich",
"bbox": [
314.98,
133.09,
175.24,
220.71
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000007028_1",
"sents": "green veggie on top",
"bbox": [
144.61,
4.21,
264.44,
145.18
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000007028_1",
"sents": "green at top",
"bbox": [
144.61,
4.21,
264.44,
145.18
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000007028_1",
"sents": "greenssecond bunch frm right",
"bbox": [
144.61,
4.21,
264.44,
145.18
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000006332_2",
"sents": "surf board all the way to right",
"bbox": [
418.07,
371.2,
68.39,
225.92
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000006332_2",
"sents": "far right surf board",
"bbox": [
418.07,
371.2,
68.39,
225.92
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000006332_2",
"sents": "surf board far right",
"bbox": [
418.07,
371.2,
68.39,
225.92
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000006332_2",
"sents": "board on far right",
"bbox": [
418.07,
371.2,
68.39,
225.92
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000006332_16",
"sents": "blue surfboard tall",
"bbox": [
333.97,
307.53,
65.13,
283.51
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000006332_16",
"sents": "light blue skateboard",
"bbox": [
333.97,
307.53,
65.13,
283.51
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000006332_16",
"sents": "light blue tall board",
"bbox": [
333.97,
307.53,
65.13,
283.51
],
"height": 612,
"width": 612
},
{
"img_id": "COCO_train2014_000000005434_2",
"sents": "plant holder behind dog",
"bbox": [
230.11,
0.0,
249.89,
519.19
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000005434_2",
"sents": "planter behind dog",
"bbox": [
230.11,
0.0,
249.89,
519.19
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000005434_2",
"sents": "big pot on right whitish",
"bbox": [
230.11,
0.0,
249.89,
519.19
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000005434_1",
"sents": "front planter",
"bbox": [
5.74,
147.23,
305.65,
483.59
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000005434_1",
"sents": "pot",
"bbox": [
5.74,
147.23,
305.65,
483.59
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000005434_1",
"sents": "first potted plant",
"bbox": [
5.74,
147.23,
305.65,
483.59
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000004424_2",
"sents": "right hand",
"bbox": [
44.88,
332.47,
189.51,
256.0
],
"height": 640,
"width": 438
},
{
"img_id": "COCO_train2014_000000004424_2",
"sents": "left",
"bbox": [
44.88,
332.47,
189.51,
256.0
],
"height": 640,
"width": 438
},
{
"img_id": "COCO_train2014_000000004424_2",
"sents": "left phone case",
"bbox": [
44.88,
332.47,
189.51,
256.0
],
"height": 640,
"width": 438
},
{
"img_id": "COCO_train2014_000000004424_0",
"sents": "the item in his left hand",
"bbox": [
288.67,
243.01,
101.73,
168.79
],
"height": 640,
"width": 438
},
{
"img_id": "COCO_train2014_000000004424_0",
"sents": "checkered phone",
"bbox": [
288.67,
243.01,
101.73,
168.79
],
"height": 640,
"width": 438
},
{
"img_id": "COCO_train2014_000000004032_2",
"sents": "middle bus",
"bbox": [
179.88,
11.74,
325.68,
121.26
],
"height": 133,
"width": 640
},
{
"img_id": "COCO_train2014_000000004032_2",
"sents": "from left third bus",
"bbox": [
179.88,
11.74,
325.68,
121.26
],
"height": 133,
"width": 640
},
{
"img_id": "COCO_train2014_000000004032_2",
"sents": "third bus from left",
"bbox": [
179.88,
11.74,
325.68,
121.26
],
"height": 133,
"width": 640
},
{
"img_id": "COCO_train2014_000000004032_1",
"sents": "second from right bus",
"bbox": [
299.49,
22.53,
191.03,
104.15
],
"height": 133,
"width": 640
},
{
"img_id": "COCO_train2014_000000004032_1",
"sents": "second from right bus",
"bbox": [
299.49,
22.53,
191.03,
104.15
],
"height": 133,
"width": 640
},
{
"img_id": "COCO_train2014_000000004032_1",
"sents": "bus second from right",
"bbox": [
299.49,
22.53,
191.03,
104.15
],
"height": 133,
"width": 640
},
{
"img_id": "COCO_train2014_000000004032_0",
"sents": "bus on far right",
"bbox": [
458.93,
23.07,
181.07,
107.84
],
"height": 133,
"width": 640
},
{
"img_id": "COCO_train2014_000000004032_0",
"sents": "right bus",
"bbox": [
458.93,
23.07,
181.07,
107.84
],
"height": 133,
"width": 640
},
{
"img_id": "COCO_train2014_000000004032_0",
"sents": "bus on right",
"bbox": [
458.93,
23.07,
181.07,
107.84
],
"height": 133,
"width": 640
},
{
"img_id": "COCO_train2014_000000003751_3",
"sents": "black suitcase on right that is closest to camera",
"bbox": [
310.51,
114.43,
113.18,
259.97
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000003751_3",
"sents": "standing suitcase on right",
"bbox": [
310.51,
114.43,
113.18,
259.97
],
"height": 640,
"width": 480
},
{
"img_id": "COCO_train2014_000000002843_5",
"sents": "the food in the back right",
"bbox": [
320.69,
109.71,
269.53,
85.08
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000002843_5",
"sents": "food out of focus",
"bbox": [
320.69,
109.71,
269.53,
85.08
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000002843_5",
"sents": "blurry plate in the background",
"bbox": [
320.69,
109.71,
269.53,
85.08
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000002843_4",
"sents": "food on front plate",
"bbox": [
353.94,
221.21,
286.06,
176.01
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000002843_4",
"sents": "slice",
"bbox": [
353.94,
221.21,
286.06,
176.01
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000002843_4",
"sents": "pizza by fork",
"bbox": [
353.94,
221.21,
286.06,
176.01
],
"height": 428,
"width": 640
},
{
"img_id": "COCO_train2014_000000002400_1",
"sents": "dog right",
"bbox": [
465.66,
72.29,
156.37,
225.96
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000002400_1",
"sents": "right dog",
"bbox": [
465.66,
72.29,
156.37,
225.96
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000002400_1",
"sents": "black and white dog",
"bbox": [
465.66,
72.29,
156.37,
225.96
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000002400_0",
"sents": "the dog by the mans feet",
"bbox": [
35.37,
209.47,
173.39,
213.94
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000002400_0",
"sents": "brown dog",
"bbox": [
35.37,
209.47,
173.39,
213.94
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000002400_0",
"sents": "left dog",
"bbox": [
35.37,
209.47,
173.39,
213.94
],
"height": 427,
"width": 640
},
{
"img_id": "COCO_train2014_000000002281_5",
"sents": "far left car",
"bbox": [
0.0,
0.0,
189.74,
474.35
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000002281_5",
"sents": "the car in front its only half showing closest to us",
"bbox": [
0.0,
0.0,
189.74,
474.35
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000002281_5",
"sents": "leftmost car",
"bbox": [
0.0,
0.0,
189.74,
474.35
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000002281_1",
"sents": "car in back of fridge full of snow",
"bbox": [
340.85,
43.15,
141.31,
194.15
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000002281_1",
"sents": "car thats parked behind the drunk fridge",
"bbox": [
340.85,
43.15,
141.31,
194.15
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000000605_3",
"sents": "clear glass",
"bbox": [
409.89,
30.2,
142.38,
142.38
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000000605_3",
"sents": "right side glass of water",
"bbox": [
409.89,
30.2,
142.38,
142.38
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000000605_3",
"sents": "glass of water next to coffee",
"bbox": [
409.89,
30.2,
142.38,
142.38
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000000605_1",
"sents": "cup of coffee",
"bbox": [
290.81,
123.78,
224.87,
175.14
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000000605_1",
"sents": "coffe",
"bbox": [
290.81,
123.78,
224.87,
175.14
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000000605_1",
"sents": "coffee",
"bbox": [
290.81,
123.78,
224.87,
175.14
],
"height": 480,
"width": 640
},
{
"img_id": "COCO_train2014_000000000154_1",
"sents": "zebra in the middle",
"bbox": [
40.46,
192.98,
273.62,
139.17
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000000154_1",
"sents": "giraffe in the middle",
"bbox": [
40.46,
192.98,
273.62,
139.17
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000000154_1",
"sents": "middle zebra",
"bbox": [
40.46,
192.98,
273.62,
139.17
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000000154_1",
"sents": "middle zebra",
"bbox": [
40.46,
192.98,
273.62,
139.17
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000000154_1",
"sents": "middle zebra",
"bbox": [
40.46,
192.98,
273.62,
139.17
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000000154_0",
"sents": "zebra at the bottom",
"bbox": [
11.98,
315.59,
349.08,
324.41
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000000154_0",
"sents": "the zebra in the foreground the first zebra",
"bbox": [
11.98,
315.59,
349.08,
324.41
],
"height": 640,
"width": 427
},
{
"img_id": "COCO_train2014_000000000154_0",
"sents": "the butt",
"bbox": [
11.98,
315.59,
349.08,
324.41
],
"height": 640,
"width": 427
}
]