[{"id": 0, "image": "temp_image.png", "image_h": 2532, "image_w": 1170, "conversations": [{"from": "human", "value": "\nwhat you see "}], "box_x1y1x2y2": [[[446, 260, 1116, 443]]]}]