Upload folder using huggingface_hub

#2
by kimi000 - opened
This view is limited to 50 files because it contains too many changes. See the raw diff here.
Files changed (50) hide show
  1. .gitattributes +192 -0
  2. samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/README.md +16 -0
  3. samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/dataset.json +0 -0
  4. samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/dataset.jsonl +0 -0
  5. samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/detection_pool/done/sample_000001.json +16 -0
  6. samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/detection_pool/done/sample_000003.json +16 -0
  7. samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/detection_pool/done/sample_000004.json +16 -0
  8. samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/detection_pool/done/sample_000005.json +16 -0
  9. samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/detection_pool/done/sample_000006.json +16 -0
  10. samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/detection_pool/done/sample_000007.json +32 -0
  11. samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/detection_pool/done/sample_000008.json +16 -0
  12. samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/detection_pool/done/sample_000009.json +16 -0
  13. samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/detection_pool/done/sample_000010.json +16 -0
  14. samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/detection_pool/done/sample_000011.json +16 -0
  15. samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/emit_pool/done/sample_000001.json +4 -0
  16. samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/emit_pool/done/sample_000003.json +4 -0
  17. samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/emit_pool/done/sample_000004.json +4 -0
  18. samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/emit_pool/done/sample_000005.json +4 -0
  19. samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/emit_pool/done/sample_000006.json +4 -0
  20. samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/emit_pool/done/sample_000007.json +4 -0
  21. samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/emit_pool/done/sample_000008.json +4 -0
  22. samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/emit_pool/done/sample_000009.json +4 -0
  23. samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/emit_pool/done/sample_000010.json +4 -0
  24. samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/emit_pool/done/sample_000011.json +4 -0
  25. samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/plan_pool/done/sample_000001.json +14 -0
  26. samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/plan_pool/done/sample_000002.json +14 -0
  27. samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/plan_pool/done/sample_000003.json +14 -0
  28. samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/plan_pool/done/sample_000004.json +14 -0
  29. samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/plan_pool/done/sample_000005.json +14 -0
  30. samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/plan_pool/done/sample_000006.json +14 -0
  31. samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/plan_pool/done/sample_000007.json +14 -0
  32. samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/plan_pool/done/sample_000008.json +14 -0
  33. samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/plan_pool/done/sample_000009.json +14 -0
  34. samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/plan_pool/done/sample_000010.json +14 -0
  35. samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/plan_pool/done/sample_000011.json +14 -0
  36. samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/reference_pool/done/sample_000001.json +18 -0
  37. samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/reference_pool/done/sample_000003.json +18 -0
  38. samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/reference_pool/done/sample_000004.json +18 -0
  39. samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/reference_pool/done/sample_000005.json +18 -0
  40. samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/reference_pool/done/sample_000006.json +18 -0
  41. samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/reference_pool/done/sample_000007.json +18 -0
  42. samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/reference_pool/done/sample_000008.json +18 -0
  43. samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/reference_pool/done/sample_000009.json +18 -0
  44. samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/reference_pool/done/sample_000010.json +18 -0
  45. samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/reference_pool/done/sample_000011.json +18 -0
  46. samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/rows/sample_000001.json +164 -0
  47. samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/rows/sample_000003.json +164 -0
  48. samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/rows/sample_000004.json +173 -0
  49. samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/rows/sample_000005.json +302 -0
  50. samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/rows/sample_000006.json +311 -0
.gitattributes CHANGED
@@ -52,3 +52,195 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
52
  10samples/sample_0007/overlays/overlay_accepted.png filter=lfs diff=lfs merge=lfs -text
53
  10samples/sample_0007/overlays/overlay_intended.png filter=lfs diff=lfs merge=lfs -text
54
  10samples/sample_0007/overlays/overlay_measured.png filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
52
  10samples/sample_0007/overlays/overlay_accepted.png filter=lfs diff=lfs merge=lfs -text
53
  10samples/sample_0007/overlays/overlay_intended.png filter=lfs diff=lfs merge=lfs -text
54
  10samples/sample_0007/overlays/overlay_measured.png filter=lfs diff=lfs merge=lfs -text
55
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000001/bbox_overlay.png filter=lfs diff=lfs merge=lfs -text
56
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000001/crops/detect_refine_person_in_red_light.png filter=lfs diff=lfs merge=lfs -text
57
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000001/crops/detect_refine_red_illuminated_structure.png filter=lfs diff=lfs merge=lfs -text
58
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000001/crops/diversify_input_person_in_red_light.png filter=lfs diff=lfs merge=lfs -text
59
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000001/crops/diversify_input_red_illuminated_structure.png filter=lfs diff=lfs merge=lfs -text
60
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000001/main_image.png filter=lfs diff=lfs merge=lfs -text
61
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000001/references/ref_person_in_red_light.png filter=lfs diff=lfs merge=lfs -text
62
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000001/references/ref_red_illuminated_structure.png filter=lfs diff=lfs merge=lfs -text
63
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000002/crops/detect_refine_bright_blue_panel.png filter=lfs diff=lfs merge=lfs -text
64
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000002/crops/detect_refine_dark_door.png filter=lfs diff=lfs merge=lfs -text
65
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000002/crops/detect_refine_door_frame.png filter=lfs diff=lfs merge=lfs -text
66
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000002/crops/detect_refine_patterned_floor.png filter=lfs diff=lfs merge=lfs -text
67
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000002/crops/detect_refine_patterned_surface.png filter=lfs diff=lfs merge=lfs -text
68
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000002/crops/detect_refine_person_forming_heart.png filter=lfs diff=lfs merge=lfs -text
69
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000002/crops/detect_refine_person_holding_red_object.png filter=lfs diff=lfs merge=lfs -text
70
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000002/crops/detect_refine_person_manipulating_object.png filter=lfs diff=lfs merge=lfs -text
71
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000002/crops/detect_refine_rectangular_blue_screen.png filter=lfs diff=lfs merge=lfs -text
72
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000002/crops/detect_refine_textured_background.png filter=lfs diff=lfs merge=lfs -text
73
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000002/crops/detect_refine_textured_background_drapery.png filter=lfs diff=lfs merge=lfs -text
74
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000002/crops/detect_refine_textured_surface.png filter=lfs diff=lfs merge=lfs -text
75
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000002/crops/detect_refine_textured_table_cloth.png filter=lfs diff=lfs merge=lfs -text
76
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000002/crops/detect_refine_wooden_chair.png filter=lfs diff=lfs merge=lfs -text
77
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000002/crops/detect_refine_wooden_structure.png filter=lfs diff=lfs merge=lfs -text
78
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000002/main_image.png filter=lfs diff=lfs merge=lfs -text
79
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000003/bbox_overlay.png filter=lfs diff=lfs merge=lfs -text
80
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000003/crops/detect_refine_person_in_red_light.png filter=lfs diff=lfs merge=lfs -text
81
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000003/crops/detect_refine_red_illuminated_book.png filter=lfs diff=lfs merge=lfs -text
82
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000003/crops/detect_refine_shadowy_doorway.png filter=lfs diff=lfs merge=lfs -text
83
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000003/crops/diversify_input_person_in_red_light.png filter=lfs diff=lfs merge=lfs -text
84
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000003/crops/diversify_input_red_illuminated_book.png filter=lfs diff=lfs merge=lfs -text
85
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000003/crops/diversify_input_shadowy_doorway.png filter=lfs diff=lfs merge=lfs -text
86
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000003/main_image.png filter=lfs diff=lfs merge=lfs -text
87
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000003/references/ref_person_in_red_light.png filter=lfs diff=lfs merge=lfs -text
88
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000003/references/ref_red_illuminated_book.png filter=lfs diff=lfs merge=lfs -text
89
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000003/references/ref_shadowy_doorway.png filter=lfs diff=lfs merge=lfs -text
90
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000004/bbox_overlay.png filter=lfs diff=lfs merge=lfs -text
91
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000004/crops/detect_refine_draped_tarp.png filter=lfs diff=lfs merge=lfs -text
92
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000004/crops/detect_refine_painter_in_cap.png filter=lfs diff=lfs merge=lfs -text
93
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000004/crops/detect_refine_stacked_storage_boxes.png filter=lfs diff=lfs merge=lfs -text
94
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000004/crops/diversify_input_draped_tarp.png filter=lfs diff=lfs merge=lfs -text
95
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000004/main_image.png filter=lfs diff=lfs merge=lfs -text
96
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000004/references/ref_blue_light_source.png filter=lfs diff=lfs merge=lfs -text
97
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000004/references/ref_draped_tarp.png filter=lfs diff=lfs merge=lfs -text
98
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000004/references/ref_paint_roller.png filter=lfs diff=lfs merge=lfs -text
99
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000005/bbox_overlay.png filter=lfs diff=lfs merge=lfs -text
100
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000005/crops/detect_refine_cutlery_set.png filter=lfs diff=lfs merge=lfs -text
101
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000005/crops/detect_refine_person_in_jacket.png filter=lfs diff=lfs merge=lfs -text
102
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000005/crops/detect_refine_person_with_pan.png filter=lfs diff=lfs merge=lfs -text
103
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000005/crops/detect_refine_pizza_prep_hands.png filter=lfs diff=lfs merge=lfs -text
104
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000005/crops/detect_refine_wall_cabinet.png filter=lfs diff=lfs merge=lfs -text
105
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000005/crops/diversify_input_cutlery_set.png filter=lfs diff=lfs merge=lfs -text
106
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000005/crops/diversify_input_person_in_jacket.png filter=lfs diff=lfs merge=lfs -text
107
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000005/crops/diversify_input_person_with_pan.png filter=lfs diff=lfs merge=lfs -text
108
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000005/crops/diversify_input_pizza_prep_hands.png filter=lfs diff=lfs merge=lfs -text
109
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000005/crops/diversify_input_wall_cabinet.png filter=lfs diff=lfs merge=lfs -text
110
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000005/main_image.png filter=lfs diff=lfs merge=lfs -text
111
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000005/references/ref_cutlery_set.png filter=lfs diff=lfs merge=lfs -text
112
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000005/references/ref_person_in_jacket.png filter=lfs diff=lfs merge=lfs -text
113
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000005/references/ref_person_with_pan.png filter=lfs diff=lfs merge=lfs -text
114
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000005/references/ref_pizza_prep_hands.png filter=lfs diff=lfs merge=lfs -text
115
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000005/references/ref_salt_box.png filter=lfs diff=lfs merge=lfs -text
116
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000005/references/ref_wall_cabinet.png filter=lfs diff=lfs merge=lfs -text
117
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000006/bbox_overlay.png filter=lfs diff=lfs merge=lfs -text
118
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000006/crops/detect_refine_large_black_pot.png filter=lfs diff=lfs merge=lfs -text
119
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000006/crops/detect_refine_person_at_sink.png filter=lfs diff=lfs merge=lfs -text
120
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000006/crops/detect_refine_wooden_door.png filter=lfs diff=lfs merge=lfs -text
121
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000006/crops/diversify_input_large_black_pot.png filter=lfs diff=lfs merge=lfs -text
122
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000006/crops/diversify_input_person_at_sink.png filter=lfs diff=lfs merge=lfs -text
123
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000006/crops/diversify_input_sink_faucet.png filter=lfs diff=lfs merge=lfs -text
124
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000006/crops/diversify_input_wooden_door.png filter=lfs diff=lfs merge=lfs -text
125
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000006/main_image.png filter=lfs diff=lfs merge=lfs -text
126
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000006/references/ref_gas_stove.png filter=lfs diff=lfs merge=lfs -text
127
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000006/references/ref_large_black_pot.png filter=lfs diff=lfs merge=lfs -text
128
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000006/references/ref_person_at_sink.png filter=lfs diff=lfs merge=lfs -text
129
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000006/references/ref_silver_spoon.png filter=lfs diff=lfs merge=lfs -text
130
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000006/references/ref_sink_faucet.png filter=lfs diff=lfs merge=lfs -text
131
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000006/references/ref_water_pitcher.png filter=lfs diff=lfs merge=lfs -text
132
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000006/references/ref_wooden_door.png filter=lfs diff=lfs merge=lfs -text
133
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000006/references/ref_wrapped_cucumber.png filter=lfs diff=lfs merge=lfs -text
134
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000007/bbox_overlay.png filter=lfs diff=lfs merge=lfs -text
135
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000007/crops/detect_refine_backpack.png filter=lfs diff=lfs merge=lfs -text
136
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000007/crops/detect_refine_cable.png filter=lfs diff=lfs merge=lfs -text
137
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000007/crops/detect_refine_dark_area.png filter=lfs diff=lfs merge=lfs -text
138
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000007/crops/detect_refine_grid_patterned_floor.png filter=lfs diff=lfs merge=lfs -text
139
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000007/crops/detect_refine_shadowy_shape.png filter=lfs diff=lfs merge=lfs -text
140
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000007/crops/detect_refine_textured_fabric_area.png filter=lfs diff=lfs merge=lfs -text
141
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000007/crops/detect_refine_textured_surface.png filter=lfs diff=lfs merge=lfs -text
142
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000007/crops/detect_refine_typist.png filter=lfs diff=lfs merge=lfs -text
143
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000007/crops/diversify_input_backpack.png filter=lfs diff=lfs merge=lfs -text
144
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000007/crops/diversify_input_blue_lines.png filter=lfs diff=lfs merge=lfs -text
145
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000007/crops/diversify_input_cable.png filter=lfs diff=lfs merge=lfs -text
146
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000007/crops/diversify_input_dark_area.png filter=lfs diff=lfs merge=lfs -text
147
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000007/crops/diversify_input_grid_patterned_floor.png filter=lfs diff=lfs merge=lfs -text
148
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000007/crops/diversify_input_shadowy_shape.png filter=lfs diff=lfs merge=lfs -text
149
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000007/crops/diversify_input_textured_fabric_area.png filter=lfs diff=lfs merge=lfs -text
150
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000007/crops/diversify_input_textured_surface.png filter=lfs diff=lfs merge=lfs -text
151
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000007/crops/diversify_input_typist.png filter=lfs diff=lfs merge=lfs -text
152
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000007/main_image.png filter=lfs diff=lfs merge=lfs -text
153
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000007/references/ref_backpack.png filter=lfs diff=lfs merge=lfs -text
154
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000007/references/ref_blue_light.png filter=lfs diff=lfs merge=lfs -text
155
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000007/references/ref_blue_light_source.png filter=lfs diff=lfs merge=lfs -text
156
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000007/references/ref_blue_lines.png filter=lfs diff=lfs merge=lfs -text
157
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000007/references/ref_dark_area.png filter=lfs diff=lfs merge=lfs -text
158
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000007/references/ref_electronic_device.png filter=lfs diff=lfs merge=lfs -text
159
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000007/references/ref_grid_patterned_floor.png filter=lfs diff=lfs merge=lfs -text
160
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000007/references/ref_shadowy_shape.png filter=lfs diff=lfs merge=lfs -text
161
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000007/references/ref_small_blue_rectangle.png filter=lfs diff=lfs merge=lfs -text
162
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000007/references/ref_textured_fabric_area.png filter=lfs diff=lfs merge=lfs -text
163
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000007/references/ref_textured_surface.png filter=lfs diff=lfs merge=lfs -text
164
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000007/references/ref_thin_curved_object.png filter=lfs diff=lfs merge=lfs -text
165
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000007/references/ref_typist.png filter=lfs diff=lfs merge=lfs -text
166
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000008/bbox_overlay.png filter=lfs diff=lfs merge=lfs -text
167
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000008/crops/detect_refine_hands_holding_part.png filter=lfs diff=lfs merge=lfs -text
168
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000008/crops/detect_refine_hands_with_small_object.png filter=lfs diff=lfs merge=lfs -text
169
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000008/crops/detect_refine_helmeted_figure.png filter=lfs diff=lfs merge=lfs -text
170
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000008/crops/detect_refine_person_by_screens.png filter=lfs diff=lfs merge=lfs -text
171
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000008/crops/detect_refine_silhouette_with_phone.png filter=lfs diff=lfs merge=lfs -text
172
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000008/crops/diversify_input_hands_with_small_object.png filter=lfs diff=lfs merge=lfs -text
173
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000008/crops/diversify_input_hands_with_smoldering_tool.png filter=lfs diff=lfs merge=lfs -text
174
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000008/crops/diversify_input_helmeted_figure.png filter=lfs diff=lfs merge=lfs -text
175
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000008/crops/diversify_input_person_by_screens.png filter=lfs diff=lfs merge=lfs -text
176
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000008/crops/diversify_input_silhouette_with_phone.png filter=lfs diff=lfs merge=lfs -text
177
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000008/main_image.png filter=lfs diff=lfs merge=lfs -text
178
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000008/references/ref_blue_light_module.png filter=lfs diff=lfs merge=lfs -text
179
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000008/references/ref_hands_holding_part.png filter=lfs diff=lfs merge=lfs -text
180
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000008/references/ref_hands_passing_object.png filter=lfs diff=lfs merge=lfs -text
181
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000008/references/ref_hands_with_small_object.png filter=lfs diff=lfs merge=lfs -text
182
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000008/references/ref_hands_with_smoldering_tool.png filter=lfs diff=lfs merge=lfs -text
183
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000008/references/ref_helmeted_figure.png filter=lfs diff=lfs merge=lfs -text
184
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000008/references/ref_person_by_screens.png filter=lfs diff=lfs merge=lfs -text
185
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000008/references/ref_reaching_hands.png filter=lfs diff=lfs merge=lfs -text
186
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000008/references/ref_red_device.png filter=lfs diff=lfs merge=lfs -text
187
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000008/references/ref_silhouette_with_phone.png filter=lfs diff=lfs merge=lfs -text
188
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000009/bbox_overlay.png filter=lfs diff=lfs merge=lfs -text
189
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000009/crops/detect_refine_blue_cleaner_bottle.png filter=lfs diff=lfs merge=lfs -text
190
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000009/crops/detect_refine_person_washing_sink.png filter=lfs diff=lfs merge=lfs -text
191
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000009/crops/detect_refine_red_sink_mat.png filter=lfs diff=lfs merge=lfs -text
192
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000009/crops/detect_refine_silver_faucet.png filter=lfs diff=lfs merge=lfs -text
193
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000009/crops/detect_refine_yellow_dish_gloves.png filter=lfs diff=lfs merge=lfs -text
194
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000009/crops/diversify_input_blue_cleaner_bottle.png filter=lfs diff=lfs merge=lfs -text
195
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000009/crops/diversify_input_person_washing_sink.png filter=lfs diff=lfs merge=lfs -text
196
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000009/crops/diversify_input_red_sink_mat.png filter=lfs diff=lfs merge=lfs -text
197
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000009/crops/diversify_input_silver_faucet.png filter=lfs diff=lfs merge=lfs -text
198
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000009/crops/diversify_input_yellow_dish_gloves.png filter=lfs diff=lfs merge=lfs -text
199
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000009/main_image.png filter=lfs diff=lfs merge=lfs -text
200
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000009/references/ref_blue_cleaner_bottle.png filter=lfs diff=lfs merge=lfs -text
201
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000009/references/ref_person_washing_sink.png filter=lfs diff=lfs merge=lfs -text
202
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000009/references/ref_red_sink_mat.png filter=lfs diff=lfs merge=lfs -text
203
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000009/references/ref_silver_faucet.png filter=lfs diff=lfs merge=lfs -text
204
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000009/references/ref_yellow_dish_gloves.png filter=lfs diff=lfs merge=lfs -text
205
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000010/bbox_overlay.png filter=lfs diff=lfs merge=lfs -text
206
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000010/crops/detect_refine_hands_gesturing.png filter=lfs diff=lfs merge=lfs -text
207
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000010/crops/detect_refine_person_face_in_red_light.png filter=lfs diff=lfs merge=lfs -text
208
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000010/crops/detect_refine_person_holding_blue_flashlight.png filter=lfs diff=lfs merge=lfs -text
209
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000010/crops/detect_refine_person_reading_red_light.png filter=lfs diff=lfs merge=lfs -text
210
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000010/crops/detect_refine_person_standing_background.png filter=lfs diff=lfs merge=lfs -text
211
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000010/crops/diversify_input_hands_holding_triangular_object.png filter=lfs diff=lfs merge=lfs -text
212
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000010/crops/diversify_input_person_holding_blue_flashlight.png filter=lfs diff=lfs merge=lfs -text
213
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000010/crops/diversify_input_person_lying_reading_blue_light.png filter=lfs diff=lfs merge=lfs -text
214
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000010/crops/diversify_input_person_reading_red_light.png filter=lfs diff=lfs merge=lfs -text
215
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000010/crops/diversify_input_person_standing_background.png filter=lfs diff=lfs merge=lfs -text
216
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000010/main_image.png filter=lfs diff=lfs merge=lfs -text
217
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000010/references/ref_hands_gesturing.png filter=lfs diff=lfs merge=lfs -text
218
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000010/references/ref_hands_holding_small_object.png filter=lfs diff=lfs merge=lfs -text
219
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000010/references/ref_hands_holding_triangular_object.png filter=lfs diff=lfs merge=lfs -text
220
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000010/references/ref_person_face_in_red_light.png filter=lfs diff=lfs merge=lfs -text
221
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000010/references/ref_person_holding_blue_flashlight.png filter=lfs diff=lfs merge=lfs -text
222
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000010/references/ref_person_lying_reading_blue_light.png filter=lfs diff=lfs merge=lfs -text
223
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000010/references/ref_person_reading_red_light.png filter=lfs diff=lfs merge=lfs -text
224
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000010/references/ref_person_standing_background.png filter=lfs diff=lfs merge=lfs -text
225
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000010/references/ref_plastic_water_bottle.png filter=lfs diff=lfs merge=lfs -text
226
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000011/bbox_overlay.png filter=lfs diff=lfs merge=lfs -text
227
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000011/crops/detect_refine_granite_counter.png filter=lfs diff=lfs merge=lfs -text
228
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000011/crops/detect_refine_person_hands.png filter=lfs diff=lfs merge=lfs -text
229
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000011/crops/detect_refine_textured_mat.png filter=lfs diff=lfs merge=lfs -text
230
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000011/crops/detect_refine_wooden_cabinets.png filter=lfs diff=lfs merge=lfs -text
231
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000011/crops/diversify_input_granite_counter.png filter=lfs diff=lfs merge=lfs -text
232
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000011/crops/diversify_input_person_hands.png filter=lfs diff=lfs merge=lfs -text
233
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000011/crops/diversify_input_textured_mat.png filter=lfs diff=lfs merge=lfs -text
234
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000011/crops/diversify_input_wall_shelf.png filter=lfs diff=lfs merge=lfs -text
235
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000011/crops/diversify_input_wooden_cabinets.png filter=lfs diff=lfs merge=lfs -text
236
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000011/main_image.png filter=lfs diff=lfs merge=lfs -text
237
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000011/references/ref_box_grater.png filter=lfs diff=lfs merge=lfs -text
238
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000011/references/ref_dirty_plate.png filter=lfs diff=lfs merge=lfs -text
239
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000011/references/ref_glass_bottle.png filter=lfs diff=lfs merge=lfs -text
240
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000011/references/ref_granite_counter.png filter=lfs diff=lfs merge=lfs -text
241
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000011/references/ref_metal_tool.png filter=lfs diff=lfs merge=lfs -text
242
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000011/references/ref_person_hands.png filter=lfs diff=lfs merge=lfs -text
243
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000011/references/ref_striped_towel.png filter=lfs diff=lfs merge=lfs -text
244
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000011/references/ref_textured_mat.png filter=lfs diff=lfs merge=lfs -text
245
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000011/references/ref_wall_shelf.png filter=lfs diff=lfs merge=lfs -text
246
+ samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000011/references/ref_wooden_cabinets.png filter=lfs diff=lfs merge=lfs -text
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/README.md ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # samples_v8
2
+
3
+ Generated with `data_recipe_v8.md`: vocabulary-first planning, adaptive canvas selection, structured JSON compose prompts, no identity verification, no gate, SAM white-background reference postprocessing, and strict reference-completeness verification with regenerate-until-pass behavior.
4
+
5
+ - chat model: `gcp/google/gemini-3.1-pro-preview`
6
+ - image model: `gcp/google/gemini-3-pro-image-preview`
7
+ - people references: `white_bg_full_body_front`
8
+ - non-person references: `white_bg_encyclopedia_photo`
9
+ - SAM postprocess: every generated reference is segmented with `sam_vit_b` and pasted onto pure `#ffffff` background
10
+ - reference verify max attempts per subject: `10`
11
+ - allowed canvases: `[{"aspect_ratio": "1:1", "size": [1024, 1024], "style": "photorealistic"}, {"aspect_ratio": "4:3", "size": [1152, 864], "style": "photorealistic"}, {"aspect_ratio": "3:4", "size": [864, 1152], "style": "photorealistic"}, {"aspect_ratio": "3:2", "size": [1248, 832], "style": "photorealistic"}, {"aspect_ratio": "2:3", "size": [832, 1248], "style": "photorealistic"}, {"aspect_ratio": "16:9", "size": [1280, 720], "style": "photorealistic"}, {"aspect_ratio": "9:16", "size": [720, 1280], "style": "photorealistic"}]`
12
+ - scenario mode: `general`
13
+ - pools: `vocab_task_pool`, `plan_pool`, `scene_pool`, `detection_pool`, `reference_pool`
14
+ - bbox overlay: `bbox_overlay.png` draws every planned subject bbox; a sample is rejected and regenerated if any planned subject is still missing after VLM detection retries
15
+ - detection max attempts per subject: `3`
16
+ - launch args: `{"compose_workers": 3, "detect_max_attempts": 3, "detect_workers": 3, "emit_workers": 4, "idle_sleep": 1.0, "image_inflight": 32, "image_interval": 0.05, "image_max_retries": 8, "max_retries": 3, "no_topup": false, "plan_workers": 6, "ref_verify_max_attempts": 10, "reference_workers": 6, "requeue_in_progress": true, "seed": 1781927993, "status_interval": 30.0, "subject_detect_workers": 24, "target_samples": 10}`
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/dataset.json ADDED
The diff for this file is too large to render. See raw diff
 
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/dataset.jsonl ADDED
The diff for this file is too large to render. See raw diff
 
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/detection_pool/done/sample_000001.json ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "sample_id": "sample_000001",
3
+ "plan_path": "sample_000001/plan.json",
4
+ "task_path": "sample_000001/vocab_task.json",
5
+ "main_image": "sample_000001/main_image.png",
6
+ "detections": "sample_000001/detections.json",
7
+ "n_detected": 3,
8
+ "model_ids": {
9
+ "chat_model": "gcp/google/gemini-3.1-pro-preview",
10
+ "image_model": "gcp/google/gemini-3-pro-image-preview"
11
+ },
12
+ "item_id": "sample_000001",
13
+ "pool": "detection_pool",
14
+ "retry_count": 0,
15
+ "errors": []
16
+ }
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/detection_pool/done/sample_000003.json ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "sample_id": "sample_000003",
3
+ "plan_path": "sample_000003/plan.json",
4
+ "task_path": "sample_000003/vocab_task.json",
5
+ "main_image": "sample_000003/main_image.png",
6
+ "detections": "sample_000003/detections.json",
7
+ "n_detected": 3,
8
+ "model_ids": {
9
+ "chat_model": "gcp/google/gemini-3.1-pro-preview",
10
+ "image_model": "gcp/google/gemini-3-pro-image-preview"
11
+ },
12
+ "item_id": "sample_000003",
13
+ "pool": "detection_pool",
14
+ "retry_count": 0,
15
+ "errors": []
16
+ }
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/detection_pool/done/sample_000004.json ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "sample_id": "sample_000004",
3
+ "plan_path": "sample_000004/plan.json",
4
+ "task_path": "sample_000004/vocab_task.json",
5
+ "main_image": "sample_000004/main_image.png",
6
+ "detections": "sample_000004/detections.json",
7
+ "n_detected": 5,
8
+ "model_ids": {
9
+ "chat_model": "gcp/google/gemini-3.1-pro-preview",
10
+ "image_model": "gcp/google/gemini-3-pro-image-preview"
11
+ },
12
+ "item_id": "sample_000004",
13
+ "pool": "detection_pool",
14
+ "retry_count": 0,
15
+ "errors": []
16
+ }
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/detection_pool/done/sample_000005.json ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "sample_id": "sample_000005",
3
+ "plan_path": "sample_000005/plan.json",
4
+ "task_path": "sample_000005/vocab_task.json",
5
+ "main_image": "sample_000005/main_image.png",
6
+ "detections": "sample_000005/detections.json",
7
+ "n_detected": 6,
8
+ "model_ids": {
9
+ "chat_model": "gcp/google/gemini-3.1-pro-preview",
10
+ "image_model": "gcp/google/gemini-3-pro-image-preview"
11
+ },
12
+ "item_id": "sample_000005",
13
+ "pool": "detection_pool",
14
+ "retry_count": 0,
15
+ "errors": []
16
+ }
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/detection_pool/done/sample_000006.json ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "sample_id": "sample_000006",
3
+ "plan_path": "sample_000006/plan.json",
4
+ "task_path": "sample_000006/vocab_task.json",
5
+ "main_image": "sample_000006/main_image.png",
6
+ "detections": "sample_000006/detections.json",
7
+ "n_detected": 8,
8
+ "model_ids": {
9
+ "chat_model": "gcp/google/gemini-3.1-pro-preview",
10
+ "image_model": "gcp/google/gemini-3-pro-image-preview"
11
+ },
12
+ "item_id": "sample_000006",
13
+ "pool": "detection_pool",
14
+ "retry_count": 0,
15
+ "errors": []
16
+ }
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/detection_pool/done/sample_000007.json ADDED
@@ -0,0 +1,32 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "sample_id": "sample_000007",
3
+ "plan_path": "sample_000007/plan.json",
4
+ "task_path": "sample_000007/vocab_task.json",
5
+ "main_image": "sample_000007/main_image.png",
6
+ "detections": "sample_000007/detections.json",
7
+ "n_detected": 14,
8
+ "model_ids": {
9
+ "chat_model": "gcp/google/gemini-3.1-pro-preview",
10
+ "image_model": "gcp/google/gemini-3-pro-image-preview"
11
+ },
12
+ "item_id": "sample_000007",
13
+ "pool": "detection_pool",
14
+ "retry_count": 3,
15
+ "errors": [
16
+ {
17
+ "time": 1782260885.2187717,
18
+ "error": "RuntimeError: reference generation or verification failed for dark_area: RuntimeError: reference verification failed for dark_area after 10 attempts: Intended subject 'dark area' is entirely absent; Image shows a cardboard box instead of the requested subject",
19
+ "traceback": "Traceback (most recent call last):\n File \"/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/samples_v8/generate_samples_v8.py\", line 866, in generate_references\n references.append(helpers.diversify_subject(get_client(), sdir, main_image, subject, detection))\n ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n File \"/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/samples_v8/v8_helpers.py\", line 693, in diversify_subject\n raise RuntimeError(\nRuntimeError: reference verification failed for dark_area after 10 attempts: Intended subject 'dark area' is entirely absent; Image shows a cardboard box instead of the requested subject\n\nThe above exception was the direct cause of the following exception:\n\nTraceback (most recent call last):\n File \"/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/samples_v8/generate_samples_v8.py\", line 1020, in worker_loop\n handler(manifest)\n File \"/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/samples_v8/generate_samples_v8.py\", line 1113, in handler\n references, reference_errors = generate_references(sample_id, plan, detections)\n ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n File \"/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/samples_v8/generate_samples_v8.py\", line 871, in generate_references\n raise RuntimeError(f\"reference generation or verification failed for {name}: {errors[name]}\") from exc\nRuntimeError: reference generation or verification failed for dark_area: RuntimeError: reference verification failed for dark_area after 10 attempts: Intended subject 'dark area' is entirely absent; Image shows a cardboard box instead of the requested subject\n"
20
+ },
21
+ {
22
+ "time": 1782261302.7464893,
23
+ "error": "RuntimeError: reference generation or verification failed for dark_area: RuntimeError: reference verification failed for dark_area after 10 attempts: Intended subject is absent; image shows a cardboard box instead of a dark shadowed area.",
24
+ "traceback": "Traceback (most recent call last):\n File \"/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/samples_v8/generate_samples_v8.py\", line 866, in generate_references\n references.append(helpers.diversify_subject(get_client(), sdir, main_image, subject, detection))\n ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n File \"/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/samples_v8/v8_helpers.py\", line 693, in diversify_subject\n raise RuntimeError(\nRuntimeError: reference verification failed for dark_area after 10 attempts: Intended subject is absent; image shows a cardboard box instead of a dark shadowed area.\n\nThe above exception was the direct cause of the following exception:\n\nTraceback (most recent call last):\n File \"/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/samples_v8/generate_samples_v8.py\", line 1020, in worker_loop\n handler(manifest)\n File \"/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/samples_v8/generate_samples_v8.py\", line 1113, in handler\n references, reference_errors = generate_references(sample_id, plan, detections)\n ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n File \"/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/samples_v8/generate_samples_v8.py\", line 871, in generate_references\n raise RuntimeError(f\"reference generation or verification failed for {name}: {errors[name]}\") from exc\nRuntimeError: reference generation or verification failed for dark_area: RuntimeError: reference verification failed for dark_area after 10 attempts: Intended subject is absent; image shows a cardboard box instead of a dark shadowed area.\n"
25
+ },
26
+ {
27
+ "time": 1782261717.330226,
28
+ "error": "RuntimeError: reference generation or verification failed for dark_area: RuntimeError: reference verification failed for dark_area after 10 attempts: Intended subject 'dark_area' is absent.; Image shows a cardboard box instead of the requested subject.",
29
+ "traceback": "Traceback (most recent call last):\n File \"/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/samples_v8/generate_samples_v8.py\", line 866, in generate_references\n references.append(helpers.diversify_subject(get_client(), sdir, main_image, subject, detection))\n ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n File \"/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/samples_v8/v8_helpers.py\", line 693, in diversify_subject\n raise RuntimeError(\nRuntimeError: reference verification failed for dark_area after 10 attempts: Intended subject 'dark_area' is absent.; Image shows a cardboard box instead of the requested subject.\n\nThe above exception was the direct cause of the following exception:\n\nTraceback (most recent call last):\n File \"/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/samples_v8/generate_samples_v8.py\", line 1020, in worker_loop\n handler(manifest)\n File \"/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/samples_v8/generate_samples_v8.py\", line 1113, in handler\n references, reference_errors = generate_references(sample_id, plan, detections)\n ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n File \"/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/samples_v8/generate_samples_v8.py\", line 871, in generate_references\n raise RuntimeError(f\"reference generation or verification failed for {name}: {errors[name]}\") from exc\nRuntimeError: reference generation or verification failed for dark_area: RuntimeError: reference verification failed for dark_area after 10 attempts: Intended subject 'dark_area' is absent.; Image shows a cardboard box instead of the requested subject.\n"
30
+ }
31
+ ]
32
+ }
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/detection_pool/done/sample_000008.json ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "sample_id": "sample_000008",
3
+ "plan_path": "sample_000008/plan.json",
4
+ "task_path": "sample_000008/vocab_task.json",
5
+ "main_image": "sample_000008/main_image.png",
6
+ "detections": "sample_000008/detections.json",
7
+ "n_detected": 10,
8
+ "model_ids": {
9
+ "chat_model": "gcp/google/gemini-3.1-pro-preview",
10
+ "image_model": "gcp/google/gemini-3-pro-image-preview"
11
+ },
12
+ "item_id": "sample_000008",
13
+ "pool": "detection_pool",
14
+ "retry_count": 0,
15
+ "errors": []
16
+ }
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/detection_pool/done/sample_000009.json ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "sample_id": "sample_000009",
3
+ "plan_path": "sample_000009/plan.json",
4
+ "task_path": "sample_000009/vocab_task.json",
5
+ "main_image": "sample_000009/main_image.png",
6
+ "detections": "sample_000009/detections.json",
7
+ "n_detected": 5,
8
+ "model_ids": {
9
+ "chat_model": "gcp/google/gemini-3.1-pro-preview",
10
+ "image_model": "gcp/google/gemini-3-pro-image-preview"
11
+ },
12
+ "item_id": "sample_000009",
13
+ "pool": "detection_pool",
14
+ "retry_count": 0,
15
+ "errors": []
16
+ }
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/detection_pool/done/sample_000010.json ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "sample_id": "sample_000010",
3
+ "plan_path": "sample_000010/plan.json",
4
+ "task_path": "sample_000010/vocab_task.json",
5
+ "main_image": "sample_000010/main_image.png",
6
+ "detections": "sample_000010/detections.json",
7
+ "n_detected": 9,
8
+ "model_ids": {
9
+ "chat_model": "gcp/google/gemini-3.1-pro-preview",
10
+ "image_model": "gcp/google/gemini-3-pro-image-preview"
11
+ },
12
+ "item_id": "sample_000010",
13
+ "pool": "detection_pool",
14
+ "retry_count": 0,
15
+ "errors": []
16
+ }
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/detection_pool/done/sample_000011.json ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "sample_id": "sample_000011",
3
+ "plan_path": "sample_000011/plan.json",
4
+ "task_path": "sample_000011/vocab_task.json",
5
+ "main_image": "sample_000011/main_image.png",
6
+ "detections": "sample_000011/detections.json",
7
+ "n_detected": 10,
8
+ "model_ids": {
9
+ "chat_model": "gcp/google/gemini-3.1-pro-preview",
10
+ "image_model": "gcp/google/gemini-3-pro-image-preview"
11
+ },
12
+ "item_id": "sample_000011",
13
+ "pool": "detection_pool",
14
+ "retry_count": 0,
15
+ "errors": []
16
+ }
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/emit_pool/done/sample_000001.json ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ {
2
+ "sample_id": "sample_000001",
3
+ "row": "sample_000001/row.json"
4
+ }
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/emit_pool/done/sample_000003.json ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ {
2
+ "sample_id": "sample_000003",
3
+ "row": "sample_000003/row.json"
4
+ }
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/emit_pool/done/sample_000004.json ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ {
2
+ "sample_id": "sample_000004",
3
+ "row": "sample_000004/row.json"
4
+ }
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/emit_pool/done/sample_000005.json ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ {
2
+ "sample_id": "sample_000005",
3
+ "row": "sample_000005/row.json"
4
+ }
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/emit_pool/done/sample_000006.json ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ {
2
+ "sample_id": "sample_000006",
3
+ "row": "sample_000006/row.json"
4
+ }
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/emit_pool/done/sample_000007.json ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ {
2
+ "sample_id": "sample_000007",
3
+ "row": "sample_000007/row.json"
4
+ }
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/emit_pool/done/sample_000008.json ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ {
2
+ "sample_id": "sample_000008",
3
+ "row": "sample_000008/row.json"
4
+ }
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/emit_pool/done/sample_000009.json ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ {
2
+ "sample_id": "sample_000009",
3
+ "row": "sample_000009/row.json"
4
+ }
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/emit_pool/done/sample_000010.json ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ {
2
+ "sample_id": "sample_000010",
3
+ "row": "sample_000010/row.json"
4
+ }
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/emit_pool/done/sample_000011.json ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ {
2
+ "sample_id": "sample_000011",
3
+ "row": "sample_000011/row.json"
4
+ }
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/plan_pool/done/sample_000001.json ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "sample_id": "sample_000001",
3
+ "plan_path": "sample_000001/plan.json",
4
+ "task_path": "sample_000001/vocab_task.json",
5
+ "prompt_hash": "de111ef88cac721a573e1463080c7ef8f709ab3311c0be649576445c9637d6d5",
6
+ "model_ids": {
7
+ "chat_model": "gcp/google/gemini-3.1-pro-preview",
8
+ "image_model": "gcp/google/gemini-3-pro-image-preview"
9
+ },
10
+ "item_id": "sample_000001",
11
+ "pool": "plan_pool",
12
+ "retry_count": 0,
13
+ "errors": []
14
+ }
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/plan_pool/done/sample_000002.json ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "sample_id": "sample_000002",
3
+ "plan_path": "sample_000002/plan.json",
4
+ "task_path": "sample_000002/vocab_task.json",
5
+ "prompt_hash": "124ba3f0479caaeb5896d579dbace9891cca2fb6875690fdb3f66ee3524a7e9e",
6
+ "model_ids": {
7
+ "chat_model": "gcp/google/gemini-3.1-pro-preview",
8
+ "image_model": "gcp/google/gemini-3-pro-image-preview"
9
+ },
10
+ "item_id": "sample_000002",
11
+ "pool": "plan_pool",
12
+ "retry_count": 0,
13
+ "errors": []
14
+ }
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/plan_pool/done/sample_000003.json ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "sample_id": "sample_000003",
3
+ "plan_path": "sample_000003/plan.json",
4
+ "task_path": "sample_000003/vocab_task.json",
5
+ "prompt_hash": "63e951d22cadbf6e15b5fd08f5054b228df47fc857c4e48e47c23160da12a111",
6
+ "model_ids": {
7
+ "chat_model": "gcp/google/gemini-3.1-pro-preview",
8
+ "image_model": "gcp/google/gemini-3-pro-image-preview"
9
+ },
10
+ "item_id": "sample_000003",
11
+ "pool": "plan_pool",
12
+ "retry_count": 0,
13
+ "errors": []
14
+ }
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/plan_pool/done/sample_000004.json ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "sample_id": "sample_000004",
3
+ "plan_path": "sample_000004/plan.json",
4
+ "task_path": "sample_000004/vocab_task.json",
5
+ "prompt_hash": "3f5c74d4cad870d092def8f4466e975d281c99678ca962809503c5c456a06f49",
6
+ "model_ids": {
7
+ "chat_model": "gcp/google/gemini-3.1-pro-preview",
8
+ "image_model": "gcp/google/gemini-3-pro-image-preview"
9
+ },
10
+ "item_id": "sample_000004",
11
+ "pool": "plan_pool",
12
+ "retry_count": 0,
13
+ "errors": []
14
+ }
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/plan_pool/done/sample_000005.json ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "sample_id": "sample_000005",
3
+ "plan_path": "sample_000005/plan.json",
4
+ "task_path": "sample_000005/vocab_task.json",
5
+ "prompt_hash": "946054fe68ce2e3f63d85b3eddd1a3e63af4d647ef6dc47764d65eb13cf867f4",
6
+ "model_ids": {
7
+ "chat_model": "gcp/google/gemini-3.1-pro-preview",
8
+ "image_model": "gcp/google/gemini-3-pro-image-preview"
9
+ },
10
+ "item_id": "sample_000005",
11
+ "pool": "plan_pool",
12
+ "retry_count": 0,
13
+ "errors": []
14
+ }
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/plan_pool/done/sample_000006.json ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "sample_id": "sample_000006",
3
+ "plan_path": "sample_000006/plan.json",
4
+ "task_path": "sample_000006/vocab_task.json",
5
+ "prompt_hash": "006a1741e37f4e2fda0c82cbfbd7c6119932755e84be0002d17055a7af25bb79",
6
+ "model_ids": {
7
+ "chat_model": "gcp/google/gemini-3.1-pro-preview",
8
+ "image_model": "gcp/google/gemini-3-pro-image-preview"
9
+ },
10
+ "item_id": "sample_000006",
11
+ "pool": "plan_pool",
12
+ "retry_count": 0,
13
+ "errors": []
14
+ }
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/plan_pool/done/sample_000007.json ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "sample_id": "sample_000007",
3
+ "plan_path": "sample_000007/plan.json",
4
+ "task_path": "sample_000007/vocab_task.json",
5
+ "prompt_hash": "e999f398d25887be57aad833cb2b38dd0d1b370d4b6b6019fbde86bc6c809c69",
6
+ "model_ids": {
7
+ "chat_model": "gcp/google/gemini-3.1-pro-preview",
8
+ "image_model": "gcp/google/gemini-3-pro-image-preview"
9
+ },
10
+ "item_id": "sample_000007",
11
+ "pool": "plan_pool",
12
+ "retry_count": 0,
13
+ "errors": []
14
+ }
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/plan_pool/done/sample_000008.json ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "sample_id": "sample_000008",
3
+ "plan_path": "sample_000008/plan.json",
4
+ "task_path": "sample_000008/vocab_task.json",
5
+ "prompt_hash": "63aefc9a503e34719b1b91ec3397c9b92dc92ff7ce2c14e2c7bbe458bad64ba1",
6
+ "model_ids": {
7
+ "chat_model": "gcp/google/gemini-3.1-pro-preview",
8
+ "image_model": "gcp/google/gemini-3-pro-image-preview"
9
+ },
10
+ "item_id": "sample_000008",
11
+ "pool": "plan_pool",
12
+ "retry_count": 0,
13
+ "errors": []
14
+ }
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/plan_pool/done/sample_000009.json ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "sample_id": "sample_000009",
3
+ "plan_path": "sample_000009/plan.json",
4
+ "task_path": "sample_000009/vocab_task.json",
5
+ "prompt_hash": "929afc2e2f3cfd582eb2c6b53c41f60141480cb35a1ce251ed1752a6e98ba9ea",
6
+ "model_ids": {
7
+ "chat_model": "gcp/google/gemini-3.1-pro-preview",
8
+ "image_model": "gcp/google/gemini-3-pro-image-preview"
9
+ },
10
+ "item_id": "sample_000009",
11
+ "pool": "plan_pool",
12
+ "retry_count": 0,
13
+ "errors": []
14
+ }
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/plan_pool/done/sample_000010.json ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "sample_id": "sample_000010",
3
+ "plan_path": "sample_000010/plan.json",
4
+ "task_path": "sample_000010/vocab_task.json",
5
+ "prompt_hash": "74f4fe54dda8f633b152876c6b6433d4a90a0421304dd6db44bd84b9519110f8",
6
+ "model_ids": {
7
+ "chat_model": "gcp/google/gemini-3.1-pro-preview",
8
+ "image_model": "gcp/google/gemini-3-pro-image-preview"
9
+ },
10
+ "item_id": "sample_000010",
11
+ "pool": "plan_pool",
12
+ "retry_count": 0,
13
+ "errors": []
14
+ }
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/plan_pool/done/sample_000011.json ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "sample_id": "sample_000011",
3
+ "plan_path": "sample_000011/plan.json",
4
+ "task_path": "sample_000011/vocab_task.json",
5
+ "prompt_hash": "e6c24d29d9d4a97828419fab43954232185614106bdd1c11f6a196e5398eabbc",
6
+ "model_ids": {
7
+ "chat_model": "gcp/google/gemini-3.1-pro-preview",
8
+ "image_model": "gcp/google/gemini-3-pro-image-preview"
9
+ },
10
+ "item_id": "sample_000011",
11
+ "pool": "plan_pool",
12
+ "retry_count": 0,
13
+ "errors": []
14
+ }
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/reference_pool/done/sample_000001.json ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "sample_id": "sample_000001",
3
+ "plan_path": "sample_000001/plan.json",
4
+ "task_path": "sample_000001/vocab_task.json",
5
+ "main_image": "sample_000001/main_image.png",
6
+ "detections": "sample_000001/detections.json",
7
+ "references": "sample_000001/references.json",
8
+ "n_references": 3,
9
+ "reference_errors": {},
10
+ "model_ids": {
11
+ "chat_model": "gcp/google/gemini-3.1-pro-preview",
12
+ "image_model": "gcp/google/gemini-3-pro-image-preview"
13
+ },
14
+ "item_id": "sample_000001",
15
+ "pool": "reference_pool",
16
+ "retry_count": 0,
17
+ "errors": []
18
+ }
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/reference_pool/done/sample_000003.json ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "sample_id": "sample_000003",
3
+ "plan_path": "sample_000003/plan.json",
4
+ "task_path": "sample_000003/vocab_task.json",
5
+ "main_image": "sample_000003/main_image.png",
6
+ "detections": "sample_000003/detections.json",
7
+ "references": "sample_000003/references.json",
8
+ "n_references": 3,
9
+ "reference_errors": {},
10
+ "model_ids": {
11
+ "chat_model": "gcp/google/gemini-3.1-pro-preview",
12
+ "image_model": "gcp/google/gemini-3-pro-image-preview"
13
+ },
14
+ "item_id": "sample_000003",
15
+ "pool": "reference_pool",
16
+ "retry_count": 0,
17
+ "errors": []
18
+ }
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/reference_pool/done/sample_000004.json ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "sample_id": "sample_000004",
3
+ "plan_path": "sample_000004/plan.json",
4
+ "task_path": "sample_000004/vocab_task.json",
5
+ "main_image": "sample_000004/main_image.png",
6
+ "detections": "sample_000004/detections.json",
7
+ "references": "sample_000004/references.json",
8
+ "n_references": 3,
9
+ "reference_errors": {},
10
+ "model_ids": {
11
+ "chat_model": "gcp/google/gemini-3.1-pro-preview",
12
+ "image_model": "gcp/google/gemini-3-pro-image-preview"
13
+ },
14
+ "item_id": "sample_000004",
15
+ "pool": "reference_pool",
16
+ "retry_count": 0,
17
+ "errors": []
18
+ }
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/reference_pool/done/sample_000005.json ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "sample_id": "sample_000005",
3
+ "plan_path": "sample_000005/plan.json",
4
+ "task_path": "sample_000005/vocab_task.json",
5
+ "main_image": "sample_000005/main_image.png",
6
+ "detections": "sample_000005/detections.json",
7
+ "references": "sample_000005/references.json",
8
+ "n_references": 6,
9
+ "reference_errors": {},
10
+ "model_ids": {
11
+ "chat_model": "gcp/google/gemini-3.1-pro-preview",
12
+ "image_model": "gcp/google/gemini-3-pro-image-preview"
13
+ },
14
+ "item_id": "sample_000005",
15
+ "pool": "reference_pool",
16
+ "retry_count": 0,
17
+ "errors": []
18
+ }
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/reference_pool/done/sample_000006.json ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "sample_id": "sample_000006",
3
+ "plan_path": "sample_000006/plan.json",
4
+ "task_path": "sample_000006/vocab_task.json",
5
+ "main_image": "sample_000006/main_image.png",
6
+ "detections": "sample_000006/detections.json",
7
+ "references": "sample_000006/references.json",
8
+ "n_references": 8,
9
+ "reference_errors": {},
10
+ "model_ids": {
11
+ "chat_model": "gcp/google/gemini-3.1-pro-preview",
12
+ "image_model": "gcp/google/gemini-3-pro-image-preview"
13
+ },
14
+ "item_id": "sample_000006",
15
+ "pool": "reference_pool",
16
+ "retry_count": 0,
17
+ "errors": []
18
+ }
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/reference_pool/done/sample_000007.json ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "sample_id": "sample_000007",
3
+ "plan_path": "sample_000007/plan.json",
4
+ "task_path": "sample_000007/vocab_task.json",
5
+ "main_image": "sample_000007/main_image.png",
6
+ "detections": "sample_000007/detections.json",
7
+ "references": "sample_000007/references.json",
8
+ "n_references": 14,
9
+ "reference_errors": {},
10
+ "model_ids": {
11
+ "chat_model": "gcp/google/gemini-3.1-pro-preview",
12
+ "image_model": "gcp/google/gemini-3-pro-image-preview"
13
+ },
14
+ "item_id": "sample_000007",
15
+ "pool": "reference_pool",
16
+ "retry_count": 0,
17
+ "errors": []
18
+ }
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/reference_pool/done/sample_000008.json ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "sample_id": "sample_000008",
3
+ "plan_path": "sample_000008/plan.json",
4
+ "task_path": "sample_000008/vocab_task.json",
5
+ "main_image": "sample_000008/main_image.png",
6
+ "detections": "sample_000008/detections.json",
7
+ "references": "sample_000008/references.json",
8
+ "n_references": 10,
9
+ "reference_errors": {},
10
+ "model_ids": {
11
+ "chat_model": "gcp/google/gemini-3.1-pro-preview",
12
+ "image_model": "gcp/google/gemini-3-pro-image-preview"
13
+ },
14
+ "item_id": "sample_000008",
15
+ "pool": "reference_pool",
16
+ "retry_count": 0,
17
+ "errors": []
18
+ }
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/reference_pool/done/sample_000009.json ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "sample_id": "sample_000009",
3
+ "plan_path": "sample_000009/plan.json",
4
+ "task_path": "sample_000009/vocab_task.json",
5
+ "main_image": "sample_000009/main_image.png",
6
+ "detections": "sample_000009/detections.json",
7
+ "references": "sample_000009/references.json",
8
+ "n_references": 5,
9
+ "reference_errors": {},
10
+ "model_ids": {
11
+ "chat_model": "gcp/google/gemini-3.1-pro-preview",
12
+ "image_model": "gcp/google/gemini-3-pro-image-preview"
13
+ },
14
+ "item_id": "sample_000009",
15
+ "pool": "reference_pool",
16
+ "retry_count": 0,
17
+ "errors": []
18
+ }
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/reference_pool/done/sample_000010.json ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "sample_id": "sample_000010",
3
+ "plan_path": "sample_000010/plan.json",
4
+ "task_path": "sample_000010/vocab_task.json",
5
+ "main_image": "sample_000010/main_image.png",
6
+ "detections": "sample_000010/detections.json",
7
+ "references": "sample_000010/references.json",
8
+ "n_references": 9,
9
+ "reference_errors": {},
10
+ "model_ids": {
11
+ "chat_model": "gcp/google/gemini-3.1-pro-preview",
12
+ "image_model": "gcp/google/gemini-3-pro-image-preview"
13
+ },
14
+ "item_id": "sample_000010",
15
+ "pool": "reference_pool",
16
+ "retry_count": 0,
17
+ "errors": []
18
+ }
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/reference_pool/done/sample_000011.json ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "sample_id": "sample_000011",
3
+ "plan_path": "sample_000011/plan.json",
4
+ "task_path": "sample_000011/vocab_task.json",
5
+ "main_image": "sample_000011/main_image.png",
6
+ "detections": "sample_000011/detections.json",
7
+ "references": "sample_000011/references.json",
8
+ "n_references": 10,
9
+ "reference_errors": {},
10
+ "model_ids": {
11
+ "chat_model": "gcp/google/gemini-3.1-pro-preview",
12
+ "image_model": "gcp/google/gemini-3-pro-image-preview"
13
+ },
14
+ "item_id": "sample_000011",
15
+ "pool": "reference_pool",
16
+ "retry_count": 0,
17
+ "errors": []
18
+ }
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/rows/sample_000001.json ADDED
@@ -0,0 +1,164 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "sample_id": "sample_000001",
3
+ "target_total": 3,
4
+ "target_people": 1,
5
+ "target_objects": 2,
6
+ "canvas_size": [
7
+ 1248,
8
+ 832
9
+ ],
10
+ "canvas_aspect_ratio": "3:2",
11
+ "main_image": "main_image.png",
12
+ "bbox_overlay": "bbox_overlay.png",
13
+ "plan": "plan.json",
14
+ "detections": "detections.json",
15
+ "vocab_task": "vocab_task.json",
16
+ "n_planned": 3,
17
+ "n_detected": 3,
18
+ "n_subjects": 3,
19
+ "subjects": [
20
+ {
21
+ "name": "person_in_red_light",
22
+ "is_person": true,
23
+ "subject_type": "person",
24
+ "source_set": "people_set",
25
+ "source_image_id": "Ego4D:ego4d_video/EGO_76251.npy:person:0",
26
+ "source_name": "person",
27
+ "source_description": "Visible by their hands, which are illuminated in bright red light, holding a small object. Source dataset: Ego4D. Scene context: A person's hands are visible in a dark setting, illuminated by a red light, holding and interacting with a small dark object.",
28
+ "sub_caption": "person: A person, prominently visible by their hands and forearms which are bathed in bright red light, holding and interacting with a small dark electronic object.. Scene role: Operating the small device in the foreground",
29
+ "measured_bbox": [
30
+ 0.301,
31
+ 0.039,
32
+ 0.714,
33
+ 0.98
34
+ ],
35
+ "detection_confidence": 0.95,
36
+ "ref_style": "white_bg_full_body_front",
37
+ "ref_image": "references/ref_person_in_red_light.png",
38
+ "raw_ref_image": "references/raw_ref_person_in_red_light_attempt_01.png",
39
+ "reference_verify": "references/reference_verify_person_in_red_light.json",
40
+ "reference_verify_passed": true,
41
+ "reference_attempts": 1,
42
+ "sam_white_bg": {
43
+ "input": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/chaos/samples/sample_000001/references/raw_ref_person_in_red_light_attempt_01.png",
44
+ "output": "references/ref_person_in_red_light.png",
45
+ "mask": "references/sam_mask_person_in_red_light.png",
46
+ "sam_checkpoint": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/checkpoints/sam/sam_vit_b_01ec64.pth",
47
+ "sam_model_type": "vit_b",
48
+ "sam_device": "auto",
49
+ "sam_working_size": [
50
+ 640,
51
+ 640
52
+ ],
53
+ "sam_max_side": 640,
54
+ "sam_downscale": 0.625,
55
+ "prompt_box_xyxy": [
56
+ 324.0,
57
+ 26.0,
58
+ 699.0,
59
+ 1013.0
60
+ ],
61
+ "mask_score": 3.392402,
62
+ "mask_area_ratio": 0.165197,
63
+ "elapsed_seconds": 53.7174
64
+ }
65
+ },
66
+ {
67
+ "name": "red_illuminated_structure",
68
+ "is_person": false,
69
+ "subject_type": "object",
70
+ "source_set": "obj_set",
71
+ "source_image_id": "Ego4D:ego4d_video/EGO_2029.npy:object:1",
72
+ "source_name": "red illuminated structure",
73
+ "source_description": "A structure on the right side of the image, possibly a wall or barricade, strongly illuminated with red light, featuring a grid-like or textured pattern. Source dataset: Ego4D. Scene context: A dark, possibly outdoor or poorly lit indoor area illuminated by strong blue and red artificial lights.",
74
+ "sub_caption": "red illuminated structure: A sturdy wall or barricade-like structure featuring a textured, grid-like pattern, strongly illuminated by deep red ambient light.. Scene role: Forms the textured, atmospheric background behind the person",
75
+ "measured_bbox": [
76
+ 0.6096,
77
+ 0.0,
78
+ 0.9961,
79
+ 0.991
80
+ ],
81
+ "detection_confidence": "high",
82
+ "ref_style": "white_bg_encyclopedia_photo",
83
+ "ref_image": "references/ref_red_illuminated_structure.png",
84
+ "raw_ref_image": "references/raw_ref_red_illuminated_structure_attempt_01.png",
85
+ "reference_verify": "references/reference_verify_red_illuminated_structure.json",
86
+ "reference_verify_passed": true,
87
+ "reference_attempts": 1,
88
+ "sam_white_bg": {
89
+ "input": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/chaos/samples/sample_000001/references/raw_ref_red_illuminated_structure_attempt_01.png",
90
+ "output": "references/ref_red_illuminated_structure.png",
91
+ "mask": "references/sam_mask_red_illuminated_structure.png",
92
+ "sam_checkpoint": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/checkpoints/sam/sam_vit_b_01ec64.pth",
93
+ "sam_model_type": "vit_b",
94
+ "sam_device": "auto",
95
+ "sam_working_size": [
96
+ 640,
97
+ 640
98
+ ],
99
+ "sam_max_side": 640,
100
+ "sam_downscale": 0.625,
101
+ "prompt_box_xyxy": [
102
+ 0.0,
103
+ 0.0,
104
+ 1023.0,
105
+ 1023.0
106
+ ],
107
+ "mask_score": 1.966617,
108
+ "mask_area_ratio": 0.597257,
109
+ "elapsed_seconds": 10.2671
110
+ }
111
+ },
112
+ {
113
+ "name": "green_indicator_light",
114
+ "is_person": false,
115
+ "subject_type": "object",
116
+ "source_set": "obj_set",
117
+ "source_image_id": "Ego4D:ego4d_video/EGO_294886.npy:object:1",
118
+ "source_name": "green light",
119
+ "source_description": "Small, bright green glowing indicator light, possibly an LED, located on the dark structure. Source dataset: Ego4D. Scene context: An extremely dark scene with only a faint silhouette of an object and a small green indicator light visible.",
120
+ "sub_caption": "green light: A small, bright green glowing LED indicator light piercing through the darkness.. Scene role: Glowing on a dark piece of equipment beside the person, contrasting sharply with the dominant red lighting",
121
+ "measured_bbox": [
122
+ 0.1227,
123
+ 0.438,
124
+ 0.1605,
125
+ 0.4975
126
+ ],
127
+ "detection_confidence": 0.95,
128
+ "ref_style": "white_bg_encyclopedia_photo",
129
+ "ref_image": "references/ref_green_indicator_light.png",
130
+ "raw_ref_image": "references/raw_ref_green_indicator_light_attempt_01.png",
131
+ "reference_verify": "references/reference_verify_green_indicator_light.json",
132
+ "reference_verify_passed": true,
133
+ "reference_attempts": 1,
134
+ "sam_white_bg": {
135
+ "input": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/chaos/samples/sample_000001/references/raw_ref_green_indicator_light_attempt_01.png",
136
+ "output": "references/ref_green_indicator_light.png",
137
+ "mask": "references/sam_mask_green_indicator_light.png",
138
+ "sam_checkpoint": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/checkpoints/sam/sam_vit_b_01ec64.pth",
139
+ "sam_model_type": "vit_b",
140
+ "sam_device": "auto",
141
+ "sam_working_size": [
142
+ 640,
143
+ 640
144
+ ],
145
+ "sam_max_side": 640,
146
+ "sam_downscale": 0.625,
147
+ "prompt_box_xyxy": [
148
+ 347.0,
149
+ 335.0,
150
+ 676.0,
151
+ 688.0
152
+ ],
153
+ "mask_score": 3.439631,
154
+ "mask_area_ratio": 0.059673,
155
+ "elapsed_seconds": 10.1365
156
+ }
157
+ }
158
+ ],
159
+ "not_emitted": [],
160
+ "model_ids": {
161
+ "chat_model": "gcp/google/gemini-3.1-pro-preview",
162
+ "image_model": "gcp/google/gemini-3-pro-image-preview"
163
+ }
164
+ }
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/rows/sample_000003.json ADDED
@@ -0,0 +1,164 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "sample_id": "sample_000003",
3
+ "target_total": 3,
4
+ "target_people": 1,
5
+ "target_objects": 2,
6
+ "canvas_size": [
7
+ 1152,
8
+ 864
9
+ ],
10
+ "canvas_aspect_ratio": "4:3",
11
+ "main_image": "main_image.png",
12
+ "bbox_overlay": "bbox_overlay.png",
13
+ "plan": "plan.json",
14
+ "detections": "detections.json",
15
+ "vocab_task": "vocab_task.json",
16
+ "n_planned": 3,
17
+ "n_detected": 3,
18
+ "n_subjects": 3,
19
+ "subjects": [
20
+ {
21
+ "name": "person_in_red_light",
22
+ "is_person": true,
23
+ "subject_type": "person",
24
+ "source_set": "people_set",
25
+ "source_image_id": "Ego4D:ego4d_video/EGO_135381.npy:person:0",
26
+ "source_name": "person",
27
+ "source_description": "Visible hands and arms of a person in a dark setting, illuminated by red light, interacting with objects. Source dataset: Ego4D. Scene context: A close-up view of a person's hands and arms interacting with objects in a dark setting, illuminated by red and white light.",
28
+ "sub_caption": "person: Visible hands and lower arms, dramatically illuminated by a deep red light, emerging from the dark surroundings.. Scene role: Interacting with the open book, fingers lightly resting on the visible pages.",
29
+ "measured_bbox": [
30
+ 0.0,
31
+ 0.0,
32
+ 0.5655,
33
+ 1.0
34
+ ],
35
+ "detection_confidence": 0.9,
36
+ "ref_style": "white_bg_full_body_front",
37
+ "ref_image": "references/ref_person_in_red_light.png",
38
+ "raw_ref_image": "references/raw_ref_person_in_red_light_attempt_01.png",
39
+ "reference_verify": "references/reference_verify_person_in_red_light.json",
40
+ "reference_verify_passed": true,
41
+ "reference_attempts": 1,
42
+ "sam_white_bg": {
43
+ "input": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/chaos/samples/sample_000003/references/raw_ref_person_in_red_light_attempt_01.png",
44
+ "output": "references/ref_person_in_red_light.png",
45
+ "mask": "references/sam_mask_person_in_red_light.png",
46
+ "sam_checkpoint": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/checkpoints/sam/sam_vit_b_01ec64.pth",
47
+ "sam_model_type": "vit_b",
48
+ "sam_device": "auto",
49
+ "sam_working_size": [
50
+ 640,
51
+ 640
52
+ ],
53
+ "sam_max_side": 640,
54
+ "sam_downscale": 0.625,
55
+ "prompt_box_xyxy": [
56
+ 351.0,
57
+ 54.0,
58
+ 667.0,
59
+ 1015.0
60
+ ],
61
+ "mask_score": 3.471897,
62
+ "mask_area_ratio": 0.134706,
63
+ "elapsed_seconds": 8.8737
64
+ }
65
+ },
66
+ {
67
+ "name": "red_illuminated_book",
68
+ "is_person": false,
69
+ "subject_type": "object",
70
+ "source_set": "obj_set",
71
+ "source_image_id": "Ego4D:ego4d_video/EGO_236888.npy:object:0",
72
+ "source_name": "book",
73
+ "source_description": "An open book with pages visible, illuminated in a red hue, showing text and some graphical elements. Source dataset: Ego4D. Scene context: A dimly lit scene showing an open book, illuminated by a red light, being held or resting in the darkness.",
74
+ "sub_caption": "book: A large, open book with visible pages and faint layout elements, cast in a striking red hue from an overhead light source.. Scene role: Lying open flat on the surface directly beneath the person's hands.",
75
+ "measured_bbox": [
76
+ 0.2245,
77
+ 0.3971,
78
+ 0.6708,
79
+ 0.6724
80
+ ],
81
+ "detection_confidence": 0.98,
82
+ "ref_style": "white_bg_encyclopedia_photo",
83
+ "ref_image": "references/ref_red_illuminated_book.png",
84
+ "raw_ref_image": "references/raw_ref_red_illuminated_book_attempt_01.png",
85
+ "reference_verify": "references/reference_verify_red_illuminated_book.json",
86
+ "reference_verify_passed": true,
87
+ "reference_attempts": 1,
88
+ "sam_white_bg": {
89
+ "input": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/chaos/samples/sample_000003/references/raw_ref_red_illuminated_book_attempt_01.png",
90
+ "output": "references/ref_red_illuminated_book.png",
91
+ "mask": "references/sam_mask_red_illuminated_book.png",
92
+ "sam_checkpoint": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/checkpoints/sam/sam_vit_b_01ec64.pth",
93
+ "sam_model_type": "vit_b",
94
+ "sam_device": "auto",
95
+ "sam_working_size": [
96
+ 640,
97
+ 640
98
+ ],
99
+ "sam_max_side": 640,
100
+ "sam_downscale": 0.625,
101
+ "prompt_box_xyxy": [
102
+ 22.0,
103
+ 180.0,
104
+ 1002.0,
105
+ 858.0
106
+ ],
107
+ "mask_score": 3.463648,
108
+ "mask_area_ratio": 0.502075,
109
+ "elapsed_seconds": 7.3171
110
+ }
111
+ },
112
+ {
113
+ "name": "shadowy_doorway",
114
+ "is_person": false,
115
+ "subject_type": "object",
116
+ "source_set": "obj_set",
117
+ "source_image_id": "Ego4D:ego4d_video/EGO_311165.npy:object:2",
118
+ "source_name": "doorway or opening",
119
+ "source_description": "A darker, arched or rectangular shape on the wall, suggesting an opening to another area. Source dataset: Ego4D. Scene context: A very dark, low-resolution scene indoors, mostly obscured by shadow with some faint brownish light indicating walls or structures.",
120
+ "sub_caption": "doorway or opening: A dark, arched doorway outline set into a shadowy, indistinct wall, suggesting a passage to another dark room.. Scene role: Positioned in the out-of-focus background to establish architectural depth behind the main illuminated desk area.",
121
+ "measured_bbox": [
122
+ 0.5153,
123
+ 0.0267,
124
+ 0.8188,
125
+ 0.8345
126
+ ],
127
+ "detection_confidence": 0.9,
128
+ "ref_style": "white_bg_encyclopedia_photo",
129
+ "ref_image": "references/ref_shadowy_doorway.png",
130
+ "raw_ref_image": "references/raw_ref_shadowy_doorway_attempt_01.png",
131
+ "reference_verify": "references/reference_verify_shadowy_doorway.json",
132
+ "reference_verify_passed": true,
133
+ "reference_attempts": 1,
134
+ "sam_white_bg": {
135
+ "input": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/chaos/samples/sample_000003/references/raw_ref_shadowy_doorway_attempt_01.png",
136
+ "output": "references/ref_shadowy_doorway.png",
137
+ "mask": "references/sam_mask_shadowy_doorway.png",
138
+ "sam_checkpoint": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/checkpoints/sam/sam_vit_b_01ec64.pth",
139
+ "sam_model_type": "vit_b",
140
+ "sam_device": "auto",
141
+ "sam_working_size": [
142
+ 640,
143
+ 640
144
+ ],
145
+ "sam_max_side": 640,
146
+ "sam_downscale": 0.625,
147
+ "prompt_box_xyxy": [
148
+ 141.0,
149
+ 11.0,
150
+ 899.0,
151
+ 969.0
152
+ ],
153
+ "mask_score": 3.471354,
154
+ "mask_area_ratio": 0.542183,
155
+ "elapsed_seconds": 7.2941
156
+ }
157
+ }
158
+ ],
159
+ "not_emitted": [],
160
+ "model_ids": {
161
+ "chat_model": "gcp/google/gemini-3.1-pro-preview",
162
+ "image_model": "gcp/google/gemini-3-pro-image-preview"
163
+ }
164
+ }
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/rows/sample_000004.json ADDED
@@ -0,0 +1,173 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "sample_id": "sample_000004",
3
+ "target_total": 5,
4
+ "target_people": 1,
5
+ "target_objects": 4,
6
+ "canvas_size": [
7
+ 864,
8
+ 1152
9
+ ],
10
+ "canvas_aspect_ratio": "3:4",
11
+ "main_image": "main_image.png",
12
+ "bbox_overlay": "bbox_overlay.png",
13
+ "plan": "plan.json",
14
+ "detections": "detections.json",
15
+ "vocab_task": "vocab_task.json",
16
+ "n_planned": 5,
17
+ "n_detected": 5,
18
+ "n_subjects": 3,
19
+ "subjects": [
20
+ {
21
+ "name": "blue_light_source",
22
+ "is_person": false,
23
+ "subject_type": "object",
24
+ "source_set": "obj_set",
25
+ "source_image_id": "Ego4D:ego4d_video/EGO_98001.npy:object:0",
26
+ "source_name": "blue light source",
27
+ "source_description": "A small, blurry blue light, appearing as a faint glow against the dark background. Source dataset: Ego4D. Scene context: A predominantly dark scene with a single, small, indistinct blue light source visible towards the right side.",
28
+ "sub_caption": "blue light source: A small, blurry blue light emitting a faint, cool glow against the darkness.. Scene role: Positioned in the deep background to the left, providing an atmospheric back-light and contrasting with the red lighting.",
29
+ "measured_bbox": [
30
+ 0.5155,
31
+ 0.3724,
32
+ 0.553,
33
+ 0.4239
34
+ ],
35
+ "detection_confidence": "high",
36
+ "ref_style": "white_bg_encyclopedia_photo",
37
+ "ref_image": "references/ref_blue_light_source.png",
38
+ "raw_ref_image": "references/raw_ref_blue_light_source_attempt_01.png",
39
+ "reference_verify": "references/reference_verify_blue_light_source.json",
40
+ "reference_verify_passed": true,
41
+ "reference_attempts": 1,
42
+ "sam_white_bg": {
43
+ "input": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/chaos/samples/sample_000004/references/raw_ref_blue_light_source_attempt_01.png",
44
+ "output": "references/ref_blue_light_source.png",
45
+ "mask": "references/sam_mask_blue_light_source.png",
46
+ "sam_checkpoint": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/checkpoints/sam/sam_vit_b_01ec64.pth",
47
+ "sam_model_type": "vit_b",
48
+ "sam_device": "auto",
49
+ "sam_working_size": [
50
+ 640,
51
+ 640
52
+ ],
53
+ "sam_max_side": 640,
54
+ "sam_downscale": 0.625,
55
+ "prompt_box_xyxy": [
56
+ 132.0,
57
+ 159.0,
58
+ 891.0,
59
+ 864.0
60
+ ],
61
+ "mask_score": 3.485053,
62
+ "mask_area_ratio": 0.292151,
63
+ "elapsed_seconds": 9.6106
64
+ }
65
+ },
66
+ {
67
+ "name": "paint_roller",
68
+ "is_person": false,
69
+ "subject_type": "object",
70
+ "source_set": "obj_set",
71
+ "source_image_id": "Ego4D:ego4d_video/EGO_95307.npy:object:0",
72
+ "source_name": "paint roller",
73
+ "source_description": "A standard paint roller with a dark cylindrical cover and a metal frame connecting to a handle. Source dataset: Ego4D. Scene context: A close-up view of a paint roller against a light-colored wall in a dimly lit setting.",
74
+ "sub_caption": "paint roller: A standard paint roller with a dark cylindrical cover, attached to a metal frame and handle.. Scene role: Resting on a nearby surface in the foreground, catching subtle highlights from the red light.",
75
+ "measured_bbox": [
76
+ 0.2917,
77
+ 0.532,
78
+ 0.4405,
79
+ 0.7522
80
+ ],
81
+ "detection_confidence": 0.99,
82
+ "ref_style": "white_bg_encyclopedia_photo",
83
+ "ref_image": "references/ref_paint_roller.png",
84
+ "raw_ref_image": "references/raw_ref_paint_roller_attempt_01.png",
85
+ "reference_verify": "references/reference_verify_paint_roller.json",
86
+ "reference_verify_passed": true,
87
+ "reference_attempts": 1,
88
+ "sam_white_bg": {
89
+ "input": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/chaos/samples/sample_000004/references/raw_ref_paint_roller_attempt_01.png",
90
+ "output": "references/ref_paint_roller.png",
91
+ "mask": "references/sam_mask_paint_roller.png",
92
+ "sam_checkpoint": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/checkpoints/sam/sam_vit_b_01ec64.pth",
93
+ "sam_model_type": "vit_b",
94
+ "sam_device": "auto",
95
+ "sam_working_size": [
96
+ 640,
97
+ 640
98
+ ],
99
+ "sam_max_side": 640,
100
+ "sam_downscale": 0.625,
101
+ "prompt_box_xyxy": [
102
+ 136.0,
103
+ 75.0,
104
+ 866.0,
105
+ 950.0
106
+ ],
107
+ "mask_score": 3.459168,
108
+ "mask_area_ratio": 0.116944,
109
+ "elapsed_seconds": 7.1624
110
+ }
111
+ },
112
+ {
113
+ "name": "draped_tarp",
114
+ "is_person": false,
115
+ "subject_type": "object",
116
+ "source_set": "obj_set",
117
+ "source_image_id": "Ego4D:ego4d_video/EGO_37499.npy:object:1",
118
+ "source_name": "light-colored material",
119
+ "source_description": "A draped, light-colored or beige material, possibly part of a tent or covering, visible on the right side. Source dataset: Ego4D. Scene context: The scene is a dark, possibly outdoor or dimly lit setting, showing what appears to be a structure or object covered with a large piece of material or tarp.",
120
+ "sub_caption": "light-colored material: A draped, light-colored tarp or drop cloth covering large, indistinct shapes.. Scene role: Draped over items on the right side of the room, adding textural detail and reflecting the mixed ambient lighting.",
121
+ "measured_bbox": [
122
+ 0.392,
123
+ 0.4207,
124
+ 0.8243,
125
+ 0.8862
126
+ ],
127
+ "detection_confidence": 0.98,
128
+ "ref_style": "white_bg_encyclopedia_photo",
129
+ "ref_image": "references/ref_draped_tarp.png",
130
+ "raw_ref_image": "references/raw_ref_draped_tarp_attempt_01.png",
131
+ "reference_verify": "references/reference_verify_draped_tarp.json",
132
+ "reference_verify_passed": true,
133
+ "reference_attempts": 1,
134
+ "sam_white_bg": {
135
+ "input": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/chaos/samples/sample_000004/references/raw_ref_draped_tarp_attempt_01.png",
136
+ "output": "references/ref_draped_tarp.png",
137
+ "mask": "references/sam_mask_draped_tarp.png",
138
+ "sam_checkpoint": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/checkpoints/sam/sam_vit_b_01ec64.pth",
139
+ "sam_model_type": "vit_b",
140
+ "sam_device": "auto",
141
+ "sam_working_size": [
142
+ 640,
143
+ 640
144
+ ],
145
+ "sam_max_side": 640,
146
+ "sam_downscale": 0.625,
147
+ "prompt_box_xyxy": [
148
+ 0.0,
149
+ 189.0,
150
+ 1023.0,
151
+ 888.0
152
+ ],
153
+ "mask_score": 3.482188,
154
+ "mask_area_ratio": 0.485075,
155
+ "elapsed_seconds": 7.4131
156
+ }
157
+ }
158
+ ],
159
+ "not_emitted": [
160
+ {
161
+ "name": "worker_in_cap",
162
+ "reason": "not_detected"
163
+ },
164
+ {
165
+ "name": "stacked_boxes",
166
+ "reason": "not_detected"
167
+ }
168
+ ],
169
+ "model_ids": {
170
+ "chat_model": "gcp/google/gemini-3.1-pro-preview",
171
+ "image_model": "gcp/google/gemini-3-pro-image-preview"
172
+ }
173
+ }
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/rows/sample_000005.json ADDED
@@ -0,0 +1,302 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "sample_id": "sample_000005",
3
+ "target_total": 6,
4
+ "target_people": 3,
5
+ "target_objects": 3,
6
+ "canvas_size": [
7
+ 1152,
8
+ 864
9
+ ],
10
+ "canvas_aspect_ratio": "4:3",
11
+ "main_image": "main_image.png",
12
+ "bbox_overlay": "bbox_overlay.png",
13
+ "plan": "plan.json",
14
+ "detections": "detections.json",
15
+ "vocab_task": "vocab_task.json",
16
+ "n_planned": 6,
17
+ "n_detected": 6,
18
+ "n_subjects": 6,
19
+ "subjects": [
20
+ {
21
+ "name": "pizza_prep_hands",
22
+ "is_person": true,
23
+ "subject_type": "person",
24
+ "source_set": "people_set",
25
+ "source_image_id": "EPIC-Kitchens:P11_106:person:0",
26
+ "source_name": "person",
27
+ "source_description": "The person's hands and lower arms are visible at the bottom of the frame, appearing to be in the middle of preparing food. Source dataset: EPIC-Kitchens. Scene context: A top-down view of a wooden kitchen table where two pizzas are being prepared with various ingredients like red onions, mushrooms, and tomatoes.",
28
+ "sub_caption": "person: Hands and lower arms visible, preparing a pizza on a wooden surface.. Scene role: In the foreground, actively making a pizza.",
29
+ "measured_bbox": [
30
+ 0.532,
31
+ 0.2245,
32
+ 1.0,
33
+ 0.7871
34
+ ],
35
+ "detection_confidence": 0.9,
36
+ "ref_style": "white_bg_full_body_front",
37
+ "ref_image": "references/ref_pizza_prep_hands.png",
38
+ "raw_ref_image": "references/raw_ref_pizza_prep_hands_attempt_02.png",
39
+ "reference_verify": "references/reference_verify_pizza_prep_hands.json",
40
+ "reference_verify_passed": true,
41
+ "reference_attempts": 2,
42
+ "sam_white_bg": {
43
+ "input": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/chaos/samples/sample_000005/references/raw_ref_pizza_prep_hands_attempt_02.png",
44
+ "output": "references/ref_pizza_prep_hands.png",
45
+ "mask": "references/sam_mask_pizza_prep_hands.png",
46
+ "sam_checkpoint": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/checkpoints/sam/sam_vit_b_01ec64.pth",
47
+ "sam_model_type": "vit_b",
48
+ "sam_device": "auto",
49
+ "sam_working_size": [
50
+ 640,
51
+ 640
52
+ ],
53
+ "sam_max_side": 640,
54
+ "sam_downscale": 0.625,
55
+ "prompt_box_xyxy": [
56
+ 349.0,
57
+ 14.0,
58
+ 677.0,
59
+ 1016.0
60
+ ],
61
+ "mask_score": 3.451951,
62
+ "mask_area_ratio": 0.150558,
63
+ "elapsed_seconds": 10.2196
64
+ }
65
+ },
66
+ {
67
+ "name": "person_in_jacket",
68
+ "is_person": true,
69
+ "subject_type": "person",
70
+ "source_set": "people_set",
71
+ "source_image_id": "Ego4D:ego4d_video/EGO_22577.npy:person:0",
72
+ "source_name": "person",
73
+ "source_description": "A person visible mostly from the back, wearing a dark jacket over a red shirt with yellow text that includes the words 'STANLEY CUP'. The person has dark hair. Source dataset: Ego4D. Scene context: A close-up view of a person wearing a red shirt with yellow text, seemingly engaged in an activity in a dimly lit indoor setting.",
74
+ "sub_caption": "person: Person seen mostly from the back, dark hair, wearing a dark jacket over a red shirt with yellow abstract patterns.. Scene role: Standing in the midground, facing away toward the kitchen cabinets.",
75
+ "measured_bbox": [
76
+ 0.0,
77
+ 0.0,
78
+ 0.361,
79
+ 0.675
80
+ ],
81
+ "detection_confidence": 1.0,
82
+ "ref_style": "white_bg_full_body_front",
83
+ "ref_image": "references/ref_person_in_jacket.png",
84
+ "raw_ref_image": "references/raw_ref_person_in_jacket_attempt_02.png",
85
+ "reference_verify": "references/reference_verify_person_in_jacket.json",
86
+ "reference_verify_passed": true,
87
+ "reference_attempts": 2,
88
+ "sam_white_bg": {
89
+ "input": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/chaos/samples/sample_000005/references/raw_ref_person_in_jacket_attempt_02.png",
90
+ "output": "references/ref_person_in_jacket.png",
91
+ "mask": "references/sam_mask_person_in_jacket.png",
92
+ "sam_checkpoint": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/checkpoints/sam/sam_vit_b_01ec64.pth",
93
+ "sam_model_type": "vit_b",
94
+ "sam_device": "auto",
95
+ "sam_working_size": [
96
+ 640,
97
+ 640
98
+ ],
99
+ "sam_max_side": 640,
100
+ "sam_downscale": 0.625,
101
+ "prompt_box_xyxy": [
102
+ 334.0,
103
+ 15.0,
104
+ 684.0,
105
+ 1023.0
106
+ ],
107
+ "mask_score": 3.414528,
108
+ "mask_area_ratio": 0.160464,
109
+ "elapsed_seconds": 10.2925
110
+ }
111
+ },
112
+ {
113
+ "name": "person_with_pan",
114
+ "is_person": true,
115
+ "subject_type": "person",
116
+ "source_set": "people_set",
117
+ "source_image_id": "Ego4D:ego4d_video/EGO_192493.npy:person:0",
118
+ "source_name": "person",
119
+ "source_description": "A person standing in the room, seen from the torso down, holding a dark round object. Source dataset: Ego4D. Scene context: A person stands in a dimly lit room holding a round object near a blue wall.",
120
+ "sub_caption": "person: Person seen from the torso down, holding a dark round object.. Scene role: Standing in the background near a blue wall.",
121
+ "measured_bbox": [
122
+ 0.1195,
123
+ 0.0021,
124
+ 0.4483,
125
+ 0.6302
126
+ ],
127
+ "detection_confidence": 0.95,
128
+ "ref_style": "white_bg_full_body_front",
129
+ "ref_image": "references/ref_person_with_pan.png",
130
+ "raw_ref_image": "references/raw_ref_person_with_pan_attempt_02.png",
131
+ "reference_verify": "references/reference_verify_person_with_pan.json",
132
+ "reference_verify_passed": true,
133
+ "reference_attempts": 2,
134
+ "sam_white_bg": {
135
+ "input": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/chaos/samples/sample_000005/references/raw_ref_person_with_pan_attempt_02.png",
136
+ "output": "references/ref_person_with_pan.png",
137
+ "mask": "references/sam_mask_person_with_pan.png",
138
+ "sam_checkpoint": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/checkpoints/sam/sam_vit_b_01ec64.pth",
139
+ "sam_model_type": "vit_b",
140
+ "sam_device": "auto",
141
+ "sam_working_size": [
142
+ 640,
143
+ 640
144
+ ],
145
+ "sam_max_side": 640,
146
+ "sam_downscale": 0.625,
147
+ "prompt_box_xyxy": [
148
+ 334.0,
149
+ 18.0,
150
+ 690.0,
151
+ 1023.0
152
+ ],
153
+ "mask_score": 3.408831,
154
+ "mask_area_ratio": 0.163625,
155
+ "elapsed_seconds": 10.3028
156
+ }
157
+ },
158
+ {
159
+ "name": "salt_box",
160
+ "is_person": false,
161
+ "subject_type": "object",
162
+ "source_set": "obj_set",
163
+ "source_image_id": "EPIC-Kitchens:P35_102:object:1",
164
+ "source_name": "box of salt",
165
+ "source_description": "A small cardboard box with blue and black text, sitting on the counter near the stove. Source dataset: EPIC-Kitchens. Scene context: A kitchen counter area with a sink containing dirty dishes, a frying pan on a drying rack, and various cooking utensils.",
166
+ "sub_caption": "box of salt: A small cardboard box with blue and black graphical patterns, resembling a salt container.. Scene role: Resting on the wooden counter next to the pizza prep area.",
167
+ "measured_bbox": [
168
+ 0.5558,
169
+ 0.4006,
170
+ 0.6966,
171
+ 0.4937
172
+ ],
173
+ "detection_confidence": 0.5,
174
+ "ref_style": "white_bg_encyclopedia_photo",
175
+ "ref_image": "references/ref_salt_box.png",
176
+ "raw_ref_image": "references/raw_ref_salt_box_attempt_01.png",
177
+ "reference_verify": "references/reference_verify_salt_box.json",
178
+ "reference_verify_passed": true,
179
+ "reference_attempts": 1,
180
+ "sam_white_bg": {
181
+ "input": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/chaos/samples/sample_000005/references/raw_ref_salt_box_attempt_01.png",
182
+ "output": "references/ref_salt_box.png",
183
+ "mask": "references/sam_mask_salt_box.png",
184
+ "sam_checkpoint": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/checkpoints/sam/sam_vit_b_01ec64.pth",
185
+ "sam_model_type": "vit_b",
186
+ "sam_device": "auto",
187
+ "sam_working_size": [
188
+ 640,
189
+ 640
190
+ ],
191
+ "sam_max_side": 640,
192
+ "sam_downscale": 0.625,
193
+ "prompt_box_xyxy": [
194
+ 73.0,
195
+ 268.0,
196
+ 952.0,
197
+ 762.0
198
+ ],
199
+ "mask_score": 3.471932,
200
+ "mask_area_ratio": 0.353847,
201
+ "elapsed_seconds": 10.266
202
+ }
203
+ },
204
+ {
205
+ "name": "cutlery_set",
206
+ "is_person": false,
207
+ "subject_type": "object",
208
+ "source_set": "obj_set",
209
+ "source_image_id": "EPIC-Kitchens:P26_103:object:4",
210
+ "source_name": "cutlery",
211
+ "source_description": "A silver fork and a knife resting on the yellow plate inside the right sink bowl. Source dataset: EPIC-Kitchens. Scene context: A first-person view of a stainless steel kitchen sink containing dirty dishes and a blue cloth, with a hand visible in the foreground.",
212
+ "sub_caption": "cutlery: A silver fork and a knife resting on a yellow plate.. Scene role: Placed on the counter in the foreground left.",
213
+ "measured_bbox": [
214
+ 0.1913,
215
+ 0.8329,
216
+ 0.6116,
217
+ 0.9636
218
+ ],
219
+ "detection_confidence": "high",
220
+ "ref_style": "white_bg_encyclopedia_photo",
221
+ "ref_image": "references/ref_cutlery_set.png",
222
+ "raw_ref_image": "references/raw_ref_cutlery_set_attempt_02.png",
223
+ "reference_verify": "references/reference_verify_cutlery_set.json",
224
+ "reference_verify_passed": true,
225
+ "reference_attempts": 2,
226
+ "sam_white_bg": {
227
+ "input": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/chaos/samples/sample_000005/references/raw_ref_cutlery_set_attempt_02.png",
228
+ "output": "references/ref_cutlery_set.png",
229
+ "mask": "references/sam_mask_cutlery_set.png",
230
+ "sam_checkpoint": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/checkpoints/sam/sam_vit_b_01ec64.pth",
231
+ "sam_model_type": "vit_b",
232
+ "sam_device": "auto",
233
+ "sam_working_size": [
234
+ 640,
235
+ 640
236
+ ],
237
+ "sam_max_side": 640,
238
+ "sam_downscale": 0.625,
239
+ "prompt_box_xyxy": [
240
+ 28.0,
241
+ 122.0,
242
+ 1013.0,
243
+ 887.0
244
+ ],
245
+ "mask_score": 3.237995,
246
+ "mask_area_ratio": 0.452152,
247
+ "elapsed_seconds": 10.821
248
+ }
249
+ },
250
+ {
251
+ "name": "wall_cabinet",
252
+ "is_person": false,
253
+ "subject_type": "object",
254
+ "source_set": "obj_set",
255
+ "source_image_id": "EPIC-Kitchens:P26_121:object:12",
256
+ "source_name": "cabinet",
257
+ "source_description": "A wooden cabinet positioned above the counter on the right side. Source dataset: EPIC-Kitchens. Scene context: A kitchen counter top with a stove, a pan, a bowl of yellow liquid, a wooden cutting board, a plate of food, a water bottle, a large water jug, and a small metal lid.",
258
+ "sub_caption": "cabinet: A wooden cabinet positioned above a kitchen counter.. Scene role: Mounted on the wall in the midground, directly above the counter.",
259
+ "measured_bbox": [
260
+ 0.5897,
261
+ 0.0017,
262
+ 0.9469,
263
+ 0.1735
264
+ ],
265
+ "detection_confidence": 0.99,
266
+ "ref_style": "white_bg_encyclopedia_photo",
267
+ "ref_image": "references/ref_wall_cabinet.png",
268
+ "raw_ref_image": "references/raw_ref_wall_cabinet_attempt_01.png",
269
+ "reference_verify": "references/reference_verify_wall_cabinet.json",
270
+ "reference_verify_passed": true,
271
+ "reference_attempts": 1,
272
+ "sam_white_bg": {
273
+ "input": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/chaos/samples/sample_000005/references/raw_ref_wall_cabinet_attempt_01.png",
274
+ "output": "references/ref_wall_cabinet.png",
275
+ "mask": "references/sam_mask_wall_cabinet.png",
276
+ "sam_checkpoint": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/checkpoints/sam/sam_vit_b_01ec64.pth",
277
+ "sam_model_type": "vit_b",
278
+ "sam_device": "auto",
279
+ "sam_working_size": [
280
+ 640,
281
+ 640
282
+ ],
283
+ "sam_max_side": 640,
284
+ "sam_downscale": 0.625,
285
+ "prompt_box_xyxy": [
286
+ 15.0,
287
+ 31.0,
288
+ 1008.0,
289
+ 1013.0
290
+ ],
291
+ "mask_score": 3.398914,
292
+ "mask_area_ratio": 0.735002,
293
+ "elapsed_seconds": 10.923
294
+ }
295
+ }
296
+ ],
297
+ "not_emitted": [],
298
+ "model_ids": {
299
+ "chat_model": "gcp/google/gemini-3.1-pro-preview",
300
+ "image_model": "gcp/google/gemini-3-pro-image-preview"
301
+ }
302
+ }
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/rows/sample_000006.json ADDED
@@ -0,0 +1,311 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "sample_id": "sample_000006",
3
+ "target_total": 8,
4
+ "target_people": 1,
5
+ "target_objects": 7,
6
+ "canvas_size": [
7
+ 1152,
8
+ 864
9
+ ],
10
+ "canvas_aspect_ratio": "4:3",
11
+ "main_image": "main_image.png",
12
+ "bbox_overlay": "bbox_overlay.png",
13
+ "plan": "plan.json",
14
+ "detections": "detections.json",
15
+ "vocab_task": "vocab_task.json",
16
+ "n_planned": 8,
17
+ "n_detected": 8,
18
+ "n_subjects": 6,
19
+ "subjects": [
20
+ {
21
+ "name": "person_at_sink",
22
+ "is_person": true,
23
+ "subject_type": "person",
24
+ "source_set": "people_set",
25
+ "source_image_id": "EPIC-Kitchens:P26_103:person:0",
26
+ "source_name": "person",
27
+ "source_description": "A person's left hand and lower body, including dark trousers and black shoes with white soles, are visible in the foreground, reaching towards the sink. Source dataset: EPIC-Kitchens. Scene context: A first-person view of a stainless steel kitchen sink containing dirty dishes and a blue cloth, with a hand visible in the foreground.",
28
+ "sub_caption": "person: A person's left hand and lower body wearing dark trousers and black shoes with white soles.. Scene role: Standing in the foreground, reaching their left hand towards the kitchen faucet.",
29
+ "measured_bbox": [
30
+ 0.0,
31
+ 0.3583,
32
+ 0.2441,
33
+ 1.0
34
+ ],
35
+ "detection_confidence": 0.95,
36
+ "ref_style": "white_bg_full_body_front",
37
+ "ref_image": "references/ref_person_at_sink.png",
38
+ "raw_ref_image": "references/raw_ref_person_at_sink_attempt_01.png",
39
+ "reference_verify": "references/reference_verify_person_at_sink.json",
40
+ "reference_verify_passed": true,
41
+ "reference_attempts": 1,
42
+ "sam_white_bg": {
43
+ "input": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/chaos/samples/sample_000006/references/raw_ref_person_at_sink_attempt_01.png",
44
+ "output": "references/ref_person_at_sink.png",
45
+ "mask": "references/sam_mask_person_at_sink.png",
46
+ "sam_checkpoint": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/checkpoints/sam/sam_vit_b_01ec64.pth",
47
+ "sam_model_type": "vit_b",
48
+ "sam_device": "auto",
49
+ "sam_working_size": [
50
+ 640,
51
+ 640
52
+ ],
53
+ "sam_max_side": 640,
54
+ "sam_downscale": 0.625,
55
+ "prompt_box_xyxy": [
56
+ 320.0,
57
+ 24.0,
58
+ 689.0,
59
+ 1002.0
60
+ ],
61
+ "mask_score": 3.450755,
62
+ "mask_area_ratio": 0.163542,
63
+ "elapsed_seconds": 31.0984
64
+ }
65
+ },
66
+ {
67
+ "name": "wooden_door",
68
+ "is_person": false,
69
+ "subject_type": "object",
70
+ "source_set": "obj_set",
71
+ "source_image_id": "EPIC-Kitchens:P12_104:object:0",
72
+ "source_name": "door",
73
+ "source_description": "A light brown wooden door, closed, with a metallic door handle. Source dataset: EPIC-Kitchens. Scene context: A close-up view of a closed wooden door with a metal handle, positioned in a room with a kitchen area visible to the left.",
74
+ "sub_caption": "door: A light brown wooden door, closed, with a metallic handle.. Scene role: Visible in the background on the kitchen wall.",
75
+ "measured_bbox": [
76
+ 0.2139,
77
+ 0.0,
78
+ 0.3994,
79
+ 0.412
80
+ ],
81
+ "detection_confidence": 1.0,
82
+ "ref_style": "white_bg_encyclopedia_photo",
83
+ "ref_image": "references/ref_wooden_door.png",
84
+ "raw_ref_image": "references/raw_ref_wooden_door_attempt_01.png",
85
+ "reference_verify": "references/reference_verify_wooden_door.json",
86
+ "reference_verify_passed": true,
87
+ "reference_attempts": 1,
88
+ "sam_white_bg": {
89
+ "input": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/chaos/samples/sample_000006/references/raw_ref_wooden_door_attempt_01.png",
90
+ "output": "references/ref_wooden_door.png",
91
+ "mask": "references/sam_mask_wooden_door.png",
92
+ "sam_checkpoint": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/checkpoints/sam/sam_vit_b_01ec64.pth",
93
+ "sam_model_type": "vit_b",
94
+ "sam_device": "auto",
95
+ "sam_working_size": [
96
+ 640,
97
+ 640
98
+ ],
99
+ "sam_max_side": 640,
100
+ "sam_downscale": 0.625,
101
+ "prompt_box_xyxy": [
102
+ 256.0,
103
+ 26.0,
104
+ 767.0,
105
+ 1015.0
106
+ ],
107
+ "mask_score": 3.446321,
108
+ "mask_area_ratio": 0.388947,
109
+ "elapsed_seconds": 9.29
110
+ }
111
+ },
112
+ {
113
+ "name": "wrapped_cucumber",
114
+ "is_person": false,
115
+ "subject_type": "object",
116
+ "source_set": "obj_set",
117
+ "source_image_id": "EPIC-Kitchens:P37_101:object:1",
118
+ "source_name": "cucumber 2",
119
+ "source_description": "A long, green cucumber wrapped in clear plastic, resting horizontally on the dark countertop, slightly overlapping the other cucumber and positioned closer to the viewer. Source dataset: EPIC-Kitchens. Scene context: A first-person view of a person holding two whole cucumbers over a dark kitchen counter, with an onion, garlic, a plastic container, a rice cooker, and a living area in the background.",
120
+ "sub_caption": "cucumber 2: A long, green cucumber wrapped in clear plastic.. Scene role: Resting horizontally on the dark countertop next to the sink.",
121
+ "measured_bbox": [
122
+ 0.2215,
123
+ 0.4465,
124
+ 0.4029,
125
+ 0.5104
126
+ ],
127
+ "detection_confidence": 0.99,
128
+ "ref_style": "white_bg_encyclopedia_photo",
129
+ "ref_image": "references/ref_wrapped_cucumber.png",
130
+ "raw_ref_image": "references/raw_ref_wrapped_cucumber_attempt_01.png",
131
+ "reference_verify": "references/reference_verify_wrapped_cucumber.json",
132
+ "reference_verify_passed": true,
133
+ "reference_attempts": 1,
134
+ "sam_white_bg": {
135
+ "input": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/chaos/samples/sample_000006/references/raw_ref_wrapped_cucumber_attempt_01.png",
136
+ "output": "references/ref_wrapped_cucumber.png",
137
+ "mask": "references/sam_mask_wrapped_cucumber.png",
138
+ "sam_checkpoint": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/checkpoints/sam/sam_vit_b_01ec64.pth",
139
+ "sam_model_type": "vit_b",
140
+ "sam_device": "auto",
141
+ "sam_working_size": [
142
+ 640,
143
+ 640
144
+ ],
145
+ "sam_max_side": 640,
146
+ "sam_downscale": 0.625,
147
+ "prompt_box_xyxy": [
148
+ 33.0,
149
+ 397.0,
150
+ 1011.0,
151
+ 624.0
152
+ ],
153
+ "mask_score": 3.430612,
154
+ "mask_area_ratio": 0.118574,
155
+ "elapsed_seconds": 7.2551
156
+ }
157
+ },
158
+ {
159
+ "name": "gas_stove",
160
+ "is_person": false,
161
+ "subject_type": "object",
162
+ "source_set": "obj_set",
163
+ "source_image_id": "EPIC-Kitchens:P22_105:object:12",
164
+ "source_name": "stove",
165
+ "source_description": "A gas stove with black grates on the left side. Source dataset: EPIC-Kitchens. Scene context: A kitchen counter area with a stove, a sink, various utensils, bottles, and cabinets.",
166
+ "sub_caption": "stove: A kitchen gas stove with black grates.. Scene role: Positioned along the counter in the background.",
167
+ "measured_bbox": [
168
+ 0.03,
169
+ 0.345,
170
+ 0.318,
171
+ 0.444
172
+ ],
173
+ "detection_confidence": 0.99,
174
+ "ref_style": "white_bg_encyclopedia_photo",
175
+ "ref_image": "references/ref_gas_stove.png",
176
+ "raw_ref_image": "references/raw_ref_gas_stove_attempt_01.png",
177
+ "reference_verify": "references/reference_verify_gas_stove.json",
178
+ "reference_verify_passed": true,
179
+ "reference_attempts": 1,
180
+ "sam_white_bg": {
181
+ "input": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/chaos/samples/sample_000006/references/raw_ref_gas_stove_attempt_01.png",
182
+ "output": "references/ref_gas_stove.png",
183
+ "mask": "references/sam_mask_gas_stove.png",
184
+ "sam_checkpoint": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/checkpoints/sam/sam_vit_b_01ec64.pth",
185
+ "sam_model_type": "vit_b",
186
+ "sam_device": "auto",
187
+ "sam_working_size": [
188
+ 640,
189
+ 640
190
+ ],
191
+ "sam_max_side": 640,
192
+ "sam_downscale": 0.625,
193
+ "prompt_box_xyxy": [
194
+ 58.0,
195
+ 180.0,
196
+ 965.0,
197
+ 842.0
198
+ ],
199
+ "mask_score": 3.470988,
200
+ "mask_area_ratio": 0.477615,
201
+ "elapsed_seconds": 7.3908
202
+ }
203
+ },
204
+ {
205
+ "name": "water_pitcher",
206
+ "is_person": false,
207
+ "subject_type": "object",
208
+ "source_set": "obj_set",
209
+ "source_image_id": "EPIC-Kitchens:P07_107:object:13",
210
+ "source_name": "water pitcher",
211
+ "source_description": "A clear plastic water pitcher with a white handle and lid, sitting on the counter. Source dataset: EPIC-Kitchens. Scene context: A narrow kitchen space with a dark floor, light cabinets, a sink counter with various items, a radiator on the wall, and a trash can on the floor.",
212
+ "sub_caption": "water pitcher: A clear plastic water pitcher with a white handle and lid.. Scene role: Sitting upright on the counter.",
213
+ "measured_bbox": [
214
+ 0.3327,
215
+ 0.2732,
216
+ 0.4536,
217
+ 0.4573
218
+ ],
219
+ "detection_confidence": 0.99,
220
+ "ref_style": "white_bg_encyclopedia_photo",
221
+ "ref_image": "references/ref_water_pitcher.png",
222
+ "raw_ref_image": "references/raw_ref_water_pitcher_attempt_01.png",
223
+ "reference_verify": "references/reference_verify_water_pitcher.json",
224
+ "reference_verify_passed": true,
225
+ "reference_attempts": 1,
226
+ "sam_white_bg": {
227
+ "input": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/chaos/samples/sample_000006/references/raw_ref_water_pitcher_attempt_01.png",
228
+ "output": "references/ref_water_pitcher.png",
229
+ "mask": "references/sam_mask_water_pitcher.png",
230
+ "sam_checkpoint": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/checkpoints/sam/sam_vit_b_01ec64.pth",
231
+ "sam_model_type": "vit_b",
232
+ "sam_device": "auto",
233
+ "sam_working_size": [
234
+ 640,
235
+ 640
236
+ ],
237
+ "sam_max_side": 640,
238
+ "sam_downscale": 0.625,
239
+ "prompt_box_xyxy": [
240
+ 242.0,
241
+ 115.0,
242
+ 856.0,
243
+ 972.0
244
+ ],
245
+ "mask_score": 3.323768,
246
+ "mask_area_ratio": 0.450877,
247
+ "elapsed_seconds": 7.2849
248
+ }
249
+ },
250
+ {
251
+ "name": "silver_spoon",
252
+ "is_person": false,
253
+ "subject_type": "object",
254
+ "source_set": "obj_set",
255
+ "source_image_id": "EPIC-Kitchens:P04_103:object:9",
256
+ "source_name": "Silver Spoon",
257
+ "source_description": "Small silver metal spoon resting near the black spatula handle. Source dataset: EPIC-Kitchens. Scene context: A messy kitchen counter with a stove, toaster, and various cooking utensils scattered around.",
258
+ "sub_caption": "Silver Spoon: A small silver metal spoon.. Scene role: Laying flat on the messy countertop near the cucumber.",
259
+ "measured_bbox": [
260
+ 0.3001,
261
+ 0.4801,
262
+ 0.3988,
263
+ 0.539
264
+ ],
265
+ "detection_confidence": 0.99,
266
+ "ref_style": "white_bg_encyclopedia_photo",
267
+ "ref_image": "references/ref_silver_spoon.png",
268
+ "raw_ref_image": "references/raw_ref_silver_spoon_attempt_01.png",
269
+ "reference_verify": "references/reference_verify_silver_spoon.json",
270
+ "reference_verify_passed": true,
271
+ "reference_attempts": 1,
272
+ "sam_white_bg": {
273
+ "input": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/chaos/samples/sample_000006/references/raw_ref_silver_spoon_attempt_01.png",
274
+ "output": "references/ref_silver_spoon.png",
275
+ "mask": "references/sam_mask_silver_spoon.png",
276
+ "sam_checkpoint": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/checkpoints/sam/sam_vit_b_01ec64.pth",
277
+ "sam_model_type": "vit_b",
278
+ "sam_device": "auto",
279
+ "sam_working_size": [
280
+ 640,
281
+ 640
282
+ ],
283
+ "sam_max_side": 640,
284
+ "sam_downscale": 0.625,
285
+ "prompt_box_xyxy": [
286
+ 88.0,
287
+ 77.0,
288
+ 916.0,
289
+ 950.0
290
+ ],
291
+ "mask_score": 3.449565,
292
+ "mask_area_ratio": 0.092279,
293
+ "elapsed_seconds": 7.0866
294
+ }
295
+ }
296
+ ],
297
+ "not_emitted": [
298
+ {
299
+ "name": "black_pot",
300
+ "reason": "not_detected"
301
+ },
302
+ {
303
+ "name": "kitchen_faucet",
304
+ "reason": "not_detected"
305
+ }
306
+ ],
307
+ "model_ids": {
308
+ "chat_model": "gcp/google/gemini-3.1-pro-preview",
309
+ "image_model": "gcp/google/gemini-3-pro-image-preview"
310
+ }
311
+ }