Upload folder using huggingface_hub
#2
by kimi000 - opened
This view is limited to 50 files because it contains too many changes. See the raw diff here.
- .gitattributes +192 -0
- samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/README.md +16 -0
- samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/dataset.json +0 -0
- samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/dataset.jsonl +0 -0
- samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/detection_pool/done/sample_000001.json +16 -0
- samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/detection_pool/done/sample_000003.json +16 -0
- samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/detection_pool/done/sample_000004.json +16 -0
- samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/detection_pool/done/sample_000005.json +16 -0
- samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/detection_pool/done/sample_000006.json +16 -0
- samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/detection_pool/done/sample_000007.json +32 -0
- samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/detection_pool/done/sample_000008.json +16 -0
- samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/detection_pool/done/sample_000009.json +16 -0
- samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/detection_pool/done/sample_000010.json +16 -0
- samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/detection_pool/done/sample_000011.json +16 -0
- samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/emit_pool/done/sample_000001.json +4 -0
- samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/emit_pool/done/sample_000003.json +4 -0
- samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/emit_pool/done/sample_000004.json +4 -0
- samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/emit_pool/done/sample_000005.json +4 -0
- samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/emit_pool/done/sample_000006.json +4 -0
- samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/emit_pool/done/sample_000007.json +4 -0
- samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/emit_pool/done/sample_000008.json +4 -0
- samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/emit_pool/done/sample_000009.json +4 -0
- samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/emit_pool/done/sample_000010.json +4 -0
- samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/emit_pool/done/sample_000011.json +4 -0
- samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/plan_pool/done/sample_000001.json +14 -0
- samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/plan_pool/done/sample_000002.json +14 -0
- samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/plan_pool/done/sample_000003.json +14 -0
- samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/plan_pool/done/sample_000004.json +14 -0
- samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/plan_pool/done/sample_000005.json +14 -0
- samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/plan_pool/done/sample_000006.json +14 -0
- samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/plan_pool/done/sample_000007.json +14 -0
- samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/plan_pool/done/sample_000008.json +14 -0
- samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/plan_pool/done/sample_000009.json +14 -0
- samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/plan_pool/done/sample_000010.json +14 -0
- samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/plan_pool/done/sample_000011.json +14 -0
- samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/reference_pool/done/sample_000001.json +18 -0
- samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/reference_pool/done/sample_000003.json +18 -0
- samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/reference_pool/done/sample_000004.json +18 -0
- samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/reference_pool/done/sample_000005.json +18 -0
- samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/reference_pool/done/sample_000006.json +18 -0
- samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/reference_pool/done/sample_000007.json +18 -0
- samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/reference_pool/done/sample_000008.json +18 -0
- samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/reference_pool/done/sample_000009.json +18 -0
- samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/reference_pool/done/sample_000010.json +18 -0
- samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/reference_pool/done/sample_000011.json +18 -0
- samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/rows/sample_000001.json +164 -0
- samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/rows/sample_000003.json +164 -0
- samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/rows/sample_000004.json +173 -0
- samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/rows/sample_000005.json +302 -0
- samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/rows/sample_000006.json +311 -0
.gitattributes
CHANGED
|
@@ -52,3 +52,195 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
| 52 |
10samples/sample_0007/overlays/overlay_accepted.png filter=lfs diff=lfs merge=lfs -text
|
| 53 |
10samples/sample_0007/overlays/overlay_intended.png filter=lfs diff=lfs merge=lfs -text
|
| 54 |
10samples/sample_0007/overlays/overlay_measured.png filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 52 |
10samples/sample_0007/overlays/overlay_accepted.png filter=lfs diff=lfs merge=lfs -text
|
| 53 |
10samples/sample_0007/overlays/overlay_intended.png filter=lfs diff=lfs merge=lfs -text
|
| 54 |
10samples/sample_0007/overlays/overlay_measured.png filter=lfs diff=lfs merge=lfs -text
|
| 55 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000001/bbox_overlay.png filter=lfs diff=lfs merge=lfs -text
|
| 56 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000001/crops/detect_refine_person_in_red_light.png filter=lfs diff=lfs merge=lfs -text
|
| 57 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000001/crops/detect_refine_red_illuminated_structure.png filter=lfs diff=lfs merge=lfs -text
|
| 58 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000001/crops/diversify_input_person_in_red_light.png filter=lfs diff=lfs merge=lfs -text
|
| 59 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000001/crops/diversify_input_red_illuminated_structure.png filter=lfs diff=lfs merge=lfs -text
|
| 60 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000001/main_image.png filter=lfs diff=lfs merge=lfs -text
|
| 61 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000001/references/ref_person_in_red_light.png filter=lfs diff=lfs merge=lfs -text
|
| 62 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000001/references/ref_red_illuminated_structure.png filter=lfs diff=lfs merge=lfs -text
|
| 63 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000002/crops/detect_refine_bright_blue_panel.png filter=lfs diff=lfs merge=lfs -text
|
| 64 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000002/crops/detect_refine_dark_door.png filter=lfs diff=lfs merge=lfs -text
|
| 65 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000002/crops/detect_refine_door_frame.png filter=lfs diff=lfs merge=lfs -text
|
| 66 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000002/crops/detect_refine_patterned_floor.png filter=lfs diff=lfs merge=lfs -text
|
| 67 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000002/crops/detect_refine_patterned_surface.png filter=lfs diff=lfs merge=lfs -text
|
| 68 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000002/crops/detect_refine_person_forming_heart.png filter=lfs diff=lfs merge=lfs -text
|
| 69 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000002/crops/detect_refine_person_holding_red_object.png filter=lfs diff=lfs merge=lfs -text
|
| 70 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000002/crops/detect_refine_person_manipulating_object.png filter=lfs diff=lfs merge=lfs -text
|
| 71 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000002/crops/detect_refine_rectangular_blue_screen.png filter=lfs diff=lfs merge=lfs -text
|
| 72 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000002/crops/detect_refine_textured_background.png filter=lfs diff=lfs merge=lfs -text
|
| 73 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000002/crops/detect_refine_textured_background_drapery.png filter=lfs diff=lfs merge=lfs -text
|
| 74 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000002/crops/detect_refine_textured_surface.png filter=lfs diff=lfs merge=lfs -text
|
| 75 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000002/crops/detect_refine_textured_table_cloth.png filter=lfs diff=lfs merge=lfs -text
|
| 76 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000002/crops/detect_refine_wooden_chair.png filter=lfs diff=lfs merge=lfs -text
|
| 77 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000002/crops/detect_refine_wooden_structure.png filter=lfs diff=lfs merge=lfs -text
|
| 78 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000002/main_image.png filter=lfs diff=lfs merge=lfs -text
|
| 79 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000003/bbox_overlay.png filter=lfs diff=lfs merge=lfs -text
|
| 80 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000003/crops/detect_refine_person_in_red_light.png filter=lfs diff=lfs merge=lfs -text
|
| 81 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000003/crops/detect_refine_red_illuminated_book.png filter=lfs diff=lfs merge=lfs -text
|
| 82 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000003/crops/detect_refine_shadowy_doorway.png filter=lfs diff=lfs merge=lfs -text
|
| 83 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000003/crops/diversify_input_person_in_red_light.png filter=lfs diff=lfs merge=lfs -text
|
| 84 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000003/crops/diversify_input_red_illuminated_book.png filter=lfs diff=lfs merge=lfs -text
|
| 85 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000003/crops/diversify_input_shadowy_doorway.png filter=lfs diff=lfs merge=lfs -text
|
| 86 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000003/main_image.png filter=lfs diff=lfs merge=lfs -text
|
| 87 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000003/references/ref_person_in_red_light.png filter=lfs diff=lfs merge=lfs -text
|
| 88 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000003/references/ref_red_illuminated_book.png filter=lfs diff=lfs merge=lfs -text
|
| 89 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000003/references/ref_shadowy_doorway.png filter=lfs diff=lfs merge=lfs -text
|
| 90 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000004/bbox_overlay.png filter=lfs diff=lfs merge=lfs -text
|
| 91 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000004/crops/detect_refine_draped_tarp.png filter=lfs diff=lfs merge=lfs -text
|
| 92 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000004/crops/detect_refine_painter_in_cap.png filter=lfs diff=lfs merge=lfs -text
|
| 93 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000004/crops/detect_refine_stacked_storage_boxes.png filter=lfs diff=lfs merge=lfs -text
|
| 94 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000004/crops/diversify_input_draped_tarp.png filter=lfs diff=lfs merge=lfs -text
|
| 95 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000004/main_image.png filter=lfs diff=lfs merge=lfs -text
|
| 96 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000004/references/ref_blue_light_source.png filter=lfs diff=lfs merge=lfs -text
|
| 97 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000004/references/ref_draped_tarp.png filter=lfs diff=lfs merge=lfs -text
|
| 98 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000004/references/ref_paint_roller.png filter=lfs diff=lfs merge=lfs -text
|
| 99 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000005/bbox_overlay.png filter=lfs diff=lfs merge=lfs -text
|
| 100 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000005/crops/detect_refine_cutlery_set.png filter=lfs diff=lfs merge=lfs -text
|
| 101 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000005/crops/detect_refine_person_in_jacket.png filter=lfs diff=lfs merge=lfs -text
|
| 102 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000005/crops/detect_refine_person_with_pan.png filter=lfs diff=lfs merge=lfs -text
|
| 103 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000005/crops/detect_refine_pizza_prep_hands.png filter=lfs diff=lfs merge=lfs -text
|
| 104 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000005/crops/detect_refine_wall_cabinet.png filter=lfs diff=lfs merge=lfs -text
|
| 105 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000005/crops/diversify_input_cutlery_set.png filter=lfs diff=lfs merge=lfs -text
|
| 106 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000005/crops/diversify_input_person_in_jacket.png filter=lfs diff=lfs merge=lfs -text
|
| 107 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000005/crops/diversify_input_person_with_pan.png filter=lfs diff=lfs merge=lfs -text
|
| 108 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000005/crops/diversify_input_pizza_prep_hands.png filter=lfs diff=lfs merge=lfs -text
|
| 109 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000005/crops/diversify_input_wall_cabinet.png filter=lfs diff=lfs merge=lfs -text
|
| 110 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000005/main_image.png filter=lfs diff=lfs merge=lfs -text
|
| 111 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000005/references/ref_cutlery_set.png filter=lfs diff=lfs merge=lfs -text
|
| 112 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000005/references/ref_person_in_jacket.png filter=lfs diff=lfs merge=lfs -text
|
| 113 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000005/references/ref_person_with_pan.png filter=lfs diff=lfs merge=lfs -text
|
| 114 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000005/references/ref_pizza_prep_hands.png filter=lfs diff=lfs merge=lfs -text
|
| 115 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000005/references/ref_salt_box.png filter=lfs diff=lfs merge=lfs -text
|
| 116 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000005/references/ref_wall_cabinet.png filter=lfs diff=lfs merge=lfs -text
|
| 117 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000006/bbox_overlay.png filter=lfs diff=lfs merge=lfs -text
|
| 118 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000006/crops/detect_refine_large_black_pot.png filter=lfs diff=lfs merge=lfs -text
|
| 119 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000006/crops/detect_refine_person_at_sink.png filter=lfs diff=lfs merge=lfs -text
|
| 120 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000006/crops/detect_refine_wooden_door.png filter=lfs diff=lfs merge=lfs -text
|
| 121 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000006/crops/diversify_input_large_black_pot.png filter=lfs diff=lfs merge=lfs -text
|
| 122 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000006/crops/diversify_input_person_at_sink.png filter=lfs diff=lfs merge=lfs -text
|
| 123 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000006/crops/diversify_input_sink_faucet.png filter=lfs diff=lfs merge=lfs -text
|
| 124 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000006/crops/diversify_input_wooden_door.png filter=lfs diff=lfs merge=lfs -text
|
| 125 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000006/main_image.png filter=lfs diff=lfs merge=lfs -text
|
| 126 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000006/references/ref_gas_stove.png filter=lfs diff=lfs merge=lfs -text
|
| 127 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000006/references/ref_large_black_pot.png filter=lfs diff=lfs merge=lfs -text
|
| 128 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000006/references/ref_person_at_sink.png filter=lfs diff=lfs merge=lfs -text
|
| 129 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000006/references/ref_silver_spoon.png filter=lfs diff=lfs merge=lfs -text
|
| 130 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000006/references/ref_sink_faucet.png filter=lfs diff=lfs merge=lfs -text
|
| 131 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000006/references/ref_water_pitcher.png filter=lfs diff=lfs merge=lfs -text
|
| 132 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000006/references/ref_wooden_door.png filter=lfs diff=lfs merge=lfs -text
|
| 133 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000006/references/ref_wrapped_cucumber.png filter=lfs diff=lfs merge=lfs -text
|
| 134 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000007/bbox_overlay.png filter=lfs diff=lfs merge=lfs -text
|
| 135 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000007/crops/detect_refine_backpack.png filter=lfs diff=lfs merge=lfs -text
|
| 136 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000007/crops/detect_refine_cable.png filter=lfs diff=lfs merge=lfs -text
|
| 137 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000007/crops/detect_refine_dark_area.png filter=lfs diff=lfs merge=lfs -text
|
| 138 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000007/crops/detect_refine_grid_patterned_floor.png filter=lfs diff=lfs merge=lfs -text
|
| 139 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000007/crops/detect_refine_shadowy_shape.png filter=lfs diff=lfs merge=lfs -text
|
| 140 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000007/crops/detect_refine_textured_fabric_area.png filter=lfs diff=lfs merge=lfs -text
|
| 141 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000007/crops/detect_refine_textured_surface.png filter=lfs diff=lfs merge=lfs -text
|
| 142 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000007/crops/detect_refine_typist.png filter=lfs diff=lfs merge=lfs -text
|
| 143 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000007/crops/diversify_input_backpack.png filter=lfs diff=lfs merge=lfs -text
|
| 144 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000007/crops/diversify_input_blue_lines.png filter=lfs diff=lfs merge=lfs -text
|
| 145 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000007/crops/diversify_input_cable.png filter=lfs diff=lfs merge=lfs -text
|
| 146 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000007/crops/diversify_input_dark_area.png filter=lfs diff=lfs merge=lfs -text
|
| 147 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000007/crops/diversify_input_grid_patterned_floor.png filter=lfs diff=lfs merge=lfs -text
|
| 148 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000007/crops/diversify_input_shadowy_shape.png filter=lfs diff=lfs merge=lfs -text
|
| 149 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000007/crops/diversify_input_textured_fabric_area.png filter=lfs diff=lfs merge=lfs -text
|
| 150 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000007/crops/diversify_input_textured_surface.png filter=lfs diff=lfs merge=lfs -text
|
| 151 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000007/crops/diversify_input_typist.png filter=lfs diff=lfs merge=lfs -text
|
| 152 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000007/main_image.png filter=lfs diff=lfs merge=lfs -text
|
| 153 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000007/references/ref_backpack.png filter=lfs diff=lfs merge=lfs -text
|
| 154 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000007/references/ref_blue_light.png filter=lfs diff=lfs merge=lfs -text
|
| 155 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000007/references/ref_blue_light_source.png filter=lfs diff=lfs merge=lfs -text
|
| 156 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000007/references/ref_blue_lines.png filter=lfs diff=lfs merge=lfs -text
|
| 157 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000007/references/ref_dark_area.png filter=lfs diff=lfs merge=lfs -text
|
| 158 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000007/references/ref_electronic_device.png filter=lfs diff=lfs merge=lfs -text
|
| 159 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000007/references/ref_grid_patterned_floor.png filter=lfs diff=lfs merge=lfs -text
|
| 160 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000007/references/ref_shadowy_shape.png filter=lfs diff=lfs merge=lfs -text
|
| 161 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000007/references/ref_small_blue_rectangle.png filter=lfs diff=lfs merge=lfs -text
|
| 162 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000007/references/ref_textured_fabric_area.png filter=lfs diff=lfs merge=lfs -text
|
| 163 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000007/references/ref_textured_surface.png filter=lfs diff=lfs merge=lfs -text
|
| 164 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000007/references/ref_thin_curved_object.png filter=lfs diff=lfs merge=lfs -text
|
| 165 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000007/references/ref_typist.png filter=lfs diff=lfs merge=lfs -text
|
| 166 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000008/bbox_overlay.png filter=lfs diff=lfs merge=lfs -text
|
| 167 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000008/crops/detect_refine_hands_holding_part.png filter=lfs diff=lfs merge=lfs -text
|
| 168 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000008/crops/detect_refine_hands_with_small_object.png filter=lfs diff=lfs merge=lfs -text
|
| 169 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000008/crops/detect_refine_helmeted_figure.png filter=lfs diff=lfs merge=lfs -text
|
| 170 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000008/crops/detect_refine_person_by_screens.png filter=lfs diff=lfs merge=lfs -text
|
| 171 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000008/crops/detect_refine_silhouette_with_phone.png filter=lfs diff=lfs merge=lfs -text
|
| 172 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000008/crops/diversify_input_hands_with_small_object.png filter=lfs diff=lfs merge=lfs -text
|
| 173 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000008/crops/diversify_input_hands_with_smoldering_tool.png filter=lfs diff=lfs merge=lfs -text
|
| 174 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000008/crops/diversify_input_helmeted_figure.png filter=lfs diff=lfs merge=lfs -text
|
| 175 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000008/crops/diversify_input_person_by_screens.png filter=lfs diff=lfs merge=lfs -text
|
| 176 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000008/crops/diversify_input_silhouette_with_phone.png filter=lfs diff=lfs merge=lfs -text
|
| 177 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000008/main_image.png filter=lfs diff=lfs merge=lfs -text
|
| 178 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000008/references/ref_blue_light_module.png filter=lfs diff=lfs merge=lfs -text
|
| 179 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000008/references/ref_hands_holding_part.png filter=lfs diff=lfs merge=lfs -text
|
| 180 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000008/references/ref_hands_passing_object.png filter=lfs diff=lfs merge=lfs -text
|
| 181 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000008/references/ref_hands_with_small_object.png filter=lfs diff=lfs merge=lfs -text
|
| 182 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000008/references/ref_hands_with_smoldering_tool.png filter=lfs diff=lfs merge=lfs -text
|
| 183 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000008/references/ref_helmeted_figure.png filter=lfs diff=lfs merge=lfs -text
|
| 184 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000008/references/ref_person_by_screens.png filter=lfs diff=lfs merge=lfs -text
|
| 185 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000008/references/ref_reaching_hands.png filter=lfs diff=lfs merge=lfs -text
|
| 186 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000008/references/ref_red_device.png filter=lfs diff=lfs merge=lfs -text
|
| 187 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000008/references/ref_silhouette_with_phone.png filter=lfs diff=lfs merge=lfs -text
|
| 188 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000009/bbox_overlay.png filter=lfs diff=lfs merge=lfs -text
|
| 189 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000009/crops/detect_refine_blue_cleaner_bottle.png filter=lfs diff=lfs merge=lfs -text
|
| 190 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000009/crops/detect_refine_person_washing_sink.png filter=lfs diff=lfs merge=lfs -text
|
| 191 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000009/crops/detect_refine_red_sink_mat.png filter=lfs diff=lfs merge=lfs -text
|
| 192 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000009/crops/detect_refine_silver_faucet.png filter=lfs diff=lfs merge=lfs -text
|
| 193 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000009/crops/detect_refine_yellow_dish_gloves.png filter=lfs diff=lfs merge=lfs -text
|
| 194 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000009/crops/diversify_input_blue_cleaner_bottle.png filter=lfs diff=lfs merge=lfs -text
|
| 195 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000009/crops/diversify_input_person_washing_sink.png filter=lfs diff=lfs merge=lfs -text
|
| 196 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000009/crops/diversify_input_red_sink_mat.png filter=lfs diff=lfs merge=lfs -text
|
| 197 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000009/crops/diversify_input_silver_faucet.png filter=lfs diff=lfs merge=lfs -text
|
| 198 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000009/crops/diversify_input_yellow_dish_gloves.png filter=lfs diff=lfs merge=lfs -text
|
| 199 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000009/main_image.png filter=lfs diff=lfs merge=lfs -text
|
| 200 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000009/references/ref_blue_cleaner_bottle.png filter=lfs diff=lfs merge=lfs -text
|
| 201 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000009/references/ref_person_washing_sink.png filter=lfs diff=lfs merge=lfs -text
|
| 202 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000009/references/ref_red_sink_mat.png filter=lfs diff=lfs merge=lfs -text
|
| 203 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000009/references/ref_silver_faucet.png filter=lfs diff=lfs merge=lfs -text
|
| 204 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000009/references/ref_yellow_dish_gloves.png filter=lfs diff=lfs merge=lfs -text
|
| 205 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000010/bbox_overlay.png filter=lfs diff=lfs merge=lfs -text
|
| 206 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000010/crops/detect_refine_hands_gesturing.png filter=lfs diff=lfs merge=lfs -text
|
| 207 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000010/crops/detect_refine_person_face_in_red_light.png filter=lfs diff=lfs merge=lfs -text
|
| 208 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000010/crops/detect_refine_person_holding_blue_flashlight.png filter=lfs diff=lfs merge=lfs -text
|
| 209 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000010/crops/detect_refine_person_reading_red_light.png filter=lfs diff=lfs merge=lfs -text
|
| 210 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000010/crops/detect_refine_person_standing_background.png filter=lfs diff=lfs merge=lfs -text
|
| 211 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000010/crops/diversify_input_hands_holding_triangular_object.png filter=lfs diff=lfs merge=lfs -text
|
| 212 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000010/crops/diversify_input_person_holding_blue_flashlight.png filter=lfs diff=lfs merge=lfs -text
|
| 213 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000010/crops/diversify_input_person_lying_reading_blue_light.png filter=lfs diff=lfs merge=lfs -text
|
| 214 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000010/crops/diversify_input_person_reading_red_light.png filter=lfs diff=lfs merge=lfs -text
|
| 215 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000010/crops/diversify_input_person_standing_background.png filter=lfs diff=lfs merge=lfs -text
|
| 216 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000010/main_image.png filter=lfs diff=lfs merge=lfs -text
|
| 217 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000010/references/ref_hands_gesturing.png filter=lfs diff=lfs merge=lfs -text
|
| 218 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000010/references/ref_hands_holding_small_object.png filter=lfs diff=lfs merge=lfs -text
|
| 219 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000010/references/ref_hands_holding_triangular_object.png filter=lfs diff=lfs merge=lfs -text
|
| 220 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000010/references/ref_person_face_in_red_light.png filter=lfs diff=lfs merge=lfs -text
|
| 221 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000010/references/ref_person_holding_blue_flashlight.png filter=lfs diff=lfs merge=lfs -text
|
| 222 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000010/references/ref_person_lying_reading_blue_light.png filter=lfs diff=lfs merge=lfs -text
|
| 223 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000010/references/ref_person_reading_red_light.png filter=lfs diff=lfs merge=lfs -text
|
| 224 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000010/references/ref_person_standing_background.png filter=lfs diff=lfs merge=lfs -text
|
| 225 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000010/references/ref_plastic_water_bottle.png filter=lfs diff=lfs merge=lfs -text
|
| 226 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000011/bbox_overlay.png filter=lfs diff=lfs merge=lfs -text
|
| 227 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000011/crops/detect_refine_granite_counter.png filter=lfs diff=lfs merge=lfs -text
|
| 228 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000011/crops/detect_refine_person_hands.png filter=lfs diff=lfs merge=lfs -text
|
| 229 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000011/crops/detect_refine_textured_mat.png filter=lfs diff=lfs merge=lfs -text
|
| 230 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000011/crops/detect_refine_wooden_cabinets.png filter=lfs diff=lfs merge=lfs -text
|
| 231 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000011/crops/diversify_input_granite_counter.png filter=lfs diff=lfs merge=lfs -text
|
| 232 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000011/crops/diversify_input_person_hands.png filter=lfs diff=lfs merge=lfs -text
|
| 233 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000011/crops/diversify_input_textured_mat.png filter=lfs diff=lfs merge=lfs -text
|
| 234 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000011/crops/diversify_input_wall_shelf.png filter=lfs diff=lfs merge=lfs -text
|
| 235 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000011/crops/diversify_input_wooden_cabinets.png filter=lfs diff=lfs merge=lfs -text
|
| 236 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000011/main_image.png filter=lfs diff=lfs merge=lfs -text
|
| 237 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000011/references/ref_box_grater.png filter=lfs diff=lfs merge=lfs -text
|
| 238 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000011/references/ref_dirty_plate.png filter=lfs diff=lfs merge=lfs -text
|
| 239 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000011/references/ref_glass_bottle.png filter=lfs diff=lfs merge=lfs -text
|
| 240 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000011/references/ref_granite_counter.png filter=lfs diff=lfs merge=lfs -text
|
| 241 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000011/references/ref_metal_tool.png filter=lfs diff=lfs merge=lfs -text
|
| 242 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000011/references/ref_person_hands.png filter=lfs diff=lfs merge=lfs -text
|
| 243 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000011/references/ref_striped_towel.png filter=lfs diff=lfs merge=lfs -text
|
| 244 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000011/references/ref_textured_mat.png filter=lfs diff=lfs merge=lfs -text
|
| 245 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000011/references/ref_wall_shelf.png filter=lfs diff=lfs merge=lfs -text
|
| 246 |
+
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/sample_000011/references/ref_wooden_cabinets.png filter=lfs diff=lfs merge=lfs -text
|
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/README.md
ADDED
|
@@ -0,0 +1,16 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# samples_v8
|
| 2 |
+
|
| 3 |
+
Generated with `data_recipe_v8.md`: vocabulary-first planning, adaptive canvas selection, structured JSON compose prompts, no identity verification, no gate, SAM white-background reference postprocessing, and strict reference-completeness verification with regenerate-until-pass behavior.
|
| 4 |
+
|
| 5 |
+
- chat model: `gcp/google/gemini-3.1-pro-preview`
|
| 6 |
+
- image model: `gcp/google/gemini-3-pro-image-preview`
|
| 7 |
+
- people references: `white_bg_full_body_front`
|
| 8 |
+
- non-person references: `white_bg_encyclopedia_photo`
|
| 9 |
+
- SAM postprocess: every generated reference is segmented with `sam_vit_b` and pasted onto pure `#ffffff` background
|
| 10 |
+
- reference verify max attempts per subject: `10`
|
| 11 |
+
- allowed canvases: `[{"aspect_ratio": "1:1", "size": [1024, 1024], "style": "photorealistic"}, {"aspect_ratio": "4:3", "size": [1152, 864], "style": "photorealistic"}, {"aspect_ratio": "3:4", "size": [864, 1152], "style": "photorealistic"}, {"aspect_ratio": "3:2", "size": [1248, 832], "style": "photorealistic"}, {"aspect_ratio": "2:3", "size": [832, 1248], "style": "photorealistic"}, {"aspect_ratio": "16:9", "size": [1280, 720], "style": "photorealistic"}, {"aspect_ratio": "9:16", "size": [720, 1280], "style": "photorealistic"}]`
|
| 12 |
+
- scenario mode: `general`
|
| 13 |
+
- pools: `vocab_task_pool`, `plan_pool`, `scene_pool`, `detection_pool`, `reference_pool`
|
| 14 |
+
- bbox overlay: `bbox_overlay.png` draws every planned subject bbox; a sample is rejected and regenerated if any planned subject is still missing after VLM detection retries
|
| 15 |
+
- detection max attempts per subject: `3`
|
| 16 |
+
- launch args: `{"compose_workers": 3, "detect_max_attempts": 3, "detect_workers": 3, "emit_workers": 4, "idle_sleep": 1.0, "image_inflight": 32, "image_interval": 0.05, "image_max_retries": 8, "max_retries": 3, "no_topup": false, "plan_workers": 6, "ref_verify_max_attempts": 10, "reference_workers": 6, "requeue_in_progress": true, "seed": 1781927993, "status_interval": 30.0, "subject_detect_workers": 24, "target_samples": 10}`
|
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/dataset.json
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/dataset.jsonl
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/detection_pool/done/sample_000001.json
ADDED
|
@@ -0,0 +1,16 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"sample_id": "sample_000001",
|
| 3 |
+
"plan_path": "sample_000001/plan.json",
|
| 4 |
+
"task_path": "sample_000001/vocab_task.json",
|
| 5 |
+
"main_image": "sample_000001/main_image.png",
|
| 6 |
+
"detections": "sample_000001/detections.json",
|
| 7 |
+
"n_detected": 3,
|
| 8 |
+
"model_ids": {
|
| 9 |
+
"chat_model": "gcp/google/gemini-3.1-pro-preview",
|
| 10 |
+
"image_model": "gcp/google/gemini-3-pro-image-preview"
|
| 11 |
+
},
|
| 12 |
+
"item_id": "sample_000001",
|
| 13 |
+
"pool": "detection_pool",
|
| 14 |
+
"retry_count": 0,
|
| 15 |
+
"errors": []
|
| 16 |
+
}
|
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/detection_pool/done/sample_000003.json
ADDED
|
@@ -0,0 +1,16 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"sample_id": "sample_000003",
|
| 3 |
+
"plan_path": "sample_000003/plan.json",
|
| 4 |
+
"task_path": "sample_000003/vocab_task.json",
|
| 5 |
+
"main_image": "sample_000003/main_image.png",
|
| 6 |
+
"detections": "sample_000003/detections.json",
|
| 7 |
+
"n_detected": 3,
|
| 8 |
+
"model_ids": {
|
| 9 |
+
"chat_model": "gcp/google/gemini-3.1-pro-preview",
|
| 10 |
+
"image_model": "gcp/google/gemini-3-pro-image-preview"
|
| 11 |
+
},
|
| 12 |
+
"item_id": "sample_000003",
|
| 13 |
+
"pool": "detection_pool",
|
| 14 |
+
"retry_count": 0,
|
| 15 |
+
"errors": []
|
| 16 |
+
}
|
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/detection_pool/done/sample_000004.json
ADDED
|
@@ -0,0 +1,16 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"sample_id": "sample_000004",
|
| 3 |
+
"plan_path": "sample_000004/plan.json",
|
| 4 |
+
"task_path": "sample_000004/vocab_task.json",
|
| 5 |
+
"main_image": "sample_000004/main_image.png",
|
| 6 |
+
"detections": "sample_000004/detections.json",
|
| 7 |
+
"n_detected": 5,
|
| 8 |
+
"model_ids": {
|
| 9 |
+
"chat_model": "gcp/google/gemini-3.1-pro-preview",
|
| 10 |
+
"image_model": "gcp/google/gemini-3-pro-image-preview"
|
| 11 |
+
},
|
| 12 |
+
"item_id": "sample_000004",
|
| 13 |
+
"pool": "detection_pool",
|
| 14 |
+
"retry_count": 0,
|
| 15 |
+
"errors": []
|
| 16 |
+
}
|
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/detection_pool/done/sample_000005.json
ADDED
|
@@ -0,0 +1,16 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"sample_id": "sample_000005",
|
| 3 |
+
"plan_path": "sample_000005/plan.json",
|
| 4 |
+
"task_path": "sample_000005/vocab_task.json",
|
| 5 |
+
"main_image": "sample_000005/main_image.png",
|
| 6 |
+
"detections": "sample_000005/detections.json",
|
| 7 |
+
"n_detected": 6,
|
| 8 |
+
"model_ids": {
|
| 9 |
+
"chat_model": "gcp/google/gemini-3.1-pro-preview",
|
| 10 |
+
"image_model": "gcp/google/gemini-3-pro-image-preview"
|
| 11 |
+
},
|
| 12 |
+
"item_id": "sample_000005",
|
| 13 |
+
"pool": "detection_pool",
|
| 14 |
+
"retry_count": 0,
|
| 15 |
+
"errors": []
|
| 16 |
+
}
|
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/detection_pool/done/sample_000006.json
ADDED
|
@@ -0,0 +1,16 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"sample_id": "sample_000006",
|
| 3 |
+
"plan_path": "sample_000006/plan.json",
|
| 4 |
+
"task_path": "sample_000006/vocab_task.json",
|
| 5 |
+
"main_image": "sample_000006/main_image.png",
|
| 6 |
+
"detections": "sample_000006/detections.json",
|
| 7 |
+
"n_detected": 8,
|
| 8 |
+
"model_ids": {
|
| 9 |
+
"chat_model": "gcp/google/gemini-3.1-pro-preview",
|
| 10 |
+
"image_model": "gcp/google/gemini-3-pro-image-preview"
|
| 11 |
+
},
|
| 12 |
+
"item_id": "sample_000006",
|
| 13 |
+
"pool": "detection_pool",
|
| 14 |
+
"retry_count": 0,
|
| 15 |
+
"errors": []
|
| 16 |
+
}
|
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/detection_pool/done/sample_000007.json
ADDED
|
@@ -0,0 +1,32 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"sample_id": "sample_000007",
|
| 3 |
+
"plan_path": "sample_000007/plan.json",
|
| 4 |
+
"task_path": "sample_000007/vocab_task.json",
|
| 5 |
+
"main_image": "sample_000007/main_image.png",
|
| 6 |
+
"detections": "sample_000007/detections.json",
|
| 7 |
+
"n_detected": 14,
|
| 8 |
+
"model_ids": {
|
| 9 |
+
"chat_model": "gcp/google/gemini-3.1-pro-preview",
|
| 10 |
+
"image_model": "gcp/google/gemini-3-pro-image-preview"
|
| 11 |
+
},
|
| 12 |
+
"item_id": "sample_000007",
|
| 13 |
+
"pool": "detection_pool",
|
| 14 |
+
"retry_count": 3,
|
| 15 |
+
"errors": [
|
| 16 |
+
{
|
| 17 |
+
"time": 1782260885.2187717,
|
| 18 |
+
"error": "RuntimeError: reference generation or verification failed for dark_area: RuntimeError: reference verification failed for dark_area after 10 attempts: Intended subject 'dark area' is entirely absent; Image shows a cardboard box instead of the requested subject",
|
| 19 |
+
"traceback": "Traceback (most recent call last):\n File \"/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/samples_v8/generate_samples_v8.py\", line 866, in generate_references\n references.append(helpers.diversify_subject(get_client(), sdir, main_image, subject, detection))\n ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n File \"/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/samples_v8/v8_helpers.py\", line 693, in diversify_subject\n raise RuntimeError(\nRuntimeError: reference verification failed for dark_area after 10 attempts: Intended subject 'dark area' is entirely absent; Image shows a cardboard box instead of the requested subject\n\nThe above exception was the direct cause of the following exception:\n\nTraceback (most recent call last):\n File \"/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/samples_v8/generate_samples_v8.py\", line 1020, in worker_loop\n handler(manifest)\n File \"/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/samples_v8/generate_samples_v8.py\", line 1113, in handler\n references, reference_errors = generate_references(sample_id, plan, detections)\n ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n File \"/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/samples_v8/generate_samples_v8.py\", line 871, in generate_references\n raise RuntimeError(f\"reference generation or verification failed for {name}: {errors[name]}\") from exc\nRuntimeError: reference generation or verification failed for dark_area: RuntimeError: reference verification failed for dark_area after 10 attempts: Intended subject 'dark area' is entirely absent; Image shows a cardboard box instead of the requested subject\n"
|
| 20 |
+
},
|
| 21 |
+
{
|
| 22 |
+
"time": 1782261302.7464893,
|
| 23 |
+
"error": "RuntimeError: reference generation or verification failed for dark_area: RuntimeError: reference verification failed for dark_area after 10 attempts: Intended subject is absent; image shows a cardboard box instead of a dark shadowed area.",
|
| 24 |
+
"traceback": "Traceback (most recent call last):\n File \"/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/samples_v8/generate_samples_v8.py\", line 866, in generate_references\n references.append(helpers.diversify_subject(get_client(), sdir, main_image, subject, detection))\n ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n File \"/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/samples_v8/v8_helpers.py\", line 693, in diversify_subject\n raise RuntimeError(\nRuntimeError: reference verification failed for dark_area after 10 attempts: Intended subject is absent; image shows a cardboard box instead of a dark shadowed area.\n\nThe above exception was the direct cause of the following exception:\n\nTraceback (most recent call last):\n File \"/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/samples_v8/generate_samples_v8.py\", line 1020, in worker_loop\n handler(manifest)\n File \"/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/samples_v8/generate_samples_v8.py\", line 1113, in handler\n references, reference_errors = generate_references(sample_id, plan, detections)\n ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n File \"/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/samples_v8/generate_samples_v8.py\", line 871, in generate_references\n raise RuntimeError(f\"reference generation or verification failed for {name}: {errors[name]}\") from exc\nRuntimeError: reference generation or verification failed for dark_area: RuntimeError: reference verification failed for dark_area after 10 attempts: Intended subject is absent; image shows a cardboard box instead of a dark shadowed area.\n"
|
| 25 |
+
},
|
| 26 |
+
{
|
| 27 |
+
"time": 1782261717.330226,
|
| 28 |
+
"error": "RuntimeError: reference generation or verification failed for dark_area: RuntimeError: reference verification failed for dark_area after 10 attempts: Intended subject 'dark_area' is absent.; Image shows a cardboard box instead of the requested subject.",
|
| 29 |
+
"traceback": "Traceback (most recent call last):\n File \"/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/samples_v8/generate_samples_v8.py\", line 866, in generate_references\n references.append(helpers.diversify_subject(get_client(), sdir, main_image, subject, detection))\n ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n File \"/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/samples_v8/v8_helpers.py\", line 693, in diversify_subject\n raise RuntimeError(\nRuntimeError: reference verification failed for dark_area after 10 attempts: Intended subject 'dark_area' is absent.; Image shows a cardboard box instead of the requested subject.\n\nThe above exception was the direct cause of the following exception:\n\nTraceback (most recent call last):\n File \"/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/samples_v8/generate_samples_v8.py\", line 1020, in worker_loop\n handler(manifest)\n File \"/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/samples_v8/generate_samples_v8.py\", line 1113, in handler\n references, reference_errors = generate_references(sample_id, plan, detections)\n ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n File \"/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/samples_v8/generate_samples_v8.py\", line 871, in generate_references\n raise RuntimeError(f\"reference generation or verification failed for {name}: {errors[name]}\") from exc\nRuntimeError: reference generation or verification failed for dark_area: RuntimeError: reference verification failed for dark_area after 10 attempts: Intended subject 'dark_area' is absent.; Image shows a cardboard box instead of the requested subject.\n"
|
| 30 |
+
}
|
| 31 |
+
]
|
| 32 |
+
}
|
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/detection_pool/done/sample_000008.json
ADDED
|
@@ -0,0 +1,16 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"sample_id": "sample_000008",
|
| 3 |
+
"plan_path": "sample_000008/plan.json",
|
| 4 |
+
"task_path": "sample_000008/vocab_task.json",
|
| 5 |
+
"main_image": "sample_000008/main_image.png",
|
| 6 |
+
"detections": "sample_000008/detections.json",
|
| 7 |
+
"n_detected": 10,
|
| 8 |
+
"model_ids": {
|
| 9 |
+
"chat_model": "gcp/google/gemini-3.1-pro-preview",
|
| 10 |
+
"image_model": "gcp/google/gemini-3-pro-image-preview"
|
| 11 |
+
},
|
| 12 |
+
"item_id": "sample_000008",
|
| 13 |
+
"pool": "detection_pool",
|
| 14 |
+
"retry_count": 0,
|
| 15 |
+
"errors": []
|
| 16 |
+
}
|
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/detection_pool/done/sample_000009.json
ADDED
|
@@ -0,0 +1,16 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"sample_id": "sample_000009",
|
| 3 |
+
"plan_path": "sample_000009/plan.json",
|
| 4 |
+
"task_path": "sample_000009/vocab_task.json",
|
| 5 |
+
"main_image": "sample_000009/main_image.png",
|
| 6 |
+
"detections": "sample_000009/detections.json",
|
| 7 |
+
"n_detected": 5,
|
| 8 |
+
"model_ids": {
|
| 9 |
+
"chat_model": "gcp/google/gemini-3.1-pro-preview",
|
| 10 |
+
"image_model": "gcp/google/gemini-3-pro-image-preview"
|
| 11 |
+
},
|
| 12 |
+
"item_id": "sample_000009",
|
| 13 |
+
"pool": "detection_pool",
|
| 14 |
+
"retry_count": 0,
|
| 15 |
+
"errors": []
|
| 16 |
+
}
|
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/detection_pool/done/sample_000010.json
ADDED
|
@@ -0,0 +1,16 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"sample_id": "sample_000010",
|
| 3 |
+
"plan_path": "sample_000010/plan.json",
|
| 4 |
+
"task_path": "sample_000010/vocab_task.json",
|
| 5 |
+
"main_image": "sample_000010/main_image.png",
|
| 6 |
+
"detections": "sample_000010/detections.json",
|
| 7 |
+
"n_detected": 9,
|
| 8 |
+
"model_ids": {
|
| 9 |
+
"chat_model": "gcp/google/gemini-3.1-pro-preview",
|
| 10 |
+
"image_model": "gcp/google/gemini-3-pro-image-preview"
|
| 11 |
+
},
|
| 12 |
+
"item_id": "sample_000010",
|
| 13 |
+
"pool": "detection_pool",
|
| 14 |
+
"retry_count": 0,
|
| 15 |
+
"errors": []
|
| 16 |
+
}
|
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/detection_pool/done/sample_000011.json
ADDED
|
@@ -0,0 +1,16 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"sample_id": "sample_000011",
|
| 3 |
+
"plan_path": "sample_000011/plan.json",
|
| 4 |
+
"task_path": "sample_000011/vocab_task.json",
|
| 5 |
+
"main_image": "sample_000011/main_image.png",
|
| 6 |
+
"detections": "sample_000011/detections.json",
|
| 7 |
+
"n_detected": 10,
|
| 8 |
+
"model_ids": {
|
| 9 |
+
"chat_model": "gcp/google/gemini-3.1-pro-preview",
|
| 10 |
+
"image_model": "gcp/google/gemini-3-pro-image-preview"
|
| 11 |
+
},
|
| 12 |
+
"item_id": "sample_000011",
|
| 13 |
+
"pool": "detection_pool",
|
| 14 |
+
"retry_count": 0,
|
| 15 |
+
"errors": []
|
| 16 |
+
}
|
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/emit_pool/done/sample_000001.json
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"sample_id": "sample_000001",
|
| 3 |
+
"row": "sample_000001/row.json"
|
| 4 |
+
}
|
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/emit_pool/done/sample_000003.json
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"sample_id": "sample_000003",
|
| 3 |
+
"row": "sample_000003/row.json"
|
| 4 |
+
}
|
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/emit_pool/done/sample_000004.json
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"sample_id": "sample_000004",
|
| 3 |
+
"row": "sample_000004/row.json"
|
| 4 |
+
}
|
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/emit_pool/done/sample_000005.json
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"sample_id": "sample_000005",
|
| 3 |
+
"row": "sample_000005/row.json"
|
| 4 |
+
}
|
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/emit_pool/done/sample_000006.json
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"sample_id": "sample_000006",
|
| 3 |
+
"row": "sample_000006/row.json"
|
| 4 |
+
}
|
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/emit_pool/done/sample_000007.json
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"sample_id": "sample_000007",
|
| 3 |
+
"row": "sample_000007/row.json"
|
| 4 |
+
}
|
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/emit_pool/done/sample_000008.json
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"sample_id": "sample_000008",
|
| 3 |
+
"row": "sample_000008/row.json"
|
| 4 |
+
}
|
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/emit_pool/done/sample_000009.json
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"sample_id": "sample_000009",
|
| 3 |
+
"row": "sample_000009/row.json"
|
| 4 |
+
}
|
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/emit_pool/done/sample_000010.json
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"sample_id": "sample_000010",
|
| 3 |
+
"row": "sample_000010/row.json"
|
| 4 |
+
}
|
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/emit_pool/done/sample_000011.json
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"sample_id": "sample_000011",
|
| 3 |
+
"row": "sample_000011/row.json"
|
| 4 |
+
}
|
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/plan_pool/done/sample_000001.json
ADDED
|
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"sample_id": "sample_000001",
|
| 3 |
+
"plan_path": "sample_000001/plan.json",
|
| 4 |
+
"task_path": "sample_000001/vocab_task.json",
|
| 5 |
+
"prompt_hash": "de111ef88cac721a573e1463080c7ef8f709ab3311c0be649576445c9637d6d5",
|
| 6 |
+
"model_ids": {
|
| 7 |
+
"chat_model": "gcp/google/gemini-3.1-pro-preview",
|
| 8 |
+
"image_model": "gcp/google/gemini-3-pro-image-preview"
|
| 9 |
+
},
|
| 10 |
+
"item_id": "sample_000001",
|
| 11 |
+
"pool": "plan_pool",
|
| 12 |
+
"retry_count": 0,
|
| 13 |
+
"errors": []
|
| 14 |
+
}
|
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/plan_pool/done/sample_000002.json
ADDED
|
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"sample_id": "sample_000002",
|
| 3 |
+
"plan_path": "sample_000002/plan.json",
|
| 4 |
+
"task_path": "sample_000002/vocab_task.json",
|
| 5 |
+
"prompt_hash": "124ba3f0479caaeb5896d579dbace9891cca2fb6875690fdb3f66ee3524a7e9e",
|
| 6 |
+
"model_ids": {
|
| 7 |
+
"chat_model": "gcp/google/gemini-3.1-pro-preview",
|
| 8 |
+
"image_model": "gcp/google/gemini-3-pro-image-preview"
|
| 9 |
+
},
|
| 10 |
+
"item_id": "sample_000002",
|
| 11 |
+
"pool": "plan_pool",
|
| 12 |
+
"retry_count": 0,
|
| 13 |
+
"errors": []
|
| 14 |
+
}
|
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/plan_pool/done/sample_000003.json
ADDED
|
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"sample_id": "sample_000003",
|
| 3 |
+
"plan_path": "sample_000003/plan.json",
|
| 4 |
+
"task_path": "sample_000003/vocab_task.json",
|
| 5 |
+
"prompt_hash": "63e951d22cadbf6e15b5fd08f5054b228df47fc857c4e48e47c23160da12a111",
|
| 6 |
+
"model_ids": {
|
| 7 |
+
"chat_model": "gcp/google/gemini-3.1-pro-preview",
|
| 8 |
+
"image_model": "gcp/google/gemini-3-pro-image-preview"
|
| 9 |
+
},
|
| 10 |
+
"item_id": "sample_000003",
|
| 11 |
+
"pool": "plan_pool",
|
| 12 |
+
"retry_count": 0,
|
| 13 |
+
"errors": []
|
| 14 |
+
}
|
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/plan_pool/done/sample_000004.json
ADDED
|
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"sample_id": "sample_000004",
|
| 3 |
+
"plan_path": "sample_000004/plan.json",
|
| 4 |
+
"task_path": "sample_000004/vocab_task.json",
|
| 5 |
+
"prompt_hash": "3f5c74d4cad870d092def8f4466e975d281c99678ca962809503c5c456a06f49",
|
| 6 |
+
"model_ids": {
|
| 7 |
+
"chat_model": "gcp/google/gemini-3.1-pro-preview",
|
| 8 |
+
"image_model": "gcp/google/gemini-3-pro-image-preview"
|
| 9 |
+
},
|
| 10 |
+
"item_id": "sample_000004",
|
| 11 |
+
"pool": "plan_pool",
|
| 12 |
+
"retry_count": 0,
|
| 13 |
+
"errors": []
|
| 14 |
+
}
|
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/plan_pool/done/sample_000005.json
ADDED
|
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"sample_id": "sample_000005",
|
| 3 |
+
"plan_path": "sample_000005/plan.json",
|
| 4 |
+
"task_path": "sample_000005/vocab_task.json",
|
| 5 |
+
"prompt_hash": "946054fe68ce2e3f63d85b3eddd1a3e63af4d647ef6dc47764d65eb13cf867f4",
|
| 6 |
+
"model_ids": {
|
| 7 |
+
"chat_model": "gcp/google/gemini-3.1-pro-preview",
|
| 8 |
+
"image_model": "gcp/google/gemini-3-pro-image-preview"
|
| 9 |
+
},
|
| 10 |
+
"item_id": "sample_000005",
|
| 11 |
+
"pool": "plan_pool",
|
| 12 |
+
"retry_count": 0,
|
| 13 |
+
"errors": []
|
| 14 |
+
}
|
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/plan_pool/done/sample_000006.json
ADDED
|
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"sample_id": "sample_000006",
|
| 3 |
+
"plan_path": "sample_000006/plan.json",
|
| 4 |
+
"task_path": "sample_000006/vocab_task.json",
|
| 5 |
+
"prompt_hash": "006a1741e37f4e2fda0c82cbfbd7c6119932755e84be0002d17055a7af25bb79",
|
| 6 |
+
"model_ids": {
|
| 7 |
+
"chat_model": "gcp/google/gemini-3.1-pro-preview",
|
| 8 |
+
"image_model": "gcp/google/gemini-3-pro-image-preview"
|
| 9 |
+
},
|
| 10 |
+
"item_id": "sample_000006",
|
| 11 |
+
"pool": "plan_pool",
|
| 12 |
+
"retry_count": 0,
|
| 13 |
+
"errors": []
|
| 14 |
+
}
|
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/plan_pool/done/sample_000007.json
ADDED
|
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"sample_id": "sample_000007",
|
| 3 |
+
"plan_path": "sample_000007/plan.json",
|
| 4 |
+
"task_path": "sample_000007/vocab_task.json",
|
| 5 |
+
"prompt_hash": "e999f398d25887be57aad833cb2b38dd0d1b370d4b6b6019fbde86bc6c809c69",
|
| 6 |
+
"model_ids": {
|
| 7 |
+
"chat_model": "gcp/google/gemini-3.1-pro-preview",
|
| 8 |
+
"image_model": "gcp/google/gemini-3-pro-image-preview"
|
| 9 |
+
},
|
| 10 |
+
"item_id": "sample_000007",
|
| 11 |
+
"pool": "plan_pool",
|
| 12 |
+
"retry_count": 0,
|
| 13 |
+
"errors": []
|
| 14 |
+
}
|
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/plan_pool/done/sample_000008.json
ADDED
|
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"sample_id": "sample_000008",
|
| 3 |
+
"plan_path": "sample_000008/plan.json",
|
| 4 |
+
"task_path": "sample_000008/vocab_task.json",
|
| 5 |
+
"prompt_hash": "63aefc9a503e34719b1b91ec3397c9b92dc92ff7ce2c14e2c7bbe458bad64ba1",
|
| 6 |
+
"model_ids": {
|
| 7 |
+
"chat_model": "gcp/google/gemini-3.1-pro-preview",
|
| 8 |
+
"image_model": "gcp/google/gemini-3-pro-image-preview"
|
| 9 |
+
},
|
| 10 |
+
"item_id": "sample_000008",
|
| 11 |
+
"pool": "plan_pool",
|
| 12 |
+
"retry_count": 0,
|
| 13 |
+
"errors": []
|
| 14 |
+
}
|
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/plan_pool/done/sample_000009.json
ADDED
|
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"sample_id": "sample_000009",
|
| 3 |
+
"plan_path": "sample_000009/plan.json",
|
| 4 |
+
"task_path": "sample_000009/vocab_task.json",
|
| 5 |
+
"prompt_hash": "929afc2e2f3cfd582eb2c6b53c41f60141480cb35a1ce251ed1752a6e98ba9ea",
|
| 6 |
+
"model_ids": {
|
| 7 |
+
"chat_model": "gcp/google/gemini-3.1-pro-preview",
|
| 8 |
+
"image_model": "gcp/google/gemini-3-pro-image-preview"
|
| 9 |
+
},
|
| 10 |
+
"item_id": "sample_000009",
|
| 11 |
+
"pool": "plan_pool",
|
| 12 |
+
"retry_count": 0,
|
| 13 |
+
"errors": []
|
| 14 |
+
}
|
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/plan_pool/done/sample_000010.json
ADDED
|
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"sample_id": "sample_000010",
|
| 3 |
+
"plan_path": "sample_000010/plan.json",
|
| 4 |
+
"task_path": "sample_000010/vocab_task.json",
|
| 5 |
+
"prompt_hash": "74f4fe54dda8f633b152876c6b6433d4a90a0421304dd6db44bd84b9519110f8",
|
| 6 |
+
"model_ids": {
|
| 7 |
+
"chat_model": "gcp/google/gemini-3.1-pro-preview",
|
| 8 |
+
"image_model": "gcp/google/gemini-3-pro-image-preview"
|
| 9 |
+
},
|
| 10 |
+
"item_id": "sample_000010",
|
| 11 |
+
"pool": "plan_pool",
|
| 12 |
+
"retry_count": 0,
|
| 13 |
+
"errors": []
|
| 14 |
+
}
|
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/plan_pool/done/sample_000011.json
ADDED
|
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"sample_id": "sample_000011",
|
| 3 |
+
"plan_path": "sample_000011/plan.json",
|
| 4 |
+
"task_path": "sample_000011/vocab_task.json",
|
| 5 |
+
"prompt_hash": "e6c24d29d9d4a97828419fab43954232185614106bdd1c11f6a196e5398eabbc",
|
| 6 |
+
"model_ids": {
|
| 7 |
+
"chat_model": "gcp/google/gemini-3.1-pro-preview",
|
| 8 |
+
"image_model": "gcp/google/gemini-3-pro-image-preview"
|
| 9 |
+
},
|
| 10 |
+
"item_id": "sample_000011",
|
| 11 |
+
"pool": "plan_pool",
|
| 12 |
+
"retry_count": 0,
|
| 13 |
+
"errors": []
|
| 14 |
+
}
|
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/reference_pool/done/sample_000001.json
ADDED
|
@@ -0,0 +1,18 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"sample_id": "sample_000001",
|
| 3 |
+
"plan_path": "sample_000001/plan.json",
|
| 4 |
+
"task_path": "sample_000001/vocab_task.json",
|
| 5 |
+
"main_image": "sample_000001/main_image.png",
|
| 6 |
+
"detections": "sample_000001/detections.json",
|
| 7 |
+
"references": "sample_000001/references.json",
|
| 8 |
+
"n_references": 3,
|
| 9 |
+
"reference_errors": {},
|
| 10 |
+
"model_ids": {
|
| 11 |
+
"chat_model": "gcp/google/gemini-3.1-pro-preview",
|
| 12 |
+
"image_model": "gcp/google/gemini-3-pro-image-preview"
|
| 13 |
+
},
|
| 14 |
+
"item_id": "sample_000001",
|
| 15 |
+
"pool": "reference_pool",
|
| 16 |
+
"retry_count": 0,
|
| 17 |
+
"errors": []
|
| 18 |
+
}
|
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/reference_pool/done/sample_000003.json
ADDED
|
@@ -0,0 +1,18 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"sample_id": "sample_000003",
|
| 3 |
+
"plan_path": "sample_000003/plan.json",
|
| 4 |
+
"task_path": "sample_000003/vocab_task.json",
|
| 5 |
+
"main_image": "sample_000003/main_image.png",
|
| 6 |
+
"detections": "sample_000003/detections.json",
|
| 7 |
+
"references": "sample_000003/references.json",
|
| 8 |
+
"n_references": 3,
|
| 9 |
+
"reference_errors": {},
|
| 10 |
+
"model_ids": {
|
| 11 |
+
"chat_model": "gcp/google/gemini-3.1-pro-preview",
|
| 12 |
+
"image_model": "gcp/google/gemini-3-pro-image-preview"
|
| 13 |
+
},
|
| 14 |
+
"item_id": "sample_000003",
|
| 15 |
+
"pool": "reference_pool",
|
| 16 |
+
"retry_count": 0,
|
| 17 |
+
"errors": []
|
| 18 |
+
}
|
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/reference_pool/done/sample_000004.json
ADDED
|
@@ -0,0 +1,18 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"sample_id": "sample_000004",
|
| 3 |
+
"plan_path": "sample_000004/plan.json",
|
| 4 |
+
"task_path": "sample_000004/vocab_task.json",
|
| 5 |
+
"main_image": "sample_000004/main_image.png",
|
| 6 |
+
"detections": "sample_000004/detections.json",
|
| 7 |
+
"references": "sample_000004/references.json",
|
| 8 |
+
"n_references": 3,
|
| 9 |
+
"reference_errors": {},
|
| 10 |
+
"model_ids": {
|
| 11 |
+
"chat_model": "gcp/google/gemini-3.1-pro-preview",
|
| 12 |
+
"image_model": "gcp/google/gemini-3-pro-image-preview"
|
| 13 |
+
},
|
| 14 |
+
"item_id": "sample_000004",
|
| 15 |
+
"pool": "reference_pool",
|
| 16 |
+
"retry_count": 0,
|
| 17 |
+
"errors": []
|
| 18 |
+
}
|
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/reference_pool/done/sample_000005.json
ADDED
|
@@ -0,0 +1,18 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"sample_id": "sample_000005",
|
| 3 |
+
"plan_path": "sample_000005/plan.json",
|
| 4 |
+
"task_path": "sample_000005/vocab_task.json",
|
| 5 |
+
"main_image": "sample_000005/main_image.png",
|
| 6 |
+
"detections": "sample_000005/detections.json",
|
| 7 |
+
"references": "sample_000005/references.json",
|
| 8 |
+
"n_references": 6,
|
| 9 |
+
"reference_errors": {},
|
| 10 |
+
"model_ids": {
|
| 11 |
+
"chat_model": "gcp/google/gemini-3.1-pro-preview",
|
| 12 |
+
"image_model": "gcp/google/gemini-3-pro-image-preview"
|
| 13 |
+
},
|
| 14 |
+
"item_id": "sample_000005",
|
| 15 |
+
"pool": "reference_pool",
|
| 16 |
+
"retry_count": 0,
|
| 17 |
+
"errors": []
|
| 18 |
+
}
|
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/reference_pool/done/sample_000006.json
ADDED
|
@@ -0,0 +1,18 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"sample_id": "sample_000006",
|
| 3 |
+
"plan_path": "sample_000006/plan.json",
|
| 4 |
+
"task_path": "sample_000006/vocab_task.json",
|
| 5 |
+
"main_image": "sample_000006/main_image.png",
|
| 6 |
+
"detections": "sample_000006/detections.json",
|
| 7 |
+
"references": "sample_000006/references.json",
|
| 8 |
+
"n_references": 8,
|
| 9 |
+
"reference_errors": {},
|
| 10 |
+
"model_ids": {
|
| 11 |
+
"chat_model": "gcp/google/gemini-3.1-pro-preview",
|
| 12 |
+
"image_model": "gcp/google/gemini-3-pro-image-preview"
|
| 13 |
+
},
|
| 14 |
+
"item_id": "sample_000006",
|
| 15 |
+
"pool": "reference_pool",
|
| 16 |
+
"retry_count": 0,
|
| 17 |
+
"errors": []
|
| 18 |
+
}
|
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/reference_pool/done/sample_000007.json
ADDED
|
@@ -0,0 +1,18 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"sample_id": "sample_000007",
|
| 3 |
+
"plan_path": "sample_000007/plan.json",
|
| 4 |
+
"task_path": "sample_000007/vocab_task.json",
|
| 5 |
+
"main_image": "sample_000007/main_image.png",
|
| 6 |
+
"detections": "sample_000007/detections.json",
|
| 7 |
+
"references": "sample_000007/references.json",
|
| 8 |
+
"n_references": 14,
|
| 9 |
+
"reference_errors": {},
|
| 10 |
+
"model_ids": {
|
| 11 |
+
"chat_model": "gcp/google/gemini-3.1-pro-preview",
|
| 12 |
+
"image_model": "gcp/google/gemini-3-pro-image-preview"
|
| 13 |
+
},
|
| 14 |
+
"item_id": "sample_000007",
|
| 15 |
+
"pool": "reference_pool",
|
| 16 |
+
"retry_count": 0,
|
| 17 |
+
"errors": []
|
| 18 |
+
}
|
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/reference_pool/done/sample_000008.json
ADDED
|
@@ -0,0 +1,18 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"sample_id": "sample_000008",
|
| 3 |
+
"plan_path": "sample_000008/plan.json",
|
| 4 |
+
"task_path": "sample_000008/vocab_task.json",
|
| 5 |
+
"main_image": "sample_000008/main_image.png",
|
| 6 |
+
"detections": "sample_000008/detections.json",
|
| 7 |
+
"references": "sample_000008/references.json",
|
| 8 |
+
"n_references": 10,
|
| 9 |
+
"reference_errors": {},
|
| 10 |
+
"model_ids": {
|
| 11 |
+
"chat_model": "gcp/google/gemini-3.1-pro-preview",
|
| 12 |
+
"image_model": "gcp/google/gemini-3-pro-image-preview"
|
| 13 |
+
},
|
| 14 |
+
"item_id": "sample_000008",
|
| 15 |
+
"pool": "reference_pool",
|
| 16 |
+
"retry_count": 0,
|
| 17 |
+
"errors": []
|
| 18 |
+
}
|
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/reference_pool/done/sample_000009.json
ADDED
|
@@ -0,0 +1,18 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"sample_id": "sample_000009",
|
| 3 |
+
"plan_path": "sample_000009/plan.json",
|
| 4 |
+
"task_path": "sample_000009/vocab_task.json",
|
| 5 |
+
"main_image": "sample_000009/main_image.png",
|
| 6 |
+
"detections": "sample_000009/detections.json",
|
| 7 |
+
"references": "sample_000009/references.json",
|
| 8 |
+
"n_references": 5,
|
| 9 |
+
"reference_errors": {},
|
| 10 |
+
"model_ids": {
|
| 11 |
+
"chat_model": "gcp/google/gemini-3.1-pro-preview",
|
| 12 |
+
"image_model": "gcp/google/gemini-3-pro-image-preview"
|
| 13 |
+
},
|
| 14 |
+
"item_id": "sample_000009",
|
| 15 |
+
"pool": "reference_pool",
|
| 16 |
+
"retry_count": 0,
|
| 17 |
+
"errors": []
|
| 18 |
+
}
|
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/reference_pool/done/sample_000010.json
ADDED
|
@@ -0,0 +1,18 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"sample_id": "sample_000010",
|
| 3 |
+
"plan_path": "sample_000010/plan.json",
|
| 4 |
+
"task_path": "sample_000010/vocab_task.json",
|
| 5 |
+
"main_image": "sample_000010/main_image.png",
|
| 6 |
+
"detections": "sample_000010/detections.json",
|
| 7 |
+
"references": "sample_000010/references.json",
|
| 8 |
+
"n_references": 9,
|
| 9 |
+
"reference_errors": {},
|
| 10 |
+
"model_ids": {
|
| 11 |
+
"chat_model": "gcp/google/gemini-3.1-pro-preview",
|
| 12 |
+
"image_model": "gcp/google/gemini-3-pro-image-preview"
|
| 13 |
+
},
|
| 14 |
+
"item_id": "sample_000010",
|
| 15 |
+
"pool": "reference_pool",
|
| 16 |
+
"retry_count": 0,
|
| 17 |
+
"errors": []
|
| 18 |
+
}
|
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/reference_pool/done/sample_000011.json
ADDED
|
@@ -0,0 +1,18 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"sample_id": "sample_000011",
|
| 3 |
+
"plan_path": "sample_000011/plan.json",
|
| 4 |
+
"task_path": "sample_000011/vocab_task.json",
|
| 5 |
+
"main_image": "sample_000011/main_image.png",
|
| 6 |
+
"detections": "sample_000011/detections.json",
|
| 7 |
+
"references": "sample_000011/references.json",
|
| 8 |
+
"n_references": 10,
|
| 9 |
+
"reference_errors": {},
|
| 10 |
+
"model_ids": {
|
| 11 |
+
"chat_model": "gcp/google/gemini-3.1-pro-preview",
|
| 12 |
+
"image_model": "gcp/google/gemini-3-pro-image-preview"
|
| 13 |
+
},
|
| 14 |
+
"item_id": "sample_000011",
|
| 15 |
+
"pool": "reference_pool",
|
| 16 |
+
"retry_count": 0,
|
| 17 |
+
"errors": []
|
| 18 |
+
}
|
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/rows/sample_000001.json
ADDED
|
@@ -0,0 +1,164 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"sample_id": "sample_000001",
|
| 3 |
+
"target_total": 3,
|
| 4 |
+
"target_people": 1,
|
| 5 |
+
"target_objects": 2,
|
| 6 |
+
"canvas_size": [
|
| 7 |
+
1248,
|
| 8 |
+
832
|
| 9 |
+
],
|
| 10 |
+
"canvas_aspect_ratio": "3:2",
|
| 11 |
+
"main_image": "main_image.png",
|
| 12 |
+
"bbox_overlay": "bbox_overlay.png",
|
| 13 |
+
"plan": "plan.json",
|
| 14 |
+
"detections": "detections.json",
|
| 15 |
+
"vocab_task": "vocab_task.json",
|
| 16 |
+
"n_planned": 3,
|
| 17 |
+
"n_detected": 3,
|
| 18 |
+
"n_subjects": 3,
|
| 19 |
+
"subjects": [
|
| 20 |
+
{
|
| 21 |
+
"name": "person_in_red_light",
|
| 22 |
+
"is_person": true,
|
| 23 |
+
"subject_type": "person",
|
| 24 |
+
"source_set": "people_set",
|
| 25 |
+
"source_image_id": "Ego4D:ego4d_video/EGO_76251.npy:person:0",
|
| 26 |
+
"source_name": "person",
|
| 27 |
+
"source_description": "Visible by their hands, which are illuminated in bright red light, holding a small object. Source dataset: Ego4D. Scene context: A person's hands are visible in a dark setting, illuminated by a red light, holding and interacting with a small dark object.",
|
| 28 |
+
"sub_caption": "person: A person, prominently visible by their hands and forearms which are bathed in bright red light, holding and interacting with a small dark electronic object.. Scene role: Operating the small device in the foreground",
|
| 29 |
+
"measured_bbox": [
|
| 30 |
+
0.301,
|
| 31 |
+
0.039,
|
| 32 |
+
0.714,
|
| 33 |
+
0.98
|
| 34 |
+
],
|
| 35 |
+
"detection_confidence": 0.95,
|
| 36 |
+
"ref_style": "white_bg_full_body_front",
|
| 37 |
+
"ref_image": "references/ref_person_in_red_light.png",
|
| 38 |
+
"raw_ref_image": "references/raw_ref_person_in_red_light_attempt_01.png",
|
| 39 |
+
"reference_verify": "references/reference_verify_person_in_red_light.json",
|
| 40 |
+
"reference_verify_passed": true,
|
| 41 |
+
"reference_attempts": 1,
|
| 42 |
+
"sam_white_bg": {
|
| 43 |
+
"input": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/chaos/samples/sample_000001/references/raw_ref_person_in_red_light_attempt_01.png",
|
| 44 |
+
"output": "references/ref_person_in_red_light.png",
|
| 45 |
+
"mask": "references/sam_mask_person_in_red_light.png",
|
| 46 |
+
"sam_checkpoint": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/checkpoints/sam/sam_vit_b_01ec64.pth",
|
| 47 |
+
"sam_model_type": "vit_b",
|
| 48 |
+
"sam_device": "auto",
|
| 49 |
+
"sam_working_size": [
|
| 50 |
+
640,
|
| 51 |
+
640
|
| 52 |
+
],
|
| 53 |
+
"sam_max_side": 640,
|
| 54 |
+
"sam_downscale": 0.625,
|
| 55 |
+
"prompt_box_xyxy": [
|
| 56 |
+
324.0,
|
| 57 |
+
26.0,
|
| 58 |
+
699.0,
|
| 59 |
+
1013.0
|
| 60 |
+
],
|
| 61 |
+
"mask_score": 3.392402,
|
| 62 |
+
"mask_area_ratio": 0.165197,
|
| 63 |
+
"elapsed_seconds": 53.7174
|
| 64 |
+
}
|
| 65 |
+
},
|
| 66 |
+
{
|
| 67 |
+
"name": "red_illuminated_structure",
|
| 68 |
+
"is_person": false,
|
| 69 |
+
"subject_type": "object",
|
| 70 |
+
"source_set": "obj_set",
|
| 71 |
+
"source_image_id": "Ego4D:ego4d_video/EGO_2029.npy:object:1",
|
| 72 |
+
"source_name": "red illuminated structure",
|
| 73 |
+
"source_description": "A structure on the right side of the image, possibly a wall or barricade, strongly illuminated with red light, featuring a grid-like or textured pattern. Source dataset: Ego4D. Scene context: A dark, possibly outdoor or poorly lit indoor area illuminated by strong blue and red artificial lights.",
|
| 74 |
+
"sub_caption": "red illuminated structure: A sturdy wall or barricade-like structure featuring a textured, grid-like pattern, strongly illuminated by deep red ambient light.. Scene role: Forms the textured, atmospheric background behind the person",
|
| 75 |
+
"measured_bbox": [
|
| 76 |
+
0.6096,
|
| 77 |
+
0.0,
|
| 78 |
+
0.9961,
|
| 79 |
+
0.991
|
| 80 |
+
],
|
| 81 |
+
"detection_confidence": "high",
|
| 82 |
+
"ref_style": "white_bg_encyclopedia_photo",
|
| 83 |
+
"ref_image": "references/ref_red_illuminated_structure.png",
|
| 84 |
+
"raw_ref_image": "references/raw_ref_red_illuminated_structure_attempt_01.png",
|
| 85 |
+
"reference_verify": "references/reference_verify_red_illuminated_structure.json",
|
| 86 |
+
"reference_verify_passed": true,
|
| 87 |
+
"reference_attempts": 1,
|
| 88 |
+
"sam_white_bg": {
|
| 89 |
+
"input": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/chaos/samples/sample_000001/references/raw_ref_red_illuminated_structure_attempt_01.png",
|
| 90 |
+
"output": "references/ref_red_illuminated_structure.png",
|
| 91 |
+
"mask": "references/sam_mask_red_illuminated_structure.png",
|
| 92 |
+
"sam_checkpoint": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/checkpoints/sam/sam_vit_b_01ec64.pth",
|
| 93 |
+
"sam_model_type": "vit_b",
|
| 94 |
+
"sam_device": "auto",
|
| 95 |
+
"sam_working_size": [
|
| 96 |
+
640,
|
| 97 |
+
640
|
| 98 |
+
],
|
| 99 |
+
"sam_max_side": 640,
|
| 100 |
+
"sam_downscale": 0.625,
|
| 101 |
+
"prompt_box_xyxy": [
|
| 102 |
+
0.0,
|
| 103 |
+
0.0,
|
| 104 |
+
1023.0,
|
| 105 |
+
1023.0
|
| 106 |
+
],
|
| 107 |
+
"mask_score": 1.966617,
|
| 108 |
+
"mask_area_ratio": 0.597257,
|
| 109 |
+
"elapsed_seconds": 10.2671
|
| 110 |
+
}
|
| 111 |
+
},
|
| 112 |
+
{
|
| 113 |
+
"name": "green_indicator_light",
|
| 114 |
+
"is_person": false,
|
| 115 |
+
"subject_type": "object",
|
| 116 |
+
"source_set": "obj_set",
|
| 117 |
+
"source_image_id": "Ego4D:ego4d_video/EGO_294886.npy:object:1",
|
| 118 |
+
"source_name": "green light",
|
| 119 |
+
"source_description": "Small, bright green glowing indicator light, possibly an LED, located on the dark structure. Source dataset: Ego4D. Scene context: An extremely dark scene with only a faint silhouette of an object and a small green indicator light visible.",
|
| 120 |
+
"sub_caption": "green light: A small, bright green glowing LED indicator light piercing through the darkness.. Scene role: Glowing on a dark piece of equipment beside the person, contrasting sharply with the dominant red lighting",
|
| 121 |
+
"measured_bbox": [
|
| 122 |
+
0.1227,
|
| 123 |
+
0.438,
|
| 124 |
+
0.1605,
|
| 125 |
+
0.4975
|
| 126 |
+
],
|
| 127 |
+
"detection_confidence": 0.95,
|
| 128 |
+
"ref_style": "white_bg_encyclopedia_photo",
|
| 129 |
+
"ref_image": "references/ref_green_indicator_light.png",
|
| 130 |
+
"raw_ref_image": "references/raw_ref_green_indicator_light_attempt_01.png",
|
| 131 |
+
"reference_verify": "references/reference_verify_green_indicator_light.json",
|
| 132 |
+
"reference_verify_passed": true,
|
| 133 |
+
"reference_attempts": 1,
|
| 134 |
+
"sam_white_bg": {
|
| 135 |
+
"input": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/chaos/samples/sample_000001/references/raw_ref_green_indicator_light_attempt_01.png",
|
| 136 |
+
"output": "references/ref_green_indicator_light.png",
|
| 137 |
+
"mask": "references/sam_mask_green_indicator_light.png",
|
| 138 |
+
"sam_checkpoint": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/checkpoints/sam/sam_vit_b_01ec64.pth",
|
| 139 |
+
"sam_model_type": "vit_b",
|
| 140 |
+
"sam_device": "auto",
|
| 141 |
+
"sam_working_size": [
|
| 142 |
+
640,
|
| 143 |
+
640
|
| 144 |
+
],
|
| 145 |
+
"sam_max_side": 640,
|
| 146 |
+
"sam_downscale": 0.625,
|
| 147 |
+
"prompt_box_xyxy": [
|
| 148 |
+
347.0,
|
| 149 |
+
335.0,
|
| 150 |
+
676.0,
|
| 151 |
+
688.0
|
| 152 |
+
],
|
| 153 |
+
"mask_score": 3.439631,
|
| 154 |
+
"mask_area_ratio": 0.059673,
|
| 155 |
+
"elapsed_seconds": 10.1365
|
| 156 |
+
}
|
| 157 |
+
}
|
| 158 |
+
],
|
| 159 |
+
"not_emitted": [],
|
| 160 |
+
"model_ids": {
|
| 161 |
+
"chat_model": "gcp/google/gemini-3.1-pro-preview",
|
| 162 |
+
"image_model": "gcp/google/gemini-3-pro-image-preview"
|
| 163 |
+
}
|
| 164 |
+
}
|
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/rows/sample_000003.json
ADDED
|
@@ -0,0 +1,164 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"sample_id": "sample_000003",
|
| 3 |
+
"target_total": 3,
|
| 4 |
+
"target_people": 1,
|
| 5 |
+
"target_objects": 2,
|
| 6 |
+
"canvas_size": [
|
| 7 |
+
1152,
|
| 8 |
+
864
|
| 9 |
+
],
|
| 10 |
+
"canvas_aspect_ratio": "4:3",
|
| 11 |
+
"main_image": "main_image.png",
|
| 12 |
+
"bbox_overlay": "bbox_overlay.png",
|
| 13 |
+
"plan": "plan.json",
|
| 14 |
+
"detections": "detections.json",
|
| 15 |
+
"vocab_task": "vocab_task.json",
|
| 16 |
+
"n_planned": 3,
|
| 17 |
+
"n_detected": 3,
|
| 18 |
+
"n_subjects": 3,
|
| 19 |
+
"subjects": [
|
| 20 |
+
{
|
| 21 |
+
"name": "person_in_red_light",
|
| 22 |
+
"is_person": true,
|
| 23 |
+
"subject_type": "person",
|
| 24 |
+
"source_set": "people_set",
|
| 25 |
+
"source_image_id": "Ego4D:ego4d_video/EGO_135381.npy:person:0",
|
| 26 |
+
"source_name": "person",
|
| 27 |
+
"source_description": "Visible hands and arms of a person in a dark setting, illuminated by red light, interacting with objects. Source dataset: Ego4D. Scene context: A close-up view of a person's hands and arms interacting with objects in a dark setting, illuminated by red and white light.",
|
| 28 |
+
"sub_caption": "person: Visible hands and lower arms, dramatically illuminated by a deep red light, emerging from the dark surroundings.. Scene role: Interacting with the open book, fingers lightly resting on the visible pages.",
|
| 29 |
+
"measured_bbox": [
|
| 30 |
+
0.0,
|
| 31 |
+
0.0,
|
| 32 |
+
0.5655,
|
| 33 |
+
1.0
|
| 34 |
+
],
|
| 35 |
+
"detection_confidence": 0.9,
|
| 36 |
+
"ref_style": "white_bg_full_body_front",
|
| 37 |
+
"ref_image": "references/ref_person_in_red_light.png",
|
| 38 |
+
"raw_ref_image": "references/raw_ref_person_in_red_light_attempt_01.png",
|
| 39 |
+
"reference_verify": "references/reference_verify_person_in_red_light.json",
|
| 40 |
+
"reference_verify_passed": true,
|
| 41 |
+
"reference_attempts": 1,
|
| 42 |
+
"sam_white_bg": {
|
| 43 |
+
"input": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/chaos/samples/sample_000003/references/raw_ref_person_in_red_light_attempt_01.png",
|
| 44 |
+
"output": "references/ref_person_in_red_light.png",
|
| 45 |
+
"mask": "references/sam_mask_person_in_red_light.png",
|
| 46 |
+
"sam_checkpoint": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/checkpoints/sam/sam_vit_b_01ec64.pth",
|
| 47 |
+
"sam_model_type": "vit_b",
|
| 48 |
+
"sam_device": "auto",
|
| 49 |
+
"sam_working_size": [
|
| 50 |
+
640,
|
| 51 |
+
640
|
| 52 |
+
],
|
| 53 |
+
"sam_max_side": 640,
|
| 54 |
+
"sam_downscale": 0.625,
|
| 55 |
+
"prompt_box_xyxy": [
|
| 56 |
+
351.0,
|
| 57 |
+
54.0,
|
| 58 |
+
667.0,
|
| 59 |
+
1015.0
|
| 60 |
+
],
|
| 61 |
+
"mask_score": 3.471897,
|
| 62 |
+
"mask_area_ratio": 0.134706,
|
| 63 |
+
"elapsed_seconds": 8.8737
|
| 64 |
+
}
|
| 65 |
+
},
|
| 66 |
+
{
|
| 67 |
+
"name": "red_illuminated_book",
|
| 68 |
+
"is_person": false,
|
| 69 |
+
"subject_type": "object",
|
| 70 |
+
"source_set": "obj_set",
|
| 71 |
+
"source_image_id": "Ego4D:ego4d_video/EGO_236888.npy:object:0",
|
| 72 |
+
"source_name": "book",
|
| 73 |
+
"source_description": "An open book with pages visible, illuminated in a red hue, showing text and some graphical elements. Source dataset: Ego4D. Scene context: A dimly lit scene showing an open book, illuminated by a red light, being held or resting in the darkness.",
|
| 74 |
+
"sub_caption": "book: A large, open book with visible pages and faint layout elements, cast in a striking red hue from an overhead light source.. Scene role: Lying open flat on the surface directly beneath the person's hands.",
|
| 75 |
+
"measured_bbox": [
|
| 76 |
+
0.2245,
|
| 77 |
+
0.3971,
|
| 78 |
+
0.6708,
|
| 79 |
+
0.6724
|
| 80 |
+
],
|
| 81 |
+
"detection_confidence": 0.98,
|
| 82 |
+
"ref_style": "white_bg_encyclopedia_photo",
|
| 83 |
+
"ref_image": "references/ref_red_illuminated_book.png",
|
| 84 |
+
"raw_ref_image": "references/raw_ref_red_illuminated_book_attempt_01.png",
|
| 85 |
+
"reference_verify": "references/reference_verify_red_illuminated_book.json",
|
| 86 |
+
"reference_verify_passed": true,
|
| 87 |
+
"reference_attempts": 1,
|
| 88 |
+
"sam_white_bg": {
|
| 89 |
+
"input": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/chaos/samples/sample_000003/references/raw_ref_red_illuminated_book_attempt_01.png",
|
| 90 |
+
"output": "references/ref_red_illuminated_book.png",
|
| 91 |
+
"mask": "references/sam_mask_red_illuminated_book.png",
|
| 92 |
+
"sam_checkpoint": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/checkpoints/sam/sam_vit_b_01ec64.pth",
|
| 93 |
+
"sam_model_type": "vit_b",
|
| 94 |
+
"sam_device": "auto",
|
| 95 |
+
"sam_working_size": [
|
| 96 |
+
640,
|
| 97 |
+
640
|
| 98 |
+
],
|
| 99 |
+
"sam_max_side": 640,
|
| 100 |
+
"sam_downscale": 0.625,
|
| 101 |
+
"prompt_box_xyxy": [
|
| 102 |
+
22.0,
|
| 103 |
+
180.0,
|
| 104 |
+
1002.0,
|
| 105 |
+
858.0
|
| 106 |
+
],
|
| 107 |
+
"mask_score": 3.463648,
|
| 108 |
+
"mask_area_ratio": 0.502075,
|
| 109 |
+
"elapsed_seconds": 7.3171
|
| 110 |
+
}
|
| 111 |
+
},
|
| 112 |
+
{
|
| 113 |
+
"name": "shadowy_doorway",
|
| 114 |
+
"is_person": false,
|
| 115 |
+
"subject_type": "object",
|
| 116 |
+
"source_set": "obj_set",
|
| 117 |
+
"source_image_id": "Ego4D:ego4d_video/EGO_311165.npy:object:2",
|
| 118 |
+
"source_name": "doorway or opening",
|
| 119 |
+
"source_description": "A darker, arched or rectangular shape on the wall, suggesting an opening to another area. Source dataset: Ego4D. Scene context: A very dark, low-resolution scene indoors, mostly obscured by shadow with some faint brownish light indicating walls or structures.",
|
| 120 |
+
"sub_caption": "doorway or opening: A dark, arched doorway outline set into a shadowy, indistinct wall, suggesting a passage to another dark room.. Scene role: Positioned in the out-of-focus background to establish architectural depth behind the main illuminated desk area.",
|
| 121 |
+
"measured_bbox": [
|
| 122 |
+
0.5153,
|
| 123 |
+
0.0267,
|
| 124 |
+
0.8188,
|
| 125 |
+
0.8345
|
| 126 |
+
],
|
| 127 |
+
"detection_confidence": 0.9,
|
| 128 |
+
"ref_style": "white_bg_encyclopedia_photo",
|
| 129 |
+
"ref_image": "references/ref_shadowy_doorway.png",
|
| 130 |
+
"raw_ref_image": "references/raw_ref_shadowy_doorway_attempt_01.png",
|
| 131 |
+
"reference_verify": "references/reference_verify_shadowy_doorway.json",
|
| 132 |
+
"reference_verify_passed": true,
|
| 133 |
+
"reference_attempts": 1,
|
| 134 |
+
"sam_white_bg": {
|
| 135 |
+
"input": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/chaos/samples/sample_000003/references/raw_ref_shadowy_doorway_attempt_01.png",
|
| 136 |
+
"output": "references/ref_shadowy_doorway.png",
|
| 137 |
+
"mask": "references/sam_mask_shadowy_doorway.png",
|
| 138 |
+
"sam_checkpoint": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/checkpoints/sam/sam_vit_b_01ec64.pth",
|
| 139 |
+
"sam_model_type": "vit_b",
|
| 140 |
+
"sam_device": "auto",
|
| 141 |
+
"sam_working_size": [
|
| 142 |
+
640,
|
| 143 |
+
640
|
| 144 |
+
],
|
| 145 |
+
"sam_max_side": 640,
|
| 146 |
+
"sam_downscale": 0.625,
|
| 147 |
+
"prompt_box_xyxy": [
|
| 148 |
+
141.0,
|
| 149 |
+
11.0,
|
| 150 |
+
899.0,
|
| 151 |
+
969.0
|
| 152 |
+
],
|
| 153 |
+
"mask_score": 3.471354,
|
| 154 |
+
"mask_area_ratio": 0.542183,
|
| 155 |
+
"elapsed_seconds": 7.2941
|
| 156 |
+
}
|
| 157 |
+
}
|
| 158 |
+
],
|
| 159 |
+
"not_emitted": [],
|
| 160 |
+
"model_ids": {
|
| 161 |
+
"chat_model": "gcp/google/gemini-3.1-pro-preview",
|
| 162 |
+
"image_model": "gcp/google/gemini-3-pro-image-preview"
|
| 163 |
+
}
|
| 164 |
+
}
|
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/rows/sample_000004.json
ADDED
|
@@ -0,0 +1,173 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"sample_id": "sample_000004",
|
| 3 |
+
"target_total": 5,
|
| 4 |
+
"target_people": 1,
|
| 5 |
+
"target_objects": 4,
|
| 6 |
+
"canvas_size": [
|
| 7 |
+
864,
|
| 8 |
+
1152
|
| 9 |
+
],
|
| 10 |
+
"canvas_aspect_ratio": "3:4",
|
| 11 |
+
"main_image": "main_image.png",
|
| 12 |
+
"bbox_overlay": "bbox_overlay.png",
|
| 13 |
+
"plan": "plan.json",
|
| 14 |
+
"detections": "detections.json",
|
| 15 |
+
"vocab_task": "vocab_task.json",
|
| 16 |
+
"n_planned": 5,
|
| 17 |
+
"n_detected": 5,
|
| 18 |
+
"n_subjects": 3,
|
| 19 |
+
"subjects": [
|
| 20 |
+
{
|
| 21 |
+
"name": "blue_light_source",
|
| 22 |
+
"is_person": false,
|
| 23 |
+
"subject_type": "object",
|
| 24 |
+
"source_set": "obj_set",
|
| 25 |
+
"source_image_id": "Ego4D:ego4d_video/EGO_98001.npy:object:0",
|
| 26 |
+
"source_name": "blue light source",
|
| 27 |
+
"source_description": "A small, blurry blue light, appearing as a faint glow against the dark background. Source dataset: Ego4D. Scene context: A predominantly dark scene with a single, small, indistinct blue light source visible towards the right side.",
|
| 28 |
+
"sub_caption": "blue light source: A small, blurry blue light emitting a faint, cool glow against the darkness.. Scene role: Positioned in the deep background to the left, providing an atmospheric back-light and contrasting with the red lighting.",
|
| 29 |
+
"measured_bbox": [
|
| 30 |
+
0.5155,
|
| 31 |
+
0.3724,
|
| 32 |
+
0.553,
|
| 33 |
+
0.4239
|
| 34 |
+
],
|
| 35 |
+
"detection_confidence": "high",
|
| 36 |
+
"ref_style": "white_bg_encyclopedia_photo",
|
| 37 |
+
"ref_image": "references/ref_blue_light_source.png",
|
| 38 |
+
"raw_ref_image": "references/raw_ref_blue_light_source_attempt_01.png",
|
| 39 |
+
"reference_verify": "references/reference_verify_blue_light_source.json",
|
| 40 |
+
"reference_verify_passed": true,
|
| 41 |
+
"reference_attempts": 1,
|
| 42 |
+
"sam_white_bg": {
|
| 43 |
+
"input": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/chaos/samples/sample_000004/references/raw_ref_blue_light_source_attempt_01.png",
|
| 44 |
+
"output": "references/ref_blue_light_source.png",
|
| 45 |
+
"mask": "references/sam_mask_blue_light_source.png",
|
| 46 |
+
"sam_checkpoint": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/checkpoints/sam/sam_vit_b_01ec64.pth",
|
| 47 |
+
"sam_model_type": "vit_b",
|
| 48 |
+
"sam_device": "auto",
|
| 49 |
+
"sam_working_size": [
|
| 50 |
+
640,
|
| 51 |
+
640
|
| 52 |
+
],
|
| 53 |
+
"sam_max_side": 640,
|
| 54 |
+
"sam_downscale": 0.625,
|
| 55 |
+
"prompt_box_xyxy": [
|
| 56 |
+
132.0,
|
| 57 |
+
159.0,
|
| 58 |
+
891.0,
|
| 59 |
+
864.0
|
| 60 |
+
],
|
| 61 |
+
"mask_score": 3.485053,
|
| 62 |
+
"mask_area_ratio": 0.292151,
|
| 63 |
+
"elapsed_seconds": 9.6106
|
| 64 |
+
}
|
| 65 |
+
},
|
| 66 |
+
{
|
| 67 |
+
"name": "paint_roller",
|
| 68 |
+
"is_person": false,
|
| 69 |
+
"subject_type": "object",
|
| 70 |
+
"source_set": "obj_set",
|
| 71 |
+
"source_image_id": "Ego4D:ego4d_video/EGO_95307.npy:object:0",
|
| 72 |
+
"source_name": "paint roller",
|
| 73 |
+
"source_description": "A standard paint roller with a dark cylindrical cover and a metal frame connecting to a handle. Source dataset: Ego4D. Scene context: A close-up view of a paint roller against a light-colored wall in a dimly lit setting.",
|
| 74 |
+
"sub_caption": "paint roller: A standard paint roller with a dark cylindrical cover, attached to a metal frame and handle.. Scene role: Resting on a nearby surface in the foreground, catching subtle highlights from the red light.",
|
| 75 |
+
"measured_bbox": [
|
| 76 |
+
0.2917,
|
| 77 |
+
0.532,
|
| 78 |
+
0.4405,
|
| 79 |
+
0.7522
|
| 80 |
+
],
|
| 81 |
+
"detection_confidence": 0.99,
|
| 82 |
+
"ref_style": "white_bg_encyclopedia_photo",
|
| 83 |
+
"ref_image": "references/ref_paint_roller.png",
|
| 84 |
+
"raw_ref_image": "references/raw_ref_paint_roller_attempt_01.png",
|
| 85 |
+
"reference_verify": "references/reference_verify_paint_roller.json",
|
| 86 |
+
"reference_verify_passed": true,
|
| 87 |
+
"reference_attempts": 1,
|
| 88 |
+
"sam_white_bg": {
|
| 89 |
+
"input": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/chaos/samples/sample_000004/references/raw_ref_paint_roller_attempt_01.png",
|
| 90 |
+
"output": "references/ref_paint_roller.png",
|
| 91 |
+
"mask": "references/sam_mask_paint_roller.png",
|
| 92 |
+
"sam_checkpoint": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/checkpoints/sam/sam_vit_b_01ec64.pth",
|
| 93 |
+
"sam_model_type": "vit_b",
|
| 94 |
+
"sam_device": "auto",
|
| 95 |
+
"sam_working_size": [
|
| 96 |
+
640,
|
| 97 |
+
640
|
| 98 |
+
],
|
| 99 |
+
"sam_max_side": 640,
|
| 100 |
+
"sam_downscale": 0.625,
|
| 101 |
+
"prompt_box_xyxy": [
|
| 102 |
+
136.0,
|
| 103 |
+
75.0,
|
| 104 |
+
866.0,
|
| 105 |
+
950.0
|
| 106 |
+
],
|
| 107 |
+
"mask_score": 3.459168,
|
| 108 |
+
"mask_area_ratio": 0.116944,
|
| 109 |
+
"elapsed_seconds": 7.1624
|
| 110 |
+
}
|
| 111 |
+
},
|
| 112 |
+
{
|
| 113 |
+
"name": "draped_tarp",
|
| 114 |
+
"is_person": false,
|
| 115 |
+
"subject_type": "object",
|
| 116 |
+
"source_set": "obj_set",
|
| 117 |
+
"source_image_id": "Ego4D:ego4d_video/EGO_37499.npy:object:1",
|
| 118 |
+
"source_name": "light-colored material",
|
| 119 |
+
"source_description": "A draped, light-colored or beige material, possibly part of a tent or covering, visible on the right side. Source dataset: Ego4D. Scene context: The scene is a dark, possibly outdoor or dimly lit setting, showing what appears to be a structure or object covered with a large piece of material or tarp.",
|
| 120 |
+
"sub_caption": "light-colored material: A draped, light-colored tarp or drop cloth covering large, indistinct shapes.. Scene role: Draped over items on the right side of the room, adding textural detail and reflecting the mixed ambient lighting.",
|
| 121 |
+
"measured_bbox": [
|
| 122 |
+
0.392,
|
| 123 |
+
0.4207,
|
| 124 |
+
0.8243,
|
| 125 |
+
0.8862
|
| 126 |
+
],
|
| 127 |
+
"detection_confidence": 0.98,
|
| 128 |
+
"ref_style": "white_bg_encyclopedia_photo",
|
| 129 |
+
"ref_image": "references/ref_draped_tarp.png",
|
| 130 |
+
"raw_ref_image": "references/raw_ref_draped_tarp_attempt_01.png",
|
| 131 |
+
"reference_verify": "references/reference_verify_draped_tarp.json",
|
| 132 |
+
"reference_verify_passed": true,
|
| 133 |
+
"reference_attempts": 1,
|
| 134 |
+
"sam_white_bg": {
|
| 135 |
+
"input": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/chaos/samples/sample_000004/references/raw_ref_draped_tarp_attempt_01.png",
|
| 136 |
+
"output": "references/ref_draped_tarp.png",
|
| 137 |
+
"mask": "references/sam_mask_draped_tarp.png",
|
| 138 |
+
"sam_checkpoint": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/checkpoints/sam/sam_vit_b_01ec64.pth",
|
| 139 |
+
"sam_model_type": "vit_b",
|
| 140 |
+
"sam_device": "auto",
|
| 141 |
+
"sam_working_size": [
|
| 142 |
+
640,
|
| 143 |
+
640
|
| 144 |
+
],
|
| 145 |
+
"sam_max_side": 640,
|
| 146 |
+
"sam_downscale": 0.625,
|
| 147 |
+
"prompt_box_xyxy": [
|
| 148 |
+
0.0,
|
| 149 |
+
189.0,
|
| 150 |
+
1023.0,
|
| 151 |
+
888.0
|
| 152 |
+
],
|
| 153 |
+
"mask_score": 3.482188,
|
| 154 |
+
"mask_area_ratio": 0.485075,
|
| 155 |
+
"elapsed_seconds": 7.4131
|
| 156 |
+
}
|
| 157 |
+
}
|
| 158 |
+
],
|
| 159 |
+
"not_emitted": [
|
| 160 |
+
{
|
| 161 |
+
"name": "worker_in_cap",
|
| 162 |
+
"reason": "not_detected"
|
| 163 |
+
},
|
| 164 |
+
{
|
| 165 |
+
"name": "stacked_boxes",
|
| 166 |
+
"reason": "not_detected"
|
| 167 |
+
}
|
| 168 |
+
],
|
| 169 |
+
"model_ids": {
|
| 170 |
+
"chat_model": "gcp/google/gemini-3.1-pro-preview",
|
| 171 |
+
"image_model": "gcp/google/gemini-3-pro-image-preview"
|
| 172 |
+
}
|
| 173 |
+
}
|
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/rows/sample_000005.json
ADDED
|
@@ -0,0 +1,302 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"sample_id": "sample_000005",
|
| 3 |
+
"target_total": 6,
|
| 4 |
+
"target_people": 3,
|
| 5 |
+
"target_objects": 3,
|
| 6 |
+
"canvas_size": [
|
| 7 |
+
1152,
|
| 8 |
+
864
|
| 9 |
+
],
|
| 10 |
+
"canvas_aspect_ratio": "4:3",
|
| 11 |
+
"main_image": "main_image.png",
|
| 12 |
+
"bbox_overlay": "bbox_overlay.png",
|
| 13 |
+
"plan": "plan.json",
|
| 14 |
+
"detections": "detections.json",
|
| 15 |
+
"vocab_task": "vocab_task.json",
|
| 16 |
+
"n_planned": 6,
|
| 17 |
+
"n_detected": 6,
|
| 18 |
+
"n_subjects": 6,
|
| 19 |
+
"subjects": [
|
| 20 |
+
{
|
| 21 |
+
"name": "pizza_prep_hands",
|
| 22 |
+
"is_person": true,
|
| 23 |
+
"subject_type": "person",
|
| 24 |
+
"source_set": "people_set",
|
| 25 |
+
"source_image_id": "EPIC-Kitchens:P11_106:person:0",
|
| 26 |
+
"source_name": "person",
|
| 27 |
+
"source_description": "The person's hands and lower arms are visible at the bottom of the frame, appearing to be in the middle of preparing food. Source dataset: EPIC-Kitchens. Scene context: A top-down view of a wooden kitchen table where two pizzas are being prepared with various ingredients like red onions, mushrooms, and tomatoes.",
|
| 28 |
+
"sub_caption": "person: Hands and lower arms visible, preparing a pizza on a wooden surface.. Scene role: In the foreground, actively making a pizza.",
|
| 29 |
+
"measured_bbox": [
|
| 30 |
+
0.532,
|
| 31 |
+
0.2245,
|
| 32 |
+
1.0,
|
| 33 |
+
0.7871
|
| 34 |
+
],
|
| 35 |
+
"detection_confidence": 0.9,
|
| 36 |
+
"ref_style": "white_bg_full_body_front",
|
| 37 |
+
"ref_image": "references/ref_pizza_prep_hands.png",
|
| 38 |
+
"raw_ref_image": "references/raw_ref_pizza_prep_hands_attempt_02.png",
|
| 39 |
+
"reference_verify": "references/reference_verify_pizza_prep_hands.json",
|
| 40 |
+
"reference_verify_passed": true,
|
| 41 |
+
"reference_attempts": 2,
|
| 42 |
+
"sam_white_bg": {
|
| 43 |
+
"input": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/chaos/samples/sample_000005/references/raw_ref_pizza_prep_hands_attempt_02.png",
|
| 44 |
+
"output": "references/ref_pizza_prep_hands.png",
|
| 45 |
+
"mask": "references/sam_mask_pizza_prep_hands.png",
|
| 46 |
+
"sam_checkpoint": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/checkpoints/sam/sam_vit_b_01ec64.pth",
|
| 47 |
+
"sam_model_type": "vit_b",
|
| 48 |
+
"sam_device": "auto",
|
| 49 |
+
"sam_working_size": [
|
| 50 |
+
640,
|
| 51 |
+
640
|
| 52 |
+
],
|
| 53 |
+
"sam_max_side": 640,
|
| 54 |
+
"sam_downscale": 0.625,
|
| 55 |
+
"prompt_box_xyxy": [
|
| 56 |
+
349.0,
|
| 57 |
+
14.0,
|
| 58 |
+
677.0,
|
| 59 |
+
1016.0
|
| 60 |
+
],
|
| 61 |
+
"mask_score": 3.451951,
|
| 62 |
+
"mask_area_ratio": 0.150558,
|
| 63 |
+
"elapsed_seconds": 10.2196
|
| 64 |
+
}
|
| 65 |
+
},
|
| 66 |
+
{
|
| 67 |
+
"name": "person_in_jacket",
|
| 68 |
+
"is_person": true,
|
| 69 |
+
"subject_type": "person",
|
| 70 |
+
"source_set": "people_set",
|
| 71 |
+
"source_image_id": "Ego4D:ego4d_video/EGO_22577.npy:person:0",
|
| 72 |
+
"source_name": "person",
|
| 73 |
+
"source_description": "A person visible mostly from the back, wearing a dark jacket over a red shirt with yellow text that includes the words 'STANLEY CUP'. The person has dark hair. Source dataset: Ego4D. Scene context: A close-up view of a person wearing a red shirt with yellow text, seemingly engaged in an activity in a dimly lit indoor setting.",
|
| 74 |
+
"sub_caption": "person: Person seen mostly from the back, dark hair, wearing a dark jacket over a red shirt with yellow abstract patterns.. Scene role: Standing in the midground, facing away toward the kitchen cabinets.",
|
| 75 |
+
"measured_bbox": [
|
| 76 |
+
0.0,
|
| 77 |
+
0.0,
|
| 78 |
+
0.361,
|
| 79 |
+
0.675
|
| 80 |
+
],
|
| 81 |
+
"detection_confidence": 1.0,
|
| 82 |
+
"ref_style": "white_bg_full_body_front",
|
| 83 |
+
"ref_image": "references/ref_person_in_jacket.png",
|
| 84 |
+
"raw_ref_image": "references/raw_ref_person_in_jacket_attempt_02.png",
|
| 85 |
+
"reference_verify": "references/reference_verify_person_in_jacket.json",
|
| 86 |
+
"reference_verify_passed": true,
|
| 87 |
+
"reference_attempts": 2,
|
| 88 |
+
"sam_white_bg": {
|
| 89 |
+
"input": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/chaos/samples/sample_000005/references/raw_ref_person_in_jacket_attempt_02.png",
|
| 90 |
+
"output": "references/ref_person_in_jacket.png",
|
| 91 |
+
"mask": "references/sam_mask_person_in_jacket.png",
|
| 92 |
+
"sam_checkpoint": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/checkpoints/sam/sam_vit_b_01ec64.pth",
|
| 93 |
+
"sam_model_type": "vit_b",
|
| 94 |
+
"sam_device": "auto",
|
| 95 |
+
"sam_working_size": [
|
| 96 |
+
640,
|
| 97 |
+
640
|
| 98 |
+
],
|
| 99 |
+
"sam_max_side": 640,
|
| 100 |
+
"sam_downscale": 0.625,
|
| 101 |
+
"prompt_box_xyxy": [
|
| 102 |
+
334.0,
|
| 103 |
+
15.0,
|
| 104 |
+
684.0,
|
| 105 |
+
1023.0
|
| 106 |
+
],
|
| 107 |
+
"mask_score": 3.414528,
|
| 108 |
+
"mask_area_ratio": 0.160464,
|
| 109 |
+
"elapsed_seconds": 10.2925
|
| 110 |
+
}
|
| 111 |
+
},
|
| 112 |
+
{
|
| 113 |
+
"name": "person_with_pan",
|
| 114 |
+
"is_person": true,
|
| 115 |
+
"subject_type": "person",
|
| 116 |
+
"source_set": "people_set",
|
| 117 |
+
"source_image_id": "Ego4D:ego4d_video/EGO_192493.npy:person:0",
|
| 118 |
+
"source_name": "person",
|
| 119 |
+
"source_description": "A person standing in the room, seen from the torso down, holding a dark round object. Source dataset: Ego4D. Scene context: A person stands in a dimly lit room holding a round object near a blue wall.",
|
| 120 |
+
"sub_caption": "person: Person seen from the torso down, holding a dark round object.. Scene role: Standing in the background near a blue wall.",
|
| 121 |
+
"measured_bbox": [
|
| 122 |
+
0.1195,
|
| 123 |
+
0.0021,
|
| 124 |
+
0.4483,
|
| 125 |
+
0.6302
|
| 126 |
+
],
|
| 127 |
+
"detection_confidence": 0.95,
|
| 128 |
+
"ref_style": "white_bg_full_body_front",
|
| 129 |
+
"ref_image": "references/ref_person_with_pan.png",
|
| 130 |
+
"raw_ref_image": "references/raw_ref_person_with_pan_attempt_02.png",
|
| 131 |
+
"reference_verify": "references/reference_verify_person_with_pan.json",
|
| 132 |
+
"reference_verify_passed": true,
|
| 133 |
+
"reference_attempts": 2,
|
| 134 |
+
"sam_white_bg": {
|
| 135 |
+
"input": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/chaos/samples/sample_000005/references/raw_ref_person_with_pan_attempt_02.png",
|
| 136 |
+
"output": "references/ref_person_with_pan.png",
|
| 137 |
+
"mask": "references/sam_mask_person_with_pan.png",
|
| 138 |
+
"sam_checkpoint": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/checkpoints/sam/sam_vit_b_01ec64.pth",
|
| 139 |
+
"sam_model_type": "vit_b",
|
| 140 |
+
"sam_device": "auto",
|
| 141 |
+
"sam_working_size": [
|
| 142 |
+
640,
|
| 143 |
+
640
|
| 144 |
+
],
|
| 145 |
+
"sam_max_side": 640,
|
| 146 |
+
"sam_downscale": 0.625,
|
| 147 |
+
"prompt_box_xyxy": [
|
| 148 |
+
334.0,
|
| 149 |
+
18.0,
|
| 150 |
+
690.0,
|
| 151 |
+
1023.0
|
| 152 |
+
],
|
| 153 |
+
"mask_score": 3.408831,
|
| 154 |
+
"mask_area_ratio": 0.163625,
|
| 155 |
+
"elapsed_seconds": 10.3028
|
| 156 |
+
}
|
| 157 |
+
},
|
| 158 |
+
{
|
| 159 |
+
"name": "salt_box",
|
| 160 |
+
"is_person": false,
|
| 161 |
+
"subject_type": "object",
|
| 162 |
+
"source_set": "obj_set",
|
| 163 |
+
"source_image_id": "EPIC-Kitchens:P35_102:object:1",
|
| 164 |
+
"source_name": "box of salt",
|
| 165 |
+
"source_description": "A small cardboard box with blue and black text, sitting on the counter near the stove. Source dataset: EPIC-Kitchens. Scene context: A kitchen counter area with a sink containing dirty dishes, a frying pan on a drying rack, and various cooking utensils.",
|
| 166 |
+
"sub_caption": "box of salt: A small cardboard box with blue and black graphical patterns, resembling a salt container.. Scene role: Resting on the wooden counter next to the pizza prep area.",
|
| 167 |
+
"measured_bbox": [
|
| 168 |
+
0.5558,
|
| 169 |
+
0.4006,
|
| 170 |
+
0.6966,
|
| 171 |
+
0.4937
|
| 172 |
+
],
|
| 173 |
+
"detection_confidence": 0.5,
|
| 174 |
+
"ref_style": "white_bg_encyclopedia_photo",
|
| 175 |
+
"ref_image": "references/ref_salt_box.png",
|
| 176 |
+
"raw_ref_image": "references/raw_ref_salt_box_attempt_01.png",
|
| 177 |
+
"reference_verify": "references/reference_verify_salt_box.json",
|
| 178 |
+
"reference_verify_passed": true,
|
| 179 |
+
"reference_attempts": 1,
|
| 180 |
+
"sam_white_bg": {
|
| 181 |
+
"input": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/chaos/samples/sample_000005/references/raw_ref_salt_box_attempt_01.png",
|
| 182 |
+
"output": "references/ref_salt_box.png",
|
| 183 |
+
"mask": "references/sam_mask_salt_box.png",
|
| 184 |
+
"sam_checkpoint": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/checkpoints/sam/sam_vit_b_01ec64.pth",
|
| 185 |
+
"sam_model_type": "vit_b",
|
| 186 |
+
"sam_device": "auto",
|
| 187 |
+
"sam_working_size": [
|
| 188 |
+
640,
|
| 189 |
+
640
|
| 190 |
+
],
|
| 191 |
+
"sam_max_side": 640,
|
| 192 |
+
"sam_downscale": 0.625,
|
| 193 |
+
"prompt_box_xyxy": [
|
| 194 |
+
73.0,
|
| 195 |
+
268.0,
|
| 196 |
+
952.0,
|
| 197 |
+
762.0
|
| 198 |
+
],
|
| 199 |
+
"mask_score": 3.471932,
|
| 200 |
+
"mask_area_ratio": 0.353847,
|
| 201 |
+
"elapsed_seconds": 10.266
|
| 202 |
+
}
|
| 203 |
+
},
|
| 204 |
+
{
|
| 205 |
+
"name": "cutlery_set",
|
| 206 |
+
"is_person": false,
|
| 207 |
+
"subject_type": "object",
|
| 208 |
+
"source_set": "obj_set",
|
| 209 |
+
"source_image_id": "EPIC-Kitchens:P26_103:object:4",
|
| 210 |
+
"source_name": "cutlery",
|
| 211 |
+
"source_description": "A silver fork and a knife resting on the yellow plate inside the right sink bowl. Source dataset: EPIC-Kitchens. Scene context: A first-person view of a stainless steel kitchen sink containing dirty dishes and a blue cloth, with a hand visible in the foreground.",
|
| 212 |
+
"sub_caption": "cutlery: A silver fork and a knife resting on a yellow plate.. Scene role: Placed on the counter in the foreground left.",
|
| 213 |
+
"measured_bbox": [
|
| 214 |
+
0.1913,
|
| 215 |
+
0.8329,
|
| 216 |
+
0.6116,
|
| 217 |
+
0.9636
|
| 218 |
+
],
|
| 219 |
+
"detection_confidence": "high",
|
| 220 |
+
"ref_style": "white_bg_encyclopedia_photo",
|
| 221 |
+
"ref_image": "references/ref_cutlery_set.png",
|
| 222 |
+
"raw_ref_image": "references/raw_ref_cutlery_set_attempt_02.png",
|
| 223 |
+
"reference_verify": "references/reference_verify_cutlery_set.json",
|
| 224 |
+
"reference_verify_passed": true,
|
| 225 |
+
"reference_attempts": 2,
|
| 226 |
+
"sam_white_bg": {
|
| 227 |
+
"input": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/chaos/samples/sample_000005/references/raw_ref_cutlery_set_attempt_02.png",
|
| 228 |
+
"output": "references/ref_cutlery_set.png",
|
| 229 |
+
"mask": "references/sam_mask_cutlery_set.png",
|
| 230 |
+
"sam_checkpoint": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/checkpoints/sam/sam_vit_b_01ec64.pth",
|
| 231 |
+
"sam_model_type": "vit_b",
|
| 232 |
+
"sam_device": "auto",
|
| 233 |
+
"sam_working_size": [
|
| 234 |
+
640,
|
| 235 |
+
640
|
| 236 |
+
],
|
| 237 |
+
"sam_max_side": 640,
|
| 238 |
+
"sam_downscale": 0.625,
|
| 239 |
+
"prompt_box_xyxy": [
|
| 240 |
+
28.0,
|
| 241 |
+
122.0,
|
| 242 |
+
1013.0,
|
| 243 |
+
887.0
|
| 244 |
+
],
|
| 245 |
+
"mask_score": 3.237995,
|
| 246 |
+
"mask_area_ratio": 0.452152,
|
| 247 |
+
"elapsed_seconds": 10.821
|
| 248 |
+
}
|
| 249 |
+
},
|
| 250 |
+
{
|
| 251 |
+
"name": "wall_cabinet",
|
| 252 |
+
"is_person": false,
|
| 253 |
+
"subject_type": "object",
|
| 254 |
+
"source_set": "obj_set",
|
| 255 |
+
"source_image_id": "EPIC-Kitchens:P26_121:object:12",
|
| 256 |
+
"source_name": "cabinet",
|
| 257 |
+
"source_description": "A wooden cabinet positioned above the counter on the right side. Source dataset: EPIC-Kitchens. Scene context: A kitchen counter top with a stove, a pan, a bowl of yellow liquid, a wooden cutting board, a plate of food, a water bottle, a large water jug, and a small metal lid.",
|
| 258 |
+
"sub_caption": "cabinet: A wooden cabinet positioned above a kitchen counter.. Scene role: Mounted on the wall in the midground, directly above the counter.",
|
| 259 |
+
"measured_bbox": [
|
| 260 |
+
0.5897,
|
| 261 |
+
0.0017,
|
| 262 |
+
0.9469,
|
| 263 |
+
0.1735
|
| 264 |
+
],
|
| 265 |
+
"detection_confidence": 0.99,
|
| 266 |
+
"ref_style": "white_bg_encyclopedia_photo",
|
| 267 |
+
"ref_image": "references/ref_wall_cabinet.png",
|
| 268 |
+
"raw_ref_image": "references/raw_ref_wall_cabinet_attempt_01.png",
|
| 269 |
+
"reference_verify": "references/reference_verify_wall_cabinet.json",
|
| 270 |
+
"reference_verify_passed": true,
|
| 271 |
+
"reference_attempts": 1,
|
| 272 |
+
"sam_white_bg": {
|
| 273 |
+
"input": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/chaos/samples/sample_000005/references/raw_ref_wall_cabinet_attempt_01.png",
|
| 274 |
+
"output": "references/ref_wall_cabinet.png",
|
| 275 |
+
"mask": "references/sam_mask_wall_cabinet.png",
|
| 276 |
+
"sam_checkpoint": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/checkpoints/sam/sam_vit_b_01ec64.pth",
|
| 277 |
+
"sam_model_type": "vit_b",
|
| 278 |
+
"sam_device": "auto",
|
| 279 |
+
"sam_working_size": [
|
| 280 |
+
640,
|
| 281 |
+
640
|
| 282 |
+
],
|
| 283 |
+
"sam_max_side": 640,
|
| 284 |
+
"sam_downscale": 0.625,
|
| 285 |
+
"prompt_box_xyxy": [
|
| 286 |
+
15.0,
|
| 287 |
+
31.0,
|
| 288 |
+
1008.0,
|
| 289 |
+
1013.0
|
| 290 |
+
],
|
| 291 |
+
"mask_score": 3.398914,
|
| 292 |
+
"mask_area_ratio": 0.735002,
|
| 293 |
+
"elapsed_seconds": 10.923
|
| 294 |
+
}
|
| 295 |
+
}
|
| 296 |
+
],
|
| 297 |
+
"not_emitted": [],
|
| 298 |
+
"model_ids": {
|
| 299 |
+
"chat_model": "gcp/google/gemini-3.1-pro-preview",
|
| 300 |
+
"image_model": "gcp/google/gemini-3-pro-image-preview"
|
| 301 |
+
}
|
| 302 |
+
}
|
samples_v8/chaos/EPIC-Kitchens_Ego4D_samples/rows/sample_000006.json
ADDED
|
@@ -0,0 +1,311 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"sample_id": "sample_000006",
|
| 3 |
+
"target_total": 8,
|
| 4 |
+
"target_people": 1,
|
| 5 |
+
"target_objects": 7,
|
| 6 |
+
"canvas_size": [
|
| 7 |
+
1152,
|
| 8 |
+
864
|
| 9 |
+
],
|
| 10 |
+
"canvas_aspect_ratio": "4:3",
|
| 11 |
+
"main_image": "main_image.png",
|
| 12 |
+
"bbox_overlay": "bbox_overlay.png",
|
| 13 |
+
"plan": "plan.json",
|
| 14 |
+
"detections": "detections.json",
|
| 15 |
+
"vocab_task": "vocab_task.json",
|
| 16 |
+
"n_planned": 8,
|
| 17 |
+
"n_detected": 8,
|
| 18 |
+
"n_subjects": 6,
|
| 19 |
+
"subjects": [
|
| 20 |
+
{
|
| 21 |
+
"name": "person_at_sink",
|
| 22 |
+
"is_person": true,
|
| 23 |
+
"subject_type": "person",
|
| 24 |
+
"source_set": "people_set",
|
| 25 |
+
"source_image_id": "EPIC-Kitchens:P26_103:person:0",
|
| 26 |
+
"source_name": "person",
|
| 27 |
+
"source_description": "A person's left hand and lower body, including dark trousers and black shoes with white soles, are visible in the foreground, reaching towards the sink. Source dataset: EPIC-Kitchens. Scene context: A first-person view of a stainless steel kitchen sink containing dirty dishes and a blue cloth, with a hand visible in the foreground.",
|
| 28 |
+
"sub_caption": "person: A person's left hand and lower body wearing dark trousers and black shoes with white soles.. Scene role: Standing in the foreground, reaching their left hand towards the kitchen faucet.",
|
| 29 |
+
"measured_bbox": [
|
| 30 |
+
0.0,
|
| 31 |
+
0.3583,
|
| 32 |
+
0.2441,
|
| 33 |
+
1.0
|
| 34 |
+
],
|
| 35 |
+
"detection_confidence": 0.95,
|
| 36 |
+
"ref_style": "white_bg_full_body_front",
|
| 37 |
+
"ref_image": "references/ref_person_at_sink.png",
|
| 38 |
+
"raw_ref_image": "references/raw_ref_person_at_sink_attempt_01.png",
|
| 39 |
+
"reference_verify": "references/reference_verify_person_at_sink.json",
|
| 40 |
+
"reference_verify_passed": true,
|
| 41 |
+
"reference_attempts": 1,
|
| 42 |
+
"sam_white_bg": {
|
| 43 |
+
"input": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/chaos/samples/sample_000006/references/raw_ref_person_at_sink_attempt_01.png",
|
| 44 |
+
"output": "references/ref_person_at_sink.png",
|
| 45 |
+
"mask": "references/sam_mask_person_at_sink.png",
|
| 46 |
+
"sam_checkpoint": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/checkpoints/sam/sam_vit_b_01ec64.pth",
|
| 47 |
+
"sam_model_type": "vit_b",
|
| 48 |
+
"sam_device": "auto",
|
| 49 |
+
"sam_working_size": [
|
| 50 |
+
640,
|
| 51 |
+
640
|
| 52 |
+
],
|
| 53 |
+
"sam_max_side": 640,
|
| 54 |
+
"sam_downscale": 0.625,
|
| 55 |
+
"prompt_box_xyxy": [
|
| 56 |
+
320.0,
|
| 57 |
+
24.0,
|
| 58 |
+
689.0,
|
| 59 |
+
1002.0
|
| 60 |
+
],
|
| 61 |
+
"mask_score": 3.450755,
|
| 62 |
+
"mask_area_ratio": 0.163542,
|
| 63 |
+
"elapsed_seconds": 31.0984
|
| 64 |
+
}
|
| 65 |
+
},
|
| 66 |
+
{
|
| 67 |
+
"name": "wooden_door",
|
| 68 |
+
"is_person": false,
|
| 69 |
+
"subject_type": "object",
|
| 70 |
+
"source_set": "obj_set",
|
| 71 |
+
"source_image_id": "EPIC-Kitchens:P12_104:object:0",
|
| 72 |
+
"source_name": "door",
|
| 73 |
+
"source_description": "A light brown wooden door, closed, with a metallic door handle. Source dataset: EPIC-Kitchens. Scene context: A close-up view of a closed wooden door with a metal handle, positioned in a room with a kitchen area visible to the left.",
|
| 74 |
+
"sub_caption": "door: A light brown wooden door, closed, with a metallic handle.. Scene role: Visible in the background on the kitchen wall.",
|
| 75 |
+
"measured_bbox": [
|
| 76 |
+
0.2139,
|
| 77 |
+
0.0,
|
| 78 |
+
0.3994,
|
| 79 |
+
0.412
|
| 80 |
+
],
|
| 81 |
+
"detection_confidence": 1.0,
|
| 82 |
+
"ref_style": "white_bg_encyclopedia_photo",
|
| 83 |
+
"ref_image": "references/ref_wooden_door.png",
|
| 84 |
+
"raw_ref_image": "references/raw_ref_wooden_door_attempt_01.png",
|
| 85 |
+
"reference_verify": "references/reference_verify_wooden_door.json",
|
| 86 |
+
"reference_verify_passed": true,
|
| 87 |
+
"reference_attempts": 1,
|
| 88 |
+
"sam_white_bg": {
|
| 89 |
+
"input": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/chaos/samples/sample_000006/references/raw_ref_wooden_door_attempt_01.png",
|
| 90 |
+
"output": "references/ref_wooden_door.png",
|
| 91 |
+
"mask": "references/sam_mask_wooden_door.png",
|
| 92 |
+
"sam_checkpoint": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/checkpoints/sam/sam_vit_b_01ec64.pth",
|
| 93 |
+
"sam_model_type": "vit_b",
|
| 94 |
+
"sam_device": "auto",
|
| 95 |
+
"sam_working_size": [
|
| 96 |
+
640,
|
| 97 |
+
640
|
| 98 |
+
],
|
| 99 |
+
"sam_max_side": 640,
|
| 100 |
+
"sam_downscale": 0.625,
|
| 101 |
+
"prompt_box_xyxy": [
|
| 102 |
+
256.0,
|
| 103 |
+
26.0,
|
| 104 |
+
767.0,
|
| 105 |
+
1015.0
|
| 106 |
+
],
|
| 107 |
+
"mask_score": 3.446321,
|
| 108 |
+
"mask_area_ratio": 0.388947,
|
| 109 |
+
"elapsed_seconds": 9.29
|
| 110 |
+
}
|
| 111 |
+
},
|
| 112 |
+
{
|
| 113 |
+
"name": "wrapped_cucumber",
|
| 114 |
+
"is_person": false,
|
| 115 |
+
"subject_type": "object",
|
| 116 |
+
"source_set": "obj_set",
|
| 117 |
+
"source_image_id": "EPIC-Kitchens:P37_101:object:1",
|
| 118 |
+
"source_name": "cucumber 2",
|
| 119 |
+
"source_description": "A long, green cucumber wrapped in clear plastic, resting horizontally on the dark countertop, slightly overlapping the other cucumber and positioned closer to the viewer. Source dataset: EPIC-Kitchens. Scene context: A first-person view of a person holding two whole cucumbers over a dark kitchen counter, with an onion, garlic, a plastic container, a rice cooker, and a living area in the background.",
|
| 120 |
+
"sub_caption": "cucumber 2: A long, green cucumber wrapped in clear plastic.. Scene role: Resting horizontally on the dark countertop next to the sink.",
|
| 121 |
+
"measured_bbox": [
|
| 122 |
+
0.2215,
|
| 123 |
+
0.4465,
|
| 124 |
+
0.4029,
|
| 125 |
+
0.5104
|
| 126 |
+
],
|
| 127 |
+
"detection_confidence": 0.99,
|
| 128 |
+
"ref_style": "white_bg_encyclopedia_photo",
|
| 129 |
+
"ref_image": "references/ref_wrapped_cucumber.png",
|
| 130 |
+
"raw_ref_image": "references/raw_ref_wrapped_cucumber_attempt_01.png",
|
| 131 |
+
"reference_verify": "references/reference_verify_wrapped_cucumber.json",
|
| 132 |
+
"reference_verify_passed": true,
|
| 133 |
+
"reference_attempts": 1,
|
| 134 |
+
"sam_white_bg": {
|
| 135 |
+
"input": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/chaos/samples/sample_000006/references/raw_ref_wrapped_cucumber_attempt_01.png",
|
| 136 |
+
"output": "references/ref_wrapped_cucumber.png",
|
| 137 |
+
"mask": "references/sam_mask_wrapped_cucumber.png",
|
| 138 |
+
"sam_checkpoint": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/checkpoints/sam/sam_vit_b_01ec64.pth",
|
| 139 |
+
"sam_model_type": "vit_b",
|
| 140 |
+
"sam_device": "auto",
|
| 141 |
+
"sam_working_size": [
|
| 142 |
+
640,
|
| 143 |
+
640
|
| 144 |
+
],
|
| 145 |
+
"sam_max_side": 640,
|
| 146 |
+
"sam_downscale": 0.625,
|
| 147 |
+
"prompt_box_xyxy": [
|
| 148 |
+
33.0,
|
| 149 |
+
397.0,
|
| 150 |
+
1011.0,
|
| 151 |
+
624.0
|
| 152 |
+
],
|
| 153 |
+
"mask_score": 3.430612,
|
| 154 |
+
"mask_area_ratio": 0.118574,
|
| 155 |
+
"elapsed_seconds": 7.2551
|
| 156 |
+
}
|
| 157 |
+
},
|
| 158 |
+
{
|
| 159 |
+
"name": "gas_stove",
|
| 160 |
+
"is_person": false,
|
| 161 |
+
"subject_type": "object",
|
| 162 |
+
"source_set": "obj_set",
|
| 163 |
+
"source_image_id": "EPIC-Kitchens:P22_105:object:12",
|
| 164 |
+
"source_name": "stove",
|
| 165 |
+
"source_description": "A gas stove with black grates on the left side. Source dataset: EPIC-Kitchens. Scene context: A kitchen counter area with a stove, a sink, various utensils, bottles, and cabinets.",
|
| 166 |
+
"sub_caption": "stove: A kitchen gas stove with black grates.. Scene role: Positioned along the counter in the background.",
|
| 167 |
+
"measured_bbox": [
|
| 168 |
+
0.03,
|
| 169 |
+
0.345,
|
| 170 |
+
0.318,
|
| 171 |
+
0.444
|
| 172 |
+
],
|
| 173 |
+
"detection_confidence": 0.99,
|
| 174 |
+
"ref_style": "white_bg_encyclopedia_photo",
|
| 175 |
+
"ref_image": "references/ref_gas_stove.png",
|
| 176 |
+
"raw_ref_image": "references/raw_ref_gas_stove_attempt_01.png",
|
| 177 |
+
"reference_verify": "references/reference_verify_gas_stove.json",
|
| 178 |
+
"reference_verify_passed": true,
|
| 179 |
+
"reference_attempts": 1,
|
| 180 |
+
"sam_white_bg": {
|
| 181 |
+
"input": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/chaos/samples/sample_000006/references/raw_ref_gas_stove_attempt_01.png",
|
| 182 |
+
"output": "references/ref_gas_stove.png",
|
| 183 |
+
"mask": "references/sam_mask_gas_stove.png",
|
| 184 |
+
"sam_checkpoint": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/checkpoints/sam/sam_vit_b_01ec64.pth",
|
| 185 |
+
"sam_model_type": "vit_b",
|
| 186 |
+
"sam_device": "auto",
|
| 187 |
+
"sam_working_size": [
|
| 188 |
+
640,
|
| 189 |
+
640
|
| 190 |
+
],
|
| 191 |
+
"sam_max_side": 640,
|
| 192 |
+
"sam_downscale": 0.625,
|
| 193 |
+
"prompt_box_xyxy": [
|
| 194 |
+
58.0,
|
| 195 |
+
180.0,
|
| 196 |
+
965.0,
|
| 197 |
+
842.0
|
| 198 |
+
],
|
| 199 |
+
"mask_score": 3.470988,
|
| 200 |
+
"mask_area_ratio": 0.477615,
|
| 201 |
+
"elapsed_seconds": 7.3908
|
| 202 |
+
}
|
| 203 |
+
},
|
| 204 |
+
{
|
| 205 |
+
"name": "water_pitcher",
|
| 206 |
+
"is_person": false,
|
| 207 |
+
"subject_type": "object",
|
| 208 |
+
"source_set": "obj_set",
|
| 209 |
+
"source_image_id": "EPIC-Kitchens:P07_107:object:13",
|
| 210 |
+
"source_name": "water pitcher",
|
| 211 |
+
"source_description": "A clear plastic water pitcher with a white handle and lid, sitting on the counter. Source dataset: EPIC-Kitchens. Scene context: A narrow kitchen space with a dark floor, light cabinets, a sink counter with various items, a radiator on the wall, and a trash can on the floor.",
|
| 212 |
+
"sub_caption": "water pitcher: A clear plastic water pitcher with a white handle and lid.. Scene role: Sitting upright on the counter.",
|
| 213 |
+
"measured_bbox": [
|
| 214 |
+
0.3327,
|
| 215 |
+
0.2732,
|
| 216 |
+
0.4536,
|
| 217 |
+
0.4573
|
| 218 |
+
],
|
| 219 |
+
"detection_confidence": 0.99,
|
| 220 |
+
"ref_style": "white_bg_encyclopedia_photo",
|
| 221 |
+
"ref_image": "references/ref_water_pitcher.png",
|
| 222 |
+
"raw_ref_image": "references/raw_ref_water_pitcher_attempt_01.png",
|
| 223 |
+
"reference_verify": "references/reference_verify_water_pitcher.json",
|
| 224 |
+
"reference_verify_passed": true,
|
| 225 |
+
"reference_attempts": 1,
|
| 226 |
+
"sam_white_bg": {
|
| 227 |
+
"input": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/chaos/samples/sample_000006/references/raw_ref_water_pitcher_attempt_01.png",
|
| 228 |
+
"output": "references/ref_water_pitcher.png",
|
| 229 |
+
"mask": "references/sam_mask_water_pitcher.png",
|
| 230 |
+
"sam_checkpoint": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/checkpoints/sam/sam_vit_b_01ec64.pth",
|
| 231 |
+
"sam_model_type": "vit_b",
|
| 232 |
+
"sam_device": "auto",
|
| 233 |
+
"sam_working_size": [
|
| 234 |
+
640,
|
| 235 |
+
640
|
| 236 |
+
],
|
| 237 |
+
"sam_max_side": 640,
|
| 238 |
+
"sam_downscale": 0.625,
|
| 239 |
+
"prompt_box_xyxy": [
|
| 240 |
+
242.0,
|
| 241 |
+
115.0,
|
| 242 |
+
856.0,
|
| 243 |
+
972.0
|
| 244 |
+
],
|
| 245 |
+
"mask_score": 3.323768,
|
| 246 |
+
"mask_area_ratio": 0.450877,
|
| 247 |
+
"elapsed_seconds": 7.2849
|
| 248 |
+
}
|
| 249 |
+
},
|
| 250 |
+
{
|
| 251 |
+
"name": "silver_spoon",
|
| 252 |
+
"is_person": false,
|
| 253 |
+
"subject_type": "object",
|
| 254 |
+
"source_set": "obj_set",
|
| 255 |
+
"source_image_id": "EPIC-Kitchens:P04_103:object:9",
|
| 256 |
+
"source_name": "Silver Spoon",
|
| 257 |
+
"source_description": "Small silver metal spoon resting near the black spatula handle. Source dataset: EPIC-Kitchens. Scene context: A messy kitchen counter with a stove, toaster, and various cooking utensils scattered around.",
|
| 258 |
+
"sub_caption": "Silver Spoon: A small silver metal spoon.. Scene role: Laying flat on the messy countertop near the cucumber.",
|
| 259 |
+
"measured_bbox": [
|
| 260 |
+
0.3001,
|
| 261 |
+
0.4801,
|
| 262 |
+
0.3988,
|
| 263 |
+
0.539
|
| 264 |
+
],
|
| 265 |
+
"detection_confidence": 0.99,
|
| 266 |
+
"ref_style": "white_bg_encyclopedia_photo",
|
| 267 |
+
"ref_image": "references/ref_silver_spoon.png",
|
| 268 |
+
"raw_ref_image": "references/raw_ref_silver_spoon_attempt_01.png",
|
| 269 |
+
"reference_verify": "references/reference_verify_silver_spoon.json",
|
| 270 |
+
"reference_verify_passed": true,
|
| 271 |
+
"reference_attempts": 1,
|
| 272 |
+
"sam_white_bg": {
|
| 273 |
+
"input": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/chaos/samples/sample_000006/references/raw_ref_silver_spoon_attempt_01.png",
|
| 274 |
+
"output": "references/ref_silver_spoon.png",
|
| 275 |
+
"mask": "references/sam_mask_silver_spoon.png",
|
| 276 |
+
"sam_checkpoint": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/checkpoints/sam/sam_vit_b_01ec64.pth",
|
| 277 |
+
"sam_model_type": "vit_b",
|
| 278 |
+
"sam_device": "auto",
|
| 279 |
+
"sam_working_size": [
|
| 280 |
+
640,
|
| 281 |
+
640
|
| 282 |
+
],
|
| 283 |
+
"sam_max_side": 640,
|
| 284 |
+
"sam_downscale": 0.625,
|
| 285 |
+
"prompt_box_xyxy": [
|
| 286 |
+
88.0,
|
| 287 |
+
77.0,
|
| 288 |
+
916.0,
|
| 289 |
+
950.0
|
| 290 |
+
],
|
| 291 |
+
"mask_score": 3.449565,
|
| 292 |
+
"mask_area_ratio": 0.092279,
|
| 293 |
+
"elapsed_seconds": 7.0866
|
| 294 |
+
}
|
| 295 |
+
}
|
| 296 |
+
],
|
| 297 |
+
"not_emitted": [
|
| 298 |
+
{
|
| 299 |
+
"name": "black_pot",
|
| 300 |
+
"reason": "not_detected"
|
| 301 |
+
},
|
| 302 |
+
{
|
| 303 |
+
"name": "kitchen_faucet",
|
| 304 |
+
"reason": "not_detected"
|
| 305 |
+
}
|
| 306 |
+
],
|
| 307 |
+
"model_ids": {
|
| 308 |
+
"chat_model": "gcp/google/gemini-3.1-pro-preview",
|
| 309 |
+
"image_model": "gcp/google/gemini-3-pro-image-preview"
|
| 310 |
+
}
|
| 311 |
+
}
|