Upload folder using huggingface_hub
#4
by kimi000 - opened
This view is limited to 50 files because it contains too many changes. See the raw diff here.
- .gitattributes +170 -0
- samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/README.md +16 -0
- samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/dataset.json +0 -0
- samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/dataset.jsonl +0 -0
- samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000001/bbox_overlay.png +3 -0
- samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000001/compose_prompt.txt +63 -0
- samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000001/crops/detect_refine_metal_barrier.png +3 -0
- samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000001/crops/detect_refine_parked_dark_car.png +3 -0
- samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000001/crops/detect_refine_pedestrian.png +3 -0
- samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000001/crops/diversify_input_metal_barrier.png +3 -0
- samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000001/crops/diversify_input_parked_dark_car.png +3 -0
- samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000001/crops/diversify_input_pedestrian.png +3 -0
- samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000001/detections.json +59 -0
- samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000001/main_image.png +3 -0
- samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000001/plan.json +107 -0
- samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000001/references.json +101 -0
- samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000001/references/ref_metal_barrier.png +3 -0
- samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000001/references/ref_parked_dark_car.png +3 -0
- samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000001/references/ref_pedestrian.png +3 -0
- samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000001/references/reference_verify_metal_barrier.json +46 -0
- samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000001/references/reference_verify_parked_dark_car.json +46 -0
- samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000001/references/reference_verify_pedestrian.json +46 -0
- samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000001/references/sam_mask_metal_barrier.png +0 -0
- samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000001/references/sam_mask_parked_dark_car.png +0 -0
- samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000001/references/sam_mask_pedestrian.png +0 -0
- samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000001/row.json +164 -0
- samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000001/vocab_task.json +56 -0
- samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/bbox_overlay.png +3 -0
- samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/compose_prompt.txt +159 -0
- samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/crops/detect_refine_city_buildings.png +3 -0
- samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/crops/detect_refine_drainage_grate.png +0 -0
- samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/crops/detect_refine_parked_car_left.png +0 -0
- samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/crops/detect_refine_parked_suv_right.png +0 -0
- samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/crops/detect_refine_pedestrian_walking.png +0 -0
- samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/crops/detect_refine_shop_pedestrian.png +0 -0
- samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/crops/detect_refine_storefront_sign.png +0 -0
- samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/crops/detect_refine_street_light.png +3 -0
- samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/crops/detect_refine_street_signs.png +0 -0
- samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/crops/detect_refine_street_trees.png +3 -0
- samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/crops/detect_refine_traveling_dark_suv.png +0 -0
- samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/crops/detect_refine_twilight_sky.png +3 -0
- samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/crops/detect_refine_vehicle_dashboard.png +3 -0
- samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/crops/detect_refine_white_car.png +0 -0
- samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/crops/detect_refine_yellow_lines.png +0 -0
- samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/crops/diversify_input_city_buildings.png +3 -0
- samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/crops/diversify_input_drainage_grate.png +0 -0
- samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/crops/diversify_input_parked_car_left.png +0 -0
- samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/crops/diversify_input_parked_suv_right.png +0 -0
- samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/crops/diversify_input_pedestrian_walking.png +0 -0
- samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/crops/diversify_input_shop_pedestrian.png +0 -0
.gitattributes
CHANGED
|
@@ -52,3 +52,173 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
| 52 |
10samples/sample_0007/overlays/overlay_accepted.png filter=lfs diff=lfs merge=lfs -text
|
| 53 |
10samples/sample_0007/overlays/overlay_intended.png filter=lfs diff=lfs merge=lfs -text
|
| 54 |
10samples/sample_0007/overlays/overlay_measured.png filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 52 |
10samples/sample_0007/overlays/overlay_accepted.png filter=lfs diff=lfs merge=lfs -text
|
| 53 |
10samples/sample_0007/overlays/overlay_intended.png filter=lfs diff=lfs merge=lfs -text
|
| 54 |
10samples/sample_0007/overlays/overlay_measured.png filter=lfs diff=lfs merge=lfs -text
|
| 55 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000001/bbox_overlay.png filter=lfs diff=lfs merge=lfs -text
|
| 56 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000001/crops/detect_refine_metal_barrier.png filter=lfs diff=lfs merge=lfs -text
|
| 57 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000001/crops/detect_refine_parked_dark_car.png filter=lfs diff=lfs merge=lfs -text
|
| 58 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000001/crops/detect_refine_pedestrian.png filter=lfs diff=lfs merge=lfs -text
|
| 59 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000001/crops/diversify_input_metal_barrier.png filter=lfs diff=lfs merge=lfs -text
|
| 60 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000001/crops/diversify_input_parked_dark_car.png filter=lfs diff=lfs merge=lfs -text
|
| 61 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000001/crops/diversify_input_pedestrian.png filter=lfs diff=lfs merge=lfs -text
|
| 62 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000001/main_image.png filter=lfs diff=lfs merge=lfs -text
|
| 63 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000001/references/ref_metal_barrier.png filter=lfs diff=lfs merge=lfs -text
|
| 64 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000001/references/ref_parked_dark_car.png filter=lfs diff=lfs merge=lfs -text
|
| 65 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000001/references/ref_pedestrian.png filter=lfs diff=lfs merge=lfs -text
|
| 66 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/bbox_overlay.png filter=lfs diff=lfs merge=lfs -text
|
| 67 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/crops/detect_refine_city_buildings.png filter=lfs diff=lfs merge=lfs -text
|
| 68 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/crops/detect_refine_street_light.png filter=lfs diff=lfs merge=lfs -text
|
| 69 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/crops/detect_refine_street_trees.png filter=lfs diff=lfs merge=lfs -text
|
| 70 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/crops/detect_refine_twilight_sky.png filter=lfs diff=lfs merge=lfs -text
|
| 71 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/crops/detect_refine_vehicle_dashboard.png filter=lfs diff=lfs merge=lfs -text
|
| 72 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/crops/diversify_input_city_buildings.png filter=lfs diff=lfs merge=lfs -text
|
| 73 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/crops/diversify_input_street_light.png filter=lfs diff=lfs merge=lfs -text
|
| 74 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/crops/diversify_input_street_trees.png filter=lfs diff=lfs merge=lfs -text
|
| 75 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/crops/diversify_input_twilight_sky.png filter=lfs diff=lfs merge=lfs -text
|
| 76 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/crops/diversify_input_vehicle_dashboard.png filter=lfs diff=lfs merge=lfs -text
|
| 77 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/main_image.png filter=lfs diff=lfs merge=lfs -text
|
| 78 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/references/ref_city_buildings.png filter=lfs diff=lfs merge=lfs -text
|
| 79 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/references/ref_drainage_grate.png filter=lfs diff=lfs merge=lfs -text
|
| 80 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/references/ref_parked_car_left.png filter=lfs diff=lfs merge=lfs -text
|
| 81 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/references/ref_parked_suv_right.png filter=lfs diff=lfs merge=lfs -text
|
| 82 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/references/ref_pedestrian_walking.png filter=lfs diff=lfs merge=lfs -text
|
| 83 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/references/ref_shop_pedestrian.png filter=lfs diff=lfs merge=lfs -text
|
| 84 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/references/ref_storefront_sign.png filter=lfs diff=lfs merge=lfs -text
|
| 85 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/references/ref_street_signs.png filter=lfs diff=lfs merge=lfs -text
|
| 86 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/references/ref_street_trees.png filter=lfs diff=lfs merge=lfs -text
|
| 87 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/references/ref_traveling_dark_suv.png filter=lfs diff=lfs merge=lfs -text
|
| 88 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/references/ref_twilight_sky.png filter=lfs diff=lfs merge=lfs -text
|
| 89 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/references/ref_vehicle_dashboard.png filter=lfs diff=lfs merge=lfs -text
|
| 90 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/references/ref_white_car.png filter=lfs diff=lfs merge=lfs -text
|
| 91 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/references/ref_yellow_lines.png filter=lfs diff=lfs merge=lfs -text
|
| 92 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000003/bbox_overlay.png filter=lfs diff=lfs merge=lfs -text
|
| 93 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000003/crops/detect_refine_black_sedan.png filter=lfs diff=lfs merge=lfs -text
|
| 94 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000003/crops/detect_refine_silver_car.png filter=lfs diff=lfs merge=lfs -text
|
| 95 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000003/crops/detect_refine_waiting_pedestrian.png filter=lfs diff=lfs merge=lfs -text
|
| 96 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000003/crops/diversify_input_black_sedan.png filter=lfs diff=lfs merge=lfs -text
|
| 97 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000003/crops/diversify_input_silver_car.png filter=lfs diff=lfs merge=lfs -text
|
| 98 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000003/crops/diversify_input_waiting_pedestrian.png filter=lfs diff=lfs merge=lfs -text
|
| 99 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000003/main_image.png filter=lfs diff=lfs merge=lfs -text
|
| 100 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000003/references/ref_black_sedan.png filter=lfs diff=lfs merge=lfs -text
|
| 101 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000003/references/ref_silver_car.png filter=lfs diff=lfs merge=lfs -text
|
| 102 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000003/references/ref_waiting_pedestrian.png filter=lfs diff=lfs merge=lfs -text
|
| 103 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000004/bbox_overlay.png filter=lfs diff=lfs merge=lfs -text
|
| 104 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000004/crops/detect_refine_dark_parked_car.png filter=lfs diff=lfs merge=lfs -text
|
| 105 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000004/crops/detect_refine_street_lines.png filter=lfs diff=lfs merge=lfs -text
|
| 106 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000004/crops/diversify_input_dark_parked_car.png filter=lfs diff=lfs merge=lfs -text
|
| 107 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000004/crops/diversify_input_street_lines.png filter=lfs diff=lfs merge=lfs -text
|
| 108 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000004/main_image.png filter=lfs diff=lfs merge=lfs -text
|
| 109 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000004/references/ref_dark_parked_car.png filter=lfs diff=lfs merge=lfs -text
|
| 110 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000004/references/ref_delivery_truck.png filter=lfs diff=lfs merge=lfs -text
|
| 111 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000004/references/ref_street_lines.png filter=lfs diff=lfs merge=lfs -text
|
| 112 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000004/references/ref_traffic_light.png filter=lfs diff=lfs merge=lfs -text
|
| 113 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000004/references/ref_walker.png filter=lfs diff=lfs merge=lfs -text
|
| 114 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000005/bbox_overlay.png filter=lfs diff=lfs merge=lfs -text
|
| 115 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000005/crops/detect_refine_concrete_barrier.png filter=lfs diff=lfs merge=lfs -text
|
| 116 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000005/crops/detect_refine_silver_car.png filter=lfs diff=lfs merge=lfs -text
|
| 117 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000005/crops/diversify_input_concrete_barrier.png filter=lfs diff=lfs merge=lfs -text
|
| 118 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000005/crops/diversify_input_silver_car.png filter=lfs diff=lfs merge=lfs -text
|
| 119 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000005/crops/diversify_input_uniformed_officer.png filter=lfs diff=lfs merge=lfs -text
|
| 120 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000005/main_image.png filter=lfs diff=lfs merge=lfs -text
|
| 121 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000005/references/ref_bystander_in_suit.png filter=lfs diff=lfs merge=lfs -text
|
| 122 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000005/references/ref_concrete_barrier.png filter=lfs diff=lfs merge=lfs -text
|
| 123 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000005/references/ref_firefighter.png filter=lfs diff=lfs merge=lfs -text
|
| 124 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000005/references/ref_silver_car.png filter=lfs diff=lfs merge=lfs -text
|
| 125 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000005/references/ref_traffic_light.png filter=lfs diff=lfs merge=lfs -text
|
| 126 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000005/references/ref_uniformed_officer.png filter=lfs diff=lfs merge=lfs -text
|
| 127 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000006/bbox_overlay.png filter=lfs diff=lfs merge=lfs -text
|
| 128 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000006/crops/detect_refine_dark_building_facade.png filter=lfs diff=lfs merge=lfs -text
|
| 129 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000006/crops/detect_refine_double_solid_line.png filter=lfs diff=lfs merge=lfs -text
|
| 130 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000006/crops/diversify_input_dark_building_facade.png filter=lfs diff=lfs merge=lfs -text
|
| 131 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000006/crops/diversify_input_double_solid_line.png filter=lfs diff=lfs merge=lfs -text
|
| 132 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000006/crops/diversify_input_white_panel_van.png filter=lfs diff=lfs merge=lfs -text
|
| 133 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000006/main_image.png filter=lfs diff=lfs merge=lfs -text
|
| 134 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000006/references/ref_awning_building_corner.png filter=lfs diff=lfs merge=lfs -text
|
| 135 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000006/references/ref_dark_building_facade.png filter=lfs diff=lfs merge=lfs -text
|
| 136 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000006/references/ref_distant_pedestrian.png filter=lfs diff=lfs merge=lfs -text
|
| 137 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000006/references/ref_double_solid_line.png filter=lfs diff=lfs merge=lfs -text
|
| 138 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000006/references/ref_emergency_vehicle.png filter=lfs diff=lfs merge=lfs -text
|
| 139 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000006/references/ref_green_street_sign.png filter=lfs diff=lfs merge=lfs -text
|
| 140 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000006/references/ref_vertical_illuminated_sign.png filter=lfs diff=lfs merge=lfs -text
|
| 141 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000006/references/ref_white_panel_van.png filter=lfs diff=lfs merge=lfs -text
|
| 142 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000007/bbox_overlay.png filter=lfs diff=lfs merge=lfs -text
|
| 143 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000007/crops/detect_refine_brick_building_right.png filter=lfs diff=lfs merge=lfs -text
|
| 144 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000007/crops/detect_refine_crosswalk_markings.png filter=lfs diff=lfs merge=lfs -text
|
| 145 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000007/crops/detect_refine_dashboard.png filter=lfs diff=lfs merge=lfs -text
|
| 146 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000007/crops/detect_refine_iron_balcony.png filter=lfs diff=lfs merge=lfs -text
|
| 147 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000007/crops/detect_refine_multi_story_building_left.png filter=lfs diff=lfs merge=lfs -text
|
| 148 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000007/crops/detect_refine_overhead_wires.png filter=lfs diff=lfs merge=lfs -text
|
| 149 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000007/crops/detect_refine_street_light_pole.png filter=lfs diff=lfs merge=lfs -text
|
| 150 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000007/crops/diversify_input_dashboard.png filter=lfs diff=lfs merge=lfs -text
|
| 151 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000007/crops/diversify_input_iron_balcony.png filter=lfs diff=lfs merge=lfs -text
|
| 152 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000007/crops/diversify_input_multi_story_building_left.png filter=lfs diff=lfs merge=lfs -text
|
| 153 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000007/crops/diversify_input_overhead_wires.png filter=lfs diff=lfs merge=lfs -text
|
| 154 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000007/crops/diversify_input_street_light_pole.png filter=lfs diff=lfs merge=lfs -text
|
| 155 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000007/main_image.png filter=lfs diff=lfs merge=lfs -text
|
| 156 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000007/references/ref_brick_building_right.png filter=lfs diff=lfs merge=lfs -text
|
| 157 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000007/references/ref_bunch_of_balloons.png filter=lfs diff=lfs merge=lfs -text
|
| 158 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000007/references/ref_crosswalk_markings.png filter=lfs diff=lfs merge=lfs -text
|
| 159 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000007/references/ref_dark_car_1.png filter=lfs diff=lfs merge=lfs -text
|
| 160 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000007/references/ref_dark_car_2.png filter=lfs diff=lfs merge=lfs -text
|
| 161 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000007/references/ref_dashboard.png filter=lfs diff=lfs merge=lfs -text
|
| 162 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000007/references/ref_iron_balcony.png filter=lfs diff=lfs merge=lfs -text
|
| 163 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000007/references/ref_multi_story_building_left.png filter=lfs diff=lfs merge=lfs -text
|
| 164 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000007/references/ref_overhead_wires.png filter=lfs diff=lfs merge=lfs -text
|
| 165 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000007/references/ref_white_garbage_bag.png filter=lfs diff=lfs merge=lfs -text
|
| 166 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000007/references/ref_white_sedan.png filter=lfs diff=lfs merge=lfs -text
|
| 167 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000007/references/ref_woman_in_dark_dress.png filter=lfs diff=lfs merge=lfs -text
|
| 168 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000008/bbox_overlay.png filter=lfs diff=lfs merge=lfs -text
|
| 169 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000008/crops/detect_refine_dashboard_reflection.png filter=lfs diff=lfs merge=lfs -text
|
| 170 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000008/crops/detect_refine_pedestrian_walking_away.png filter=lfs diff=lfs merge=lfs -text
|
| 171 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000008/crops/detect_refine_street_lamp.png filter=lfs diff=lfs merge=lfs -text
|
| 172 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000008/crops/diversify_input_dashboard_reflection.png filter=lfs diff=lfs merge=lfs -text
|
| 173 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000008/crops/diversify_input_pedestrian_walking_away.png filter=lfs diff=lfs merge=lfs -text
|
| 174 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000008/crops/diversify_input_sign_holder.png filter=lfs diff=lfs merge=lfs -text
|
| 175 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000008/crops/diversify_input_street_lamp.png filter=lfs diff=lfs merge=lfs -text
|
| 176 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000008/crops/diversify_input_woman_waiting.png filter=lfs diff=lfs merge=lfs -text
|
| 177 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000008/crops/diversify_input_young_man_waiting.png filter=lfs diff=lfs merge=lfs -text
|
| 178 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000008/main_image.png filter=lfs diff=lfs merge=lfs -text
|
| 179 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000008/references/ref_businessman_waiting.png filter=lfs diff=lfs merge=lfs -text
|
| 180 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000008/references/ref_dashboard_reflection.png filter=lfs diff=lfs merge=lfs -text
|
| 181 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000008/references/ref_pedestrian_crossing_right.png filter=lfs diff=lfs merge=lfs -text
|
| 182 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000008/references/ref_pedestrian_standing.png filter=lfs diff=lfs merge=lfs -text
|
| 183 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000008/references/ref_pedestrian_walking_away.png filter=lfs diff=lfs merge=lfs -text
|
| 184 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000008/references/ref_pedestrian_walking_away_sidewalk.png filter=lfs diff=lfs merge=lfs -text
|
| 185 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000008/references/ref_sign_holder.png filter=lfs diff=lfs merge=lfs -text
|
| 186 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000008/references/ref_street_lamp.png filter=lfs diff=lfs merge=lfs -text
|
| 187 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000008/references/ref_woman_waiting.png filter=lfs diff=lfs merge=lfs -text
|
| 188 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000008/references/ref_young_man_waiting.png filter=lfs diff=lfs merge=lfs -text
|
| 189 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000009/bbox_overlay.png filter=lfs diff=lfs merge=lfs -text
|
| 190 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000009/crops/detect_refine_metal_railing.png filter=lfs diff=lfs merge=lfs -text
|
| 191 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000009/crops/detect_refine_overpass.png filter=lfs diff=lfs merge=lfs -text
|
| 192 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000009/crops/detect_refine_yellow_lane_line.png filter=lfs diff=lfs merge=lfs -text
|
| 193 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000009/crops/diversify_input_metal_railing.png filter=lfs diff=lfs merge=lfs -text
|
| 194 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000009/crops/diversify_input_overpass.png filter=lfs diff=lfs merge=lfs -text
|
| 195 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000009/crops/diversify_input_street_light.png filter=lfs diff=lfs merge=lfs -text
|
| 196 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000009/crops/diversify_input_yellow_lane_line.png filter=lfs diff=lfs merge=lfs -text
|
| 197 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000009/main_image.png filter=lfs diff=lfs merge=lfs -text
|
| 198 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000009/references/ref_metal_railing.png filter=lfs diff=lfs merge=lfs -text
|
| 199 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000009/references/ref_overpass.png filter=lfs diff=lfs merge=lfs -text
|
| 200 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000009/references/ref_pedestrian_in_suit.png filter=lfs diff=lfs merge=lfs -text
|
| 201 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000009/references/ref_yellow_lane_line.png filter=lfs diff=lfs merge=lfs -text
|
| 202 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000010/bbox_overlay.png filter=lfs diff=lfs merge=lfs -text
|
| 203 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000010/crops/detect_refine_black_suv.png filter=lfs diff=lfs merge=lfs -text
|
| 204 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000010/crops/detect_refine_man_in_grey_sweater.png filter=lfs diff=lfs merge=lfs -text
|
| 205 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000010/crops/detect_refine_pedestrian_in_light_blue.png filter=lfs diff=lfs merge=lfs -text
|
| 206 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000010/crops/detect_refine_pedestrian_in_striped_shirt.png filter=lfs diff=lfs merge=lfs -text
|
| 207 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000010/crops/detect_refine_pedestrian_walking_away.png filter=lfs diff=lfs merge=lfs -text
|
| 208 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000010/crops/diversify_input_black_suv.png filter=lfs diff=lfs merge=lfs -text
|
| 209 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000010/crops/diversify_input_man_in_grey_sweater.png filter=lfs diff=lfs merge=lfs -text
|
| 210 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000010/crops/diversify_input_man_in_pink_shirt.png filter=lfs diff=lfs merge=lfs -text
|
| 211 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000010/crops/diversify_input_pedestrian_in_light_blue.png filter=lfs diff=lfs merge=lfs -text
|
| 212 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000010/crops/diversify_input_pedestrian_in_striped_shirt.png filter=lfs diff=lfs merge=lfs -text
|
| 213 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000010/crops/diversify_input_pedestrian_walking_away.png filter=lfs diff=lfs merge=lfs -text
|
| 214 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000010/crops/diversify_input_pedestrian_with_backpack.png filter=lfs diff=lfs merge=lfs -text
|
| 215 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000010/main_image.png filter=lfs diff=lfs merge=lfs -text
|
| 216 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000010/references/ref_black_suv.png filter=lfs diff=lfs merge=lfs -text
|
| 217 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000010/references/ref_man_in_grey_sweater.png filter=lfs diff=lfs merge=lfs -text
|
| 218 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000010/references/ref_man_in_pink_shirt.png filter=lfs diff=lfs merge=lfs -text
|
| 219 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000010/references/ref_pedestrian_in_light_blue.png filter=lfs diff=lfs merge=lfs -text
|
| 220 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000010/references/ref_pedestrian_in_light_jacket.png filter=lfs diff=lfs merge=lfs -text
|
| 221 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000010/references/ref_pedestrian_in_red.png filter=lfs diff=lfs merge=lfs -text
|
| 222 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000010/references/ref_pedestrian_in_striped_shirt.png filter=lfs diff=lfs merge=lfs -text
|
| 223 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000010/references/ref_pedestrian_walking_away.png filter=lfs diff=lfs merge=lfs -text
|
| 224 |
+
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000010/references/ref_pedestrian_with_backpack.png filter=lfs diff=lfs merge=lfs -text
|
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/README.md
ADDED
|
@@ -0,0 +1,16 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# samples_v8
|
| 2 |
+
|
| 3 |
+
Generated with `data_recipe_v8.md`: vocabulary-first planning, adaptive canvas selection, structured JSON compose prompts, no identity verification, no gate, SAM white-background reference postprocessing, and strict reference-completeness verification with regenerate-until-pass behavior.
|
| 4 |
+
|
| 5 |
+
- chat model: `gcp/google/gemini-3.1-pro-preview`
|
| 6 |
+
- image model: `gcp/google/gemini-3-pro-image-preview`
|
| 7 |
+
- people references: `white_bg_full_body_front`
|
| 8 |
+
- non-person references: `white_bg_encyclopedia_photo`
|
| 9 |
+
- SAM postprocess: every generated reference is segmented with `sam_vit_b` and pasted onto pure `#ffffff` background
|
| 10 |
+
- reference verify max attempts per subject: `10`
|
| 11 |
+
- allowed canvases: `[{"aspect_ratio": "1:1", "size": [1024, 1024], "style": "photorealistic"}, {"aspect_ratio": "4:3", "size": [1152, 864], "style": "photorealistic"}, {"aspect_ratio": "3:4", "size": [864, 1152], "style": "photorealistic"}, {"aspect_ratio": "3:2", "size": [1248, 832], "style": "photorealistic"}, {"aspect_ratio": "2:3", "size": [832, 1248], "style": "photorealistic"}, {"aspect_ratio": "16:9", "size": [1280, 720], "style": "photorealistic"}, {"aspect_ratio": "9:16", "size": [720, 1280], "style": "photorealistic"}]`
|
| 12 |
+
- scenario mode: `driving`
|
| 13 |
+
- pools: `vocab_task_pool`, `plan_pool`, `scene_pool`, `detection_pool`, `reference_pool`
|
| 14 |
+
- bbox overlay: `bbox_overlay.png` draws every planned subject bbox; a sample is rejected and regenerated if any planned subject is still missing after VLM detection retries
|
| 15 |
+
- detection max attempts per subject: `3`
|
| 16 |
+
- launch args: `{"compose_workers": 3, "detect_max_attempts": 3, "detect_workers": 3, "emit_workers": 4, "idle_sleep": 1.0, "image_inflight": 32, "image_interval": 0.05, "image_max_retries": 8, "max_retries": 3, "no_topup": false, "plan_workers": 6, "ref_verify_max_attempts": 10, "reference_workers": 6, "requeue_in_progress": true, "seed": 1781927993, "status_interval": 30.0, "subject_detect_workers": 24, "target_samples": 10}`
|
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/dataset.json
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/dataset.jsonl
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000001/bbox_overlay.png
ADDED
|
Git LFS Details
|
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000001/compose_prompt.txt
ADDED
|
@@ -0,0 +1,63 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Render the following JSON scene specification as a photorealistic 1248x832 image using a true 3:2 canvas. The rendered image must be a coherent driving scenario with an outdoor road, street, highway, intersection, curbside, parking, or traffic environment; do not render a non-driving indoor scene or product-catalog scene. Every listed person and object must appear visibly in the image. Keep normal proportions and the requested aspect ratio. The foreground must contain only subjects explicitly listed in the JSON scene specification. Do not add any unlisted foreground people, animals, vehicles, props, tools, products, signs, readable text, logos, or other localizable subjects. Background context may include non-localizable scenery only when it does not introduce a distinct foreground subject. No text, no labels, no logos, no watermarks.
|
| 2 |
+
JSON scene specification:
|
| 3 |
+
{
|
| 4 |
+
"format": "structured_json_prompt",
|
| 5 |
+
"canvas": {
|
| 6 |
+
"size": [
|
| 7 |
+
1248,
|
| 8 |
+
832
|
| 9 |
+
],
|
| 10 |
+
"aspect_ratio": "3:2",
|
| 11 |
+
"style": "photorealistic"
|
| 12 |
+
},
|
| 13 |
+
"scene": {
|
| 14 |
+
"setting": "A curbside along a city street on an overcast day",
|
| 15 |
+
"activity": "A pedestrian is walking along the edge of the street near a parked dark car and a temporary metal barricade",
|
| 16 |
+
"composition": "Medium wide shot, eye-level perspective. The pedestrian is situated in the foreground-left, walking parallel to the curb. A silver metal barrier forms a line separating the walking area from the street, and a dark sedan is parked on the right side of the frame.",
|
| 17 |
+
"constraints": [
|
| 18 |
+
"no text",
|
| 19 |
+
"no labels",
|
| 20 |
+
"no watermarks",
|
| 21 |
+
"true 3:2 composition",
|
| 22 |
+
"final canvas size 1248x832",
|
| 23 |
+
"normal human and object proportions",
|
| 24 |
+
"no squeezed perspective",
|
| 25 |
+
"no anamorphic stretching",
|
| 26 |
+
"every listed person and object must be visibly present",
|
| 27 |
+
"the foreground may contain only the listed people and objects",
|
| 28 |
+
"no extra foreground people, animals, vehicles, props, tools, products, signs, readable text, logos, or other localizable subjects absent from this JSON",
|
| 29 |
+
"the entire image must be a coherent driving scenario",
|
| 30 |
+
"the scene must include an outdoor road, street, highway, intersection, curbside, parking, or traffic environment",
|
| 31 |
+
"integrate all listed subjects as road users, vehicles, roadside objects, traffic infrastructure, or driving-context objects",
|
| 32 |
+
"do not render an office, kitchen, studio, product catalog, indoor room, or unrelated non-driving scene"
|
| 33 |
+
]
|
| 34 |
+
},
|
| 35 |
+
"people": [
|
| 36 |
+
{
|
| 37 |
+
"name": "pedestrian",
|
| 38 |
+
"source_index": 1,
|
| 39 |
+
"source_image_id": "CrowdHuman:data/data_69/273278,12fc4700013112375.jpg:person:3",
|
| 40 |
+
"source_name": "pedestrian",
|
| 41 |
+
"description": "A person wearing a dark coat and trousers, walking confidently.",
|
| 42 |
+
"role_in_scene": "Walking along the curbside near the barrier."
|
| 43 |
+
}
|
| 44 |
+
],
|
| 45 |
+
"objects": [
|
| 46 |
+
{
|
| 47 |
+
"name": "parked_dark_car",
|
| 48 |
+
"source_index": 1,
|
| 49 |
+
"source_image_id": "BDD100K:bcb356f6-520dd65c:object:9",
|
| 50 |
+
"source_name": "parked dark car",
|
| 51 |
+
"description": "A dark-colored sedan.",
|
| 52 |
+
"role_in_scene": "Parked on the street near the curb in the background right."
|
| 53 |
+
},
|
| 54 |
+
{
|
| 55 |
+
"name": "metal_barrier",
|
| 56 |
+
"source_index": 0,
|
| 57 |
+
"source_image_id": "CrowdHuman:data/data_74/284193,1da20000b642be5b.jpg:object:5",
|
| 58 |
+
"source_name": "metal barrier",
|
| 59 |
+
"description": "A silver metal barricade placed along the street.",
|
| 60 |
+
"role_in_scene": "Positioned along the curb to section off the pedestrian area from the road."
|
| 61 |
+
}
|
| 62 |
+
]
|
| 63 |
+
}
|
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000001/crops/detect_refine_metal_barrier.png
ADDED
|
Git LFS Details
|
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000001/crops/detect_refine_parked_dark_car.png
ADDED
|
Git LFS Details
|
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000001/crops/detect_refine_pedestrian.png
ADDED
|
Git LFS Details
|
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000001/crops/diversify_input_metal_barrier.png
ADDED
|
Git LFS Details
|
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000001/crops/diversify_input_parked_dark_car.png
ADDED
|
Git LFS Details
|
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000001/crops/diversify_input_pedestrian.png
ADDED
|
Git LFS Details
|
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000001/detections.json
ADDED
|
@@ -0,0 +1,59 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"name": "pedestrian",
|
| 4 |
+
"present": true,
|
| 5 |
+
"bbox": [
|
| 6 |
+
0.1528,
|
| 7 |
+
0.301,
|
| 8 |
+
0.2511,
|
| 9 |
+
0.7071
|
| 10 |
+
],
|
| 11 |
+
"confidence": 0.98,
|
| 12 |
+
"notes": "The closest and most prominent pedestrian matches the description provided perfectly.",
|
| 13 |
+
"coarse_bbox": [
|
| 14 |
+
0.15,
|
| 15 |
+
0.303,
|
| 16 |
+
0.251,
|
| 17 |
+
0.709
|
| 18 |
+
],
|
| 19 |
+
"refine_crop": "crops/detect_refine_pedestrian.png"
|
| 20 |
+
},
|
| 21 |
+
{
|
| 22 |
+
"name": "parked_dark_car",
|
| 23 |
+
"present": true,
|
| 24 |
+
"bbox": [
|
| 25 |
+
0.5163,
|
| 26 |
+
0.3897,
|
| 27 |
+
0.9968,
|
| 28 |
+
0.9244
|
| 29 |
+
],
|
| 30 |
+
"confidence": 0.98,
|
| 31 |
+
"notes": "The large dark gray sedan taking up most of the crop matches the description of 'parked dark car'.",
|
| 32 |
+
"coarse_bbox": [
|
| 33 |
+
0.516,
|
| 34 |
+
0.39,
|
| 35 |
+
0.995,
|
| 36 |
+
0.917
|
| 37 |
+
],
|
| 38 |
+
"refine_crop": "crops/detect_refine_parked_dark_car.png"
|
| 39 |
+
},
|
| 40 |
+
{
|
| 41 |
+
"name": "metal_barrier",
|
| 42 |
+
"present": true,
|
| 43 |
+
"bbox": [
|
| 44 |
+
0.3454,
|
| 45 |
+
0.4302,
|
| 46 |
+
0.5465,
|
| 47 |
+
0.8402
|
| 48 |
+
],
|
| 49 |
+
"confidence": 0.98,
|
| 50 |
+
"notes": "A prominent silver metal barricade is clearly visible in the foreground, taking up a significant portion of the image. The bounding box tightly encompasses this main barricade.",
|
| 51 |
+
"coarse_bbox": [
|
| 52 |
+
0.339,
|
| 53 |
+
0.432,
|
| 54 |
+
0.556,
|
| 55 |
+
0.839
|
| 56 |
+
],
|
| 57 |
+
"refine_crop": "crops/detect_refine_metal_barrier.png"
|
| 58 |
+
}
|
| 59 |
+
]
|
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000001/main_image.png
ADDED
|
Git LFS Details
|
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000001/plan.json
ADDED
|
@@ -0,0 +1,107 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"sample_id": "sample_000001",
|
| 3 |
+
"target_total": 3,
|
| 4 |
+
"target_people": 1,
|
| 5 |
+
"target_objects": 2,
|
| 6 |
+
"compose_prompt": {
|
| 7 |
+
"format": "structured_json_prompt",
|
| 8 |
+
"canvas": {
|
| 9 |
+
"size": [
|
| 10 |
+
1248,
|
| 11 |
+
832
|
| 12 |
+
],
|
| 13 |
+
"aspect_ratio": "3:2",
|
| 14 |
+
"style": "photorealistic"
|
| 15 |
+
},
|
| 16 |
+
"scene": {
|
| 17 |
+
"setting": "A curbside along a city street on an overcast day",
|
| 18 |
+
"activity": "A pedestrian is walking along the edge of the street near a parked dark car and a temporary metal barricade",
|
| 19 |
+
"composition": "Medium wide shot, eye-level perspective. The pedestrian is situated in the foreground-left, walking parallel to the curb. A silver metal barrier forms a line separating the walking area from the street, and a dark sedan is parked on the right side of the frame.",
|
| 20 |
+
"constraints": [
|
| 21 |
+
"no text",
|
| 22 |
+
"no labels",
|
| 23 |
+
"no watermarks",
|
| 24 |
+
"true 3:2 composition",
|
| 25 |
+
"final canvas size 1248x832",
|
| 26 |
+
"normal human and object proportions",
|
| 27 |
+
"no squeezed perspective",
|
| 28 |
+
"no anamorphic stretching",
|
| 29 |
+
"every listed person and object must be visibly present",
|
| 30 |
+
"the foreground may contain only the listed people and objects",
|
| 31 |
+
"no extra foreground people, animals, vehicles, props, tools, products, signs, readable text, logos, or other localizable subjects absent from this JSON",
|
| 32 |
+
"the entire image must be a coherent driving scenario",
|
| 33 |
+
"the scene must include an outdoor road, street, highway, intersection, curbside, parking, or traffic environment",
|
| 34 |
+
"integrate all listed subjects as road users, vehicles, roadside objects, traffic infrastructure, or driving-context objects",
|
| 35 |
+
"do not render an office, kitchen, studio, product catalog, indoor room, or unrelated non-driving scene"
|
| 36 |
+
]
|
| 37 |
+
},
|
| 38 |
+
"people": [
|
| 39 |
+
{
|
| 40 |
+
"name": "pedestrian",
|
| 41 |
+
"source_index": 1,
|
| 42 |
+
"source_image_id": "CrowdHuman:data/data_69/273278,12fc4700013112375.jpg:person:3",
|
| 43 |
+
"source_name": "pedestrian",
|
| 44 |
+
"description": "A person wearing a dark coat and trousers, walking confidently.",
|
| 45 |
+
"role_in_scene": "Walking along the curbside near the barrier."
|
| 46 |
+
}
|
| 47 |
+
],
|
| 48 |
+
"objects": [
|
| 49 |
+
{
|
| 50 |
+
"name": "parked_dark_car",
|
| 51 |
+
"source_index": 1,
|
| 52 |
+
"source_image_id": "BDD100K:bcb356f6-520dd65c:object:9",
|
| 53 |
+
"source_name": "parked dark car",
|
| 54 |
+
"description": "A dark-colored sedan.",
|
| 55 |
+
"role_in_scene": "Parked on the street near the curb in the background right."
|
| 56 |
+
},
|
| 57 |
+
{
|
| 58 |
+
"name": "metal_barrier",
|
| 59 |
+
"source_index": 0,
|
| 60 |
+
"source_image_id": "CrowdHuman:data/data_74/284193,1da20000b642be5b.jpg:object:5",
|
| 61 |
+
"source_name": "metal barrier",
|
| 62 |
+
"description": "A silver metal barricade placed along the street.",
|
| 63 |
+
"role_in_scene": "Positioned along the curb to section off the pedestrian area from the road."
|
| 64 |
+
}
|
| 65 |
+
]
|
| 66 |
+
},
|
| 67 |
+
"expected_subjects": [
|
| 68 |
+
{
|
| 69 |
+
"name": "pedestrian",
|
| 70 |
+
"is_person": true,
|
| 71 |
+
"subject_type": "person",
|
| 72 |
+
"source_set": "people_set",
|
| 73 |
+
"source_image_id": "CrowdHuman:data/data_69/273278,12fc4700013112375.jpg:person:3",
|
| 74 |
+
"source_name": "pedestrian",
|
| 75 |
+
"source_description": "A person wearing a dark coat and trousers. Source dataset: CrowdHuman. Scene context: A bustling city street lined with trees showcasing vibrant yellow autumn foliage, with many pedestrians walking in both directions.",
|
| 76 |
+
"sub_caption": "pedestrian: A person wearing a dark coat and trousers, walking confidently.. Scene role: Walking along the curbside near the barrier.",
|
| 77 |
+
"ref_style": "white_bg_full_body_front"
|
| 78 |
+
},
|
| 79 |
+
{
|
| 80 |
+
"name": "parked_dark_car",
|
| 81 |
+
"is_person": false,
|
| 82 |
+
"subject_type": "object",
|
| 83 |
+
"source_set": "obj_set",
|
| 84 |
+
"source_image_id": "BDD100K:bcb356f6-520dd65c:object:9",
|
| 85 |
+
"source_name": "parked dark car",
|
| 86 |
+
"source_description": "A dark-colored sedan parked on the right side of the street, behind the silver car. Source dataset: BDD100K. Scene context: A large white New York City bus is driving down a city street on an overcast day with other cars parked and driving around it.",
|
| 87 |
+
"sub_caption": "parked dark car: A dark-colored sedan.. Scene role: Parked on the street near the curb in the background right.",
|
| 88 |
+
"ref_style": "white_bg_encyclopedia_photo"
|
| 89 |
+
},
|
| 90 |
+
{
|
| 91 |
+
"name": "metal_barrier",
|
| 92 |
+
"is_person": false,
|
| 93 |
+
"subject_type": "object",
|
| 94 |
+
"source_set": "obj_set",
|
| 95 |
+
"source_image_id": "CrowdHuman:data/data_74/284193,1da20000b642be5b.jpg:object:5",
|
| 96 |
+
"source_name": "metal barrier",
|
| 97 |
+
"source_description": "silver metal barricade placed near the entrance Source dataset: CrowdHuman. Scene context: People are gathered outside the entrance of a stone building with arched doorways and large windows.",
|
| 98 |
+
"sub_caption": "metal barrier: A silver metal barricade placed along the street.. Scene role: Positioned along the curb to section off the pedestrian area from the road.",
|
| 99 |
+
"ref_style": "white_bg_encyclopedia_photo"
|
| 100 |
+
}
|
| 101 |
+
],
|
| 102 |
+
"vocab_task_path": "sample_000001/vocab_task.json",
|
| 103 |
+
"model_ids": {
|
| 104 |
+
"chat_model": "gcp/google/gemini-3.1-pro-preview",
|
| 105 |
+
"image_model": "gcp/google/gemini-3-pro-image-preview"
|
| 106 |
+
}
|
| 107 |
+
}
|
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000001/references.json
ADDED
|
@@ -0,0 +1,101 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"references": [
|
| 3 |
+
{
|
| 4 |
+
"name": "pedestrian",
|
| 5 |
+
"ref_image": "references/ref_pedestrian.png",
|
| 6 |
+
"raw_ref_image": "references/raw_ref_pedestrian_attempt_01.png",
|
| 7 |
+
"diversify_input": "crops/diversify_input_pedestrian.png",
|
| 8 |
+
"sam_white_bg": {
|
| 9 |
+
"input": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/driving/samples/sample_000001/references/raw_ref_pedestrian_attempt_01.png",
|
| 10 |
+
"output": "references/ref_pedestrian.png",
|
| 11 |
+
"mask": "references/sam_mask_pedestrian.png",
|
| 12 |
+
"sam_checkpoint": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/checkpoints/sam/sam_vit_b_01ec64.pth",
|
| 13 |
+
"sam_model_type": "vit_b",
|
| 14 |
+
"sam_device": "auto",
|
| 15 |
+
"sam_working_size": [
|
| 16 |
+
640,
|
| 17 |
+
640
|
| 18 |
+
],
|
| 19 |
+
"sam_max_side": 640,
|
| 20 |
+
"sam_downscale": 0.625,
|
| 21 |
+
"prompt_box_xyxy": [
|
| 22 |
+
330.0,
|
| 23 |
+
42.0,
|
| 24 |
+
698.0,
|
| 25 |
+
1007.0
|
| 26 |
+
],
|
| 27 |
+
"mask_score": 3.413244,
|
| 28 |
+
"mask_area_ratio": 0.159381,
|
| 29 |
+
"elapsed_seconds": 33.2771
|
| 30 |
+
},
|
| 31 |
+
"reference_verify": "references/reference_verify_pedestrian.json",
|
| 32 |
+
"reference_verify_passed": true,
|
| 33 |
+
"reference_attempts": 1
|
| 34 |
+
},
|
| 35 |
+
{
|
| 36 |
+
"name": "parked_dark_car",
|
| 37 |
+
"ref_image": "references/ref_parked_dark_car.png",
|
| 38 |
+
"raw_ref_image": "references/raw_ref_parked_dark_car_attempt_01.png",
|
| 39 |
+
"diversify_input": "crops/diversify_input_parked_dark_car.png",
|
| 40 |
+
"sam_white_bg": {
|
| 41 |
+
"input": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/driving/samples/sample_000001/references/raw_ref_parked_dark_car_attempt_01.png",
|
| 42 |
+
"output": "references/ref_parked_dark_car.png",
|
| 43 |
+
"mask": "references/sam_mask_parked_dark_car.png",
|
| 44 |
+
"sam_checkpoint": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/checkpoints/sam/sam_vit_b_01ec64.pth",
|
| 45 |
+
"sam_model_type": "vit_b",
|
| 46 |
+
"sam_device": "auto",
|
| 47 |
+
"sam_working_size": [
|
| 48 |
+
640,
|
| 49 |
+
640
|
| 50 |
+
],
|
| 51 |
+
"sam_max_side": 640,
|
| 52 |
+
"sam_downscale": 0.625,
|
| 53 |
+
"prompt_box_xyxy": [
|
| 54 |
+
47.0,
|
| 55 |
+
315.0,
|
| 56 |
+
976.0,
|
| 57 |
+
694.0
|
| 58 |
+
],
|
| 59 |
+
"mask_score": 3.4345,
|
| 60 |
+
"mask_area_ratio": 0.180014,
|
| 61 |
+
"elapsed_seconds": 7.1991
|
| 62 |
+
},
|
| 63 |
+
"reference_verify": "references/reference_verify_parked_dark_car.json",
|
| 64 |
+
"reference_verify_passed": true,
|
| 65 |
+
"reference_attempts": 1
|
| 66 |
+
},
|
| 67 |
+
{
|
| 68 |
+
"name": "metal_barrier",
|
| 69 |
+
"ref_image": "references/ref_metal_barrier.png",
|
| 70 |
+
"raw_ref_image": "references/raw_ref_metal_barrier_attempt_01.png",
|
| 71 |
+
"diversify_input": "crops/diversify_input_metal_barrier.png",
|
| 72 |
+
"sam_white_bg": {
|
| 73 |
+
"input": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/driving/samples/sample_000001/references/raw_ref_metal_barrier_attempt_01.png",
|
| 74 |
+
"output": "references/ref_metal_barrier.png",
|
| 75 |
+
"mask": "references/sam_mask_metal_barrier.png",
|
| 76 |
+
"sam_checkpoint": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/checkpoints/sam/sam_vit_b_01ec64.pth",
|
| 77 |
+
"sam_model_type": "vit_b",
|
| 78 |
+
"sam_device": "auto",
|
| 79 |
+
"sam_working_size": [
|
| 80 |
+
640,
|
| 81 |
+
640
|
| 82 |
+
],
|
| 83 |
+
"sam_max_side": 640,
|
| 84 |
+
"sam_downscale": 0.625,
|
| 85 |
+
"prompt_box_xyxy": [
|
| 86 |
+
2.0,
|
| 87 |
+
107.0,
|
| 88 |
+
1009.0,
|
| 89 |
+
986.0
|
| 90 |
+
],
|
| 91 |
+
"mask_score": 1.555076,
|
| 92 |
+
"mask_area_ratio": 0.845579,
|
| 93 |
+
"elapsed_seconds": 7.2854
|
| 94 |
+
},
|
| 95 |
+
"reference_verify": "references/reference_verify_metal_barrier.json",
|
| 96 |
+
"reference_verify_passed": true,
|
| 97 |
+
"reference_attempts": 1
|
| 98 |
+
}
|
| 99 |
+
],
|
| 100 |
+
"reference_errors": {}
|
| 101 |
+
}
|
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000001/references/ref_metal_barrier.png
ADDED
|
Git LFS Details
|
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000001/references/ref_parked_dark_car.png
ADDED
|
Git LFS Details
|
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000001/references/ref_pedestrian.png
ADDED
|
Git LFS Details
|
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000001/references/reference_verify_metal_barrier.json
ADDED
|
@@ -0,0 +1,46 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"name": "metal_barrier",
|
| 3 |
+
"passed": true,
|
| 4 |
+
"accepted_attempt": 1,
|
| 5 |
+
"attempts": [
|
| 6 |
+
{
|
| 7 |
+
"attempt": 1,
|
| 8 |
+
"raw_ref_image": "references/raw_ref_metal_barrier_attempt_01.png",
|
| 9 |
+
"candidate_ref_image": "references/candidate_ref_metal_barrier_attempt_01.png",
|
| 10 |
+
"candidate_sam_mask": "references/candidate_sam_mask_metal_barrier_attempt_01.png",
|
| 11 |
+
"sam_white_bg": {
|
| 12 |
+
"input": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/driving/samples/sample_000001/references/raw_ref_metal_barrier_attempt_01.png",
|
| 13 |
+
"output": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/driving/samples/sample_000001/references/candidate_ref_metal_barrier_attempt_01.png",
|
| 14 |
+
"mask": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/driving/samples/sample_000001/references/candidate_sam_mask_metal_barrier_attempt_01.png",
|
| 15 |
+
"sam_checkpoint": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/checkpoints/sam/sam_vit_b_01ec64.pth",
|
| 16 |
+
"sam_model_type": "vit_b",
|
| 17 |
+
"sam_device": "auto",
|
| 18 |
+
"sam_working_size": [
|
| 19 |
+
640,
|
| 20 |
+
640
|
| 21 |
+
],
|
| 22 |
+
"sam_max_side": 640,
|
| 23 |
+
"sam_downscale": 0.625,
|
| 24 |
+
"prompt_box_xyxy": [
|
| 25 |
+
2.0,
|
| 26 |
+
107.0,
|
| 27 |
+
1009.0,
|
| 28 |
+
986.0
|
| 29 |
+
],
|
| 30 |
+
"mask_score": 1.555076,
|
| 31 |
+
"mask_area_ratio": 0.845579,
|
| 32 |
+
"elapsed_seconds": 7.2854
|
| 33 |
+
},
|
| 34 |
+
"verify": {
|
| 35 |
+
"passed": true,
|
| 36 |
+
"subject_visible": true,
|
| 37 |
+
"complete_subject": true,
|
| 38 |
+
"cropped_or_truncated": false,
|
| 39 |
+
"single_main_subject": true,
|
| 40 |
+
"white_background": true,
|
| 41 |
+
"failure_reasons": [],
|
| 42 |
+
"notes": "The metal barrier is fully visible and isolated against a white background."
|
| 43 |
+
}
|
| 44 |
+
}
|
| 45 |
+
]
|
| 46 |
+
}
|
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000001/references/reference_verify_parked_dark_car.json
ADDED
|
@@ -0,0 +1,46 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"name": "parked_dark_car",
|
| 3 |
+
"passed": true,
|
| 4 |
+
"accepted_attempt": 1,
|
| 5 |
+
"attempts": [
|
| 6 |
+
{
|
| 7 |
+
"attempt": 1,
|
| 8 |
+
"raw_ref_image": "references/raw_ref_parked_dark_car_attempt_01.png",
|
| 9 |
+
"candidate_ref_image": "references/candidate_ref_parked_dark_car_attempt_01.png",
|
| 10 |
+
"candidate_sam_mask": "references/candidate_sam_mask_parked_dark_car_attempt_01.png",
|
| 11 |
+
"sam_white_bg": {
|
| 12 |
+
"input": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/driving/samples/sample_000001/references/raw_ref_parked_dark_car_attempt_01.png",
|
| 13 |
+
"output": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/driving/samples/sample_000001/references/candidate_ref_parked_dark_car_attempt_01.png",
|
| 14 |
+
"mask": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/driving/samples/sample_000001/references/candidate_sam_mask_parked_dark_car_attempt_01.png",
|
| 15 |
+
"sam_checkpoint": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/checkpoints/sam/sam_vit_b_01ec64.pth",
|
| 16 |
+
"sam_model_type": "vit_b",
|
| 17 |
+
"sam_device": "auto",
|
| 18 |
+
"sam_working_size": [
|
| 19 |
+
640,
|
| 20 |
+
640
|
| 21 |
+
],
|
| 22 |
+
"sam_max_side": 640,
|
| 23 |
+
"sam_downscale": 0.625,
|
| 24 |
+
"prompt_box_xyxy": [
|
| 25 |
+
47.0,
|
| 26 |
+
315.0,
|
| 27 |
+
976.0,
|
| 28 |
+
694.0
|
| 29 |
+
],
|
| 30 |
+
"mask_score": 3.4345,
|
| 31 |
+
"mask_area_ratio": 0.180014,
|
| 32 |
+
"elapsed_seconds": 7.1991
|
| 33 |
+
},
|
| 34 |
+
"verify": {
|
| 35 |
+
"passed": true,
|
| 36 |
+
"subject_visible": true,
|
| 37 |
+
"complete_subject": true,
|
| 38 |
+
"cropped_or_truncated": false,
|
| 39 |
+
"single_main_subject": true,
|
| 40 |
+
"white_background": true,
|
| 41 |
+
"failure_reasons": [],
|
| 42 |
+
"notes": "The image shows a complete dark-colored sedan isolated on a white background, which perfectly fits the subject description."
|
| 43 |
+
}
|
| 44 |
+
}
|
| 45 |
+
]
|
| 46 |
+
}
|
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000001/references/reference_verify_pedestrian.json
ADDED
|
@@ -0,0 +1,46 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"name": "pedestrian",
|
| 3 |
+
"passed": true,
|
| 4 |
+
"accepted_attempt": 1,
|
| 5 |
+
"attempts": [
|
| 6 |
+
{
|
| 7 |
+
"attempt": 1,
|
| 8 |
+
"raw_ref_image": "references/raw_ref_pedestrian_attempt_01.png",
|
| 9 |
+
"candidate_ref_image": "references/candidate_ref_pedestrian_attempt_01.png",
|
| 10 |
+
"candidate_sam_mask": "references/candidate_sam_mask_pedestrian_attempt_01.png",
|
| 11 |
+
"sam_white_bg": {
|
| 12 |
+
"input": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/driving/samples/sample_000001/references/raw_ref_pedestrian_attempt_01.png",
|
| 13 |
+
"output": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/driving/samples/sample_000001/references/candidate_ref_pedestrian_attempt_01.png",
|
| 14 |
+
"mask": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/driving/samples/sample_000001/references/candidate_sam_mask_pedestrian_attempt_01.png",
|
| 15 |
+
"sam_checkpoint": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/checkpoints/sam/sam_vit_b_01ec64.pth",
|
| 16 |
+
"sam_model_type": "vit_b",
|
| 17 |
+
"sam_device": "auto",
|
| 18 |
+
"sam_working_size": [
|
| 19 |
+
640,
|
| 20 |
+
640
|
| 21 |
+
],
|
| 22 |
+
"sam_max_side": 640,
|
| 23 |
+
"sam_downscale": 0.625,
|
| 24 |
+
"prompt_box_xyxy": [
|
| 25 |
+
330.0,
|
| 26 |
+
42.0,
|
| 27 |
+
698.0,
|
| 28 |
+
1007.0
|
| 29 |
+
],
|
| 30 |
+
"mask_score": 3.413244,
|
| 31 |
+
"mask_area_ratio": 0.159381,
|
| 32 |
+
"elapsed_seconds": 33.2771
|
| 33 |
+
},
|
| 34 |
+
"verify": {
|
| 35 |
+
"passed": true,
|
| 36 |
+
"subject_visible": true,
|
| 37 |
+
"complete_subject": true,
|
| 38 |
+
"cropped_or_truncated": false,
|
| 39 |
+
"single_main_subject": true,
|
| 40 |
+
"white_background": true,
|
| 41 |
+
"failure_reasons": [],
|
| 42 |
+
"notes": "The image shows a full body of a person on a white background with no cropping. It is a suitable reference."
|
| 43 |
+
}
|
| 44 |
+
}
|
| 45 |
+
]
|
| 46 |
+
}
|
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000001/references/sam_mask_metal_barrier.png
ADDED
|
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000001/references/sam_mask_parked_dark_car.png
ADDED
|
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000001/references/sam_mask_pedestrian.png
ADDED
|
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000001/row.json
ADDED
|
@@ -0,0 +1,164 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"sample_id": "sample_000001",
|
| 3 |
+
"target_total": 3,
|
| 4 |
+
"target_people": 1,
|
| 5 |
+
"target_objects": 2,
|
| 6 |
+
"canvas_size": [
|
| 7 |
+
1248,
|
| 8 |
+
832
|
| 9 |
+
],
|
| 10 |
+
"canvas_aspect_ratio": "3:2",
|
| 11 |
+
"main_image": "main_image.png",
|
| 12 |
+
"bbox_overlay": "bbox_overlay.png",
|
| 13 |
+
"plan": "plan.json",
|
| 14 |
+
"detections": "detections.json",
|
| 15 |
+
"vocab_task": "vocab_task.json",
|
| 16 |
+
"n_planned": 3,
|
| 17 |
+
"n_detected": 3,
|
| 18 |
+
"n_subjects": 3,
|
| 19 |
+
"subjects": [
|
| 20 |
+
{
|
| 21 |
+
"name": "pedestrian",
|
| 22 |
+
"is_person": true,
|
| 23 |
+
"subject_type": "person",
|
| 24 |
+
"source_set": "people_set",
|
| 25 |
+
"source_image_id": "CrowdHuman:data/data_69/273278,12fc4700013112375.jpg:person:3",
|
| 26 |
+
"source_name": "pedestrian",
|
| 27 |
+
"source_description": "A person wearing a dark coat and trousers. Source dataset: CrowdHuman. Scene context: A bustling city street lined with trees showcasing vibrant yellow autumn foliage, with many pedestrians walking in both directions.",
|
| 28 |
+
"sub_caption": "pedestrian: A person wearing a dark coat and trousers, walking confidently.. Scene role: Walking along the curbside near the barrier.",
|
| 29 |
+
"measured_bbox": [
|
| 30 |
+
0.1528,
|
| 31 |
+
0.301,
|
| 32 |
+
0.2511,
|
| 33 |
+
0.7071
|
| 34 |
+
],
|
| 35 |
+
"detection_confidence": 0.98,
|
| 36 |
+
"ref_style": "white_bg_full_body_front",
|
| 37 |
+
"ref_image": "references/ref_pedestrian.png",
|
| 38 |
+
"raw_ref_image": "references/raw_ref_pedestrian_attempt_01.png",
|
| 39 |
+
"reference_verify": "references/reference_verify_pedestrian.json",
|
| 40 |
+
"reference_verify_passed": true,
|
| 41 |
+
"reference_attempts": 1,
|
| 42 |
+
"sam_white_bg": {
|
| 43 |
+
"input": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/driving/samples/sample_000001/references/raw_ref_pedestrian_attempt_01.png",
|
| 44 |
+
"output": "references/ref_pedestrian.png",
|
| 45 |
+
"mask": "references/sam_mask_pedestrian.png",
|
| 46 |
+
"sam_checkpoint": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/checkpoints/sam/sam_vit_b_01ec64.pth",
|
| 47 |
+
"sam_model_type": "vit_b",
|
| 48 |
+
"sam_device": "auto",
|
| 49 |
+
"sam_working_size": [
|
| 50 |
+
640,
|
| 51 |
+
640
|
| 52 |
+
],
|
| 53 |
+
"sam_max_side": 640,
|
| 54 |
+
"sam_downscale": 0.625,
|
| 55 |
+
"prompt_box_xyxy": [
|
| 56 |
+
330.0,
|
| 57 |
+
42.0,
|
| 58 |
+
698.0,
|
| 59 |
+
1007.0
|
| 60 |
+
],
|
| 61 |
+
"mask_score": 3.413244,
|
| 62 |
+
"mask_area_ratio": 0.159381,
|
| 63 |
+
"elapsed_seconds": 33.2771
|
| 64 |
+
}
|
| 65 |
+
},
|
| 66 |
+
{
|
| 67 |
+
"name": "parked_dark_car",
|
| 68 |
+
"is_person": false,
|
| 69 |
+
"subject_type": "object",
|
| 70 |
+
"source_set": "obj_set",
|
| 71 |
+
"source_image_id": "BDD100K:bcb356f6-520dd65c:object:9",
|
| 72 |
+
"source_name": "parked dark car",
|
| 73 |
+
"source_description": "A dark-colored sedan parked on the right side of the street, behind the silver car. Source dataset: BDD100K. Scene context: A large white New York City bus is driving down a city street on an overcast day with other cars parked and driving around it.",
|
| 74 |
+
"sub_caption": "parked dark car: A dark-colored sedan.. Scene role: Parked on the street near the curb in the background right.",
|
| 75 |
+
"measured_bbox": [
|
| 76 |
+
0.5163,
|
| 77 |
+
0.3897,
|
| 78 |
+
0.9968,
|
| 79 |
+
0.9244
|
| 80 |
+
],
|
| 81 |
+
"detection_confidence": 0.98,
|
| 82 |
+
"ref_style": "white_bg_encyclopedia_photo",
|
| 83 |
+
"ref_image": "references/ref_parked_dark_car.png",
|
| 84 |
+
"raw_ref_image": "references/raw_ref_parked_dark_car_attempt_01.png",
|
| 85 |
+
"reference_verify": "references/reference_verify_parked_dark_car.json",
|
| 86 |
+
"reference_verify_passed": true,
|
| 87 |
+
"reference_attempts": 1,
|
| 88 |
+
"sam_white_bg": {
|
| 89 |
+
"input": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/driving/samples/sample_000001/references/raw_ref_parked_dark_car_attempt_01.png",
|
| 90 |
+
"output": "references/ref_parked_dark_car.png",
|
| 91 |
+
"mask": "references/sam_mask_parked_dark_car.png",
|
| 92 |
+
"sam_checkpoint": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/checkpoints/sam/sam_vit_b_01ec64.pth",
|
| 93 |
+
"sam_model_type": "vit_b",
|
| 94 |
+
"sam_device": "auto",
|
| 95 |
+
"sam_working_size": [
|
| 96 |
+
640,
|
| 97 |
+
640
|
| 98 |
+
],
|
| 99 |
+
"sam_max_side": 640,
|
| 100 |
+
"sam_downscale": 0.625,
|
| 101 |
+
"prompt_box_xyxy": [
|
| 102 |
+
47.0,
|
| 103 |
+
315.0,
|
| 104 |
+
976.0,
|
| 105 |
+
694.0
|
| 106 |
+
],
|
| 107 |
+
"mask_score": 3.4345,
|
| 108 |
+
"mask_area_ratio": 0.180014,
|
| 109 |
+
"elapsed_seconds": 7.1991
|
| 110 |
+
}
|
| 111 |
+
},
|
| 112 |
+
{
|
| 113 |
+
"name": "metal_barrier",
|
| 114 |
+
"is_person": false,
|
| 115 |
+
"subject_type": "object",
|
| 116 |
+
"source_set": "obj_set",
|
| 117 |
+
"source_image_id": "CrowdHuman:data/data_74/284193,1da20000b642be5b.jpg:object:5",
|
| 118 |
+
"source_name": "metal barrier",
|
| 119 |
+
"source_description": "silver metal barricade placed near the entrance Source dataset: CrowdHuman. Scene context: People are gathered outside the entrance of a stone building with arched doorways and large windows.",
|
| 120 |
+
"sub_caption": "metal barrier: A silver metal barricade placed along the street.. Scene role: Positioned along the curb to section off the pedestrian area from the road.",
|
| 121 |
+
"measured_bbox": [
|
| 122 |
+
0.3454,
|
| 123 |
+
0.4302,
|
| 124 |
+
0.5465,
|
| 125 |
+
0.8402
|
| 126 |
+
],
|
| 127 |
+
"detection_confidence": 0.98,
|
| 128 |
+
"ref_style": "white_bg_encyclopedia_photo",
|
| 129 |
+
"ref_image": "references/ref_metal_barrier.png",
|
| 130 |
+
"raw_ref_image": "references/raw_ref_metal_barrier_attempt_01.png",
|
| 131 |
+
"reference_verify": "references/reference_verify_metal_barrier.json",
|
| 132 |
+
"reference_verify_passed": true,
|
| 133 |
+
"reference_attempts": 1,
|
| 134 |
+
"sam_white_bg": {
|
| 135 |
+
"input": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/driving/samples/sample_000001/references/raw_ref_metal_barrier_attempt_01.png",
|
| 136 |
+
"output": "references/ref_metal_barrier.png",
|
| 137 |
+
"mask": "references/sam_mask_metal_barrier.png",
|
| 138 |
+
"sam_checkpoint": "/lustre/fs12/portfolios/nvr/projects/nvr_elm_llm/users/hcai/dataset/tmp/lmlu/codex_gen_data/checkpoints/sam/sam_vit_b_01ec64.pth",
|
| 139 |
+
"sam_model_type": "vit_b",
|
| 140 |
+
"sam_device": "auto",
|
| 141 |
+
"sam_working_size": [
|
| 142 |
+
640,
|
| 143 |
+
640
|
| 144 |
+
],
|
| 145 |
+
"sam_max_side": 640,
|
| 146 |
+
"sam_downscale": 0.625,
|
| 147 |
+
"prompt_box_xyxy": [
|
| 148 |
+
2.0,
|
| 149 |
+
107.0,
|
| 150 |
+
1009.0,
|
| 151 |
+
986.0
|
| 152 |
+
],
|
| 153 |
+
"mask_score": 1.555076,
|
| 154 |
+
"mask_area_ratio": 0.845579,
|
| 155 |
+
"elapsed_seconds": 7.2854
|
| 156 |
+
}
|
| 157 |
+
}
|
| 158 |
+
],
|
| 159 |
+
"not_emitted": [],
|
| 160 |
+
"model_ids": {
|
| 161 |
+
"chat_model": "gcp/google/gemini-3.1-pro-preview",
|
| 162 |
+
"image_model": "gcp/google/gemini-3-pro-image-preview"
|
| 163 |
+
}
|
| 164 |
+
}
|
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000001/vocab_task.json
ADDED
|
@@ -0,0 +1,56 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"task_id": "sample_000001",
|
| 3 |
+
"sample_id": "sample_000001",
|
| 4 |
+
"sample_index": 1,
|
| 5 |
+
"target_total": 3,
|
| 6 |
+
"target_people": 1,
|
| 7 |
+
"target_objects": 2,
|
| 8 |
+
"people_candidates": [
|
| 9 |
+
{
|
| 10 |
+
"candidate_index": 0,
|
| 11 |
+
"source_offset": 13962,
|
| 12 |
+
"image_id": "CrowdHuman:data/data_13/282555,65d1d00050480dce.jpg:person:2",
|
| 13 |
+
"name": "toddler",
|
| 14 |
+
"description": "A young child with short brown hair, wearing a light blue patterned sweater, being carried by the woman in blue. Source dataset: CrowdHuman. Scene context: Two women, one carrying a toddler and the other walking hand-in-hand with a young girl, are crossing a street with parked cars in the background."
|
| 15 |
+
},
|
| 16 |
+
{
|
| 17 |
+
"candidate_index": 1,
|
| 18 |
+
"source_offset": 171812,
|
| 19 |
+
"image_id": "CrowdHuman:data/data_69/273278,12fc4700013112375.jpg:person:3",
|
| 20 |
+
"name": "pedestrian",
|
| 21 |
+
"description": "A person wearing a dark coat and trousers. Source dataset: CrowdHuman. Scene context: A bustling city street lined with trees showcasing vibrant yellow autumn foliage, with many pedestrians walking in both directions."
|
| 22 |
+
}
|
| 23 |
+
],
|
| 24 |
+
"object_candidates": [
|
| 25 |
+
{
|
| 26 |
+
"candidate_index": 0,
|
| 27 |
+
"source_offset": 129279,
|
| 28 |
+
"image_id": "CrowdHuman:data/data_74/284193,1da20000b642be5b.jpg:object:5",
|
| 29 |
+
"name": "metal barrier",
|
| 30 |
+
"description": "silver metal barricade placed near the entrance Source dataset: CrowdHuman. Scene context: People are gathered outside the entrance of a stone building with arched doorways and large windows."
|
| 31 |
+
},
|
| 32 |
+
{
|
| 33 |
+
"candidate_index": 1,
|
| 34 |
+
"source_offset": 182609,
|
| 35 |
+
"image_id": "BDD100K:bcb356f6-520dd65c:object:9",
|
| 36 |
+
"name": "parked dark car",
|
| 37 |
+
"description": "A dark-colored sedan parked on the right side of the street, behind the silver car. Source dataset: BDD100K. Scene context: A large white New York City bus is driving down a city street on an overcast day with other cars parked and driving around it."
|
| 38 |
+
},
|
| 39 |
+
{
|
| 40 |
+
"candidate_index": 2,
|
| 41 |
+
"source_offset": 92980,
|
| 42 |
+
"image_id": "CrowdHuman:data/data_56/273278,97d7f00040d24761.jpg:object:4",
|
| 43 |
+
"name": "paved path",
|
| 44 |
+
"description": "A textured paved walkway the group is walking on. Source dataset: CrowdHuman. Scene context: A group of five adults walking together and conversing in a park-like outdoor setting."
|
| 45 |
+
},
|
| 46 |
+
{
|
| 47 |
+
"candidate_index": 3,
|
| 48 |
+
"source_offset": 83796,
|
| 49 |
+
"image_id": "CrowdHuman:data/data_51/273278,23a1a000c26da45e.jpg:object:0",
|
| 50 |
+
"name": "plastic bag",
|
| 51 |
+
"description": "White plastic shopping bag held by the seated woman. Source dataset: CrowdHuman. Scene context: People are standing and sitting inside a brightly lit train or subway car."
|
| 52 |
+
}
|
| 53 |
+
],
|
| 54 |
+
"rng_seed": 1782032722,
|
| 55 |
+
"created_at": 1782292413.1601257
|
| 56 |
+
}
|
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/bbox_overlay.png
ADDED
|
Git LFS Details
|
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/compose_prompt.txt
ADDED
|
@@ -0,0 +1,159 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Render the following JSON scene specification as a photorealistic 1152x864 image using a true 4:3 canvas. The rendered image must be a coherent driving scenario with an outdoor road, street, highway, intersection, curbside, parking, or traffic environment; do not render a non-driving indoor scene or product-catalog scene. Every listed person and object must appear visibly in the image. Keep normal proportions and the requested aspect ratio. The foreground must contain only subjects explicitly listed in the JSON scene specification. Do not add any unlisted foreground people, animals, vehicles, props, tools, products, signs, readable text, logos, or other localizable subjects. Background context may include non-localizable scenery only when it does not introduce a distinct foreground subject. No text, no labels, no logos, no watermarks.
|
| 2 |
+
JSON scene specification:
|
| 3 |
+
{
|
| 4 |
+
"format": "structured_json_prompt",
|
| 5 |
+
"canvas": {
|
| 6 |
+
"size": [
|
| 7 |
+
1152,
|
| 8 |
+
864
|
| 9 |
+
],
|
| 10 |
+
"aspect_ratio": "4:3",
|
| 11 |
+
"style": "photorealistic"
|
| 12 |
+
},
|
| 13 |
+
"scene": {
|
| 14 |
+
"setting": "city street at twilight viewed from inside a moving vehicle",
|
| 15 |
+
"activity": "driving down a two-way street with parked and moving cars, while pedestrians walk on the adjacent sidewalk",
|
| 16 |
+
"composition": "first-person dashboard perspective, looking down the road, clear depth of field receding to the horizon, road centralized, dashboard anchors the bottom frame",
|
| 17 |
+
"constraints": [
|
| 18 |
+
"no text",
|
| 19 |
+
"no labels",
|
| 20 |
+
"no watermarks",
|
| 21 |
+
"true 4:3 composition",
|
| 22 |
+
"final canvas size 1152x864",
|
| 23 |
+
"normal human and object proportions",
|
| 24 |
+
"no squeezed perspective",
|
| 25 |
+
"no anamorphic stretching",
|
| 26 |
+
"every listed person and object must be visibly present",
|
| 27 |
+
"the foreground may contain only the listed people and objects",
|
| 28 |
+
"no extra foreground people, animals, vehicles, props, tools, products, signs, readable text, logos, or other localizable subjects absent from this JSON",
|
| 29 |
+
"the entire image must be a coherent driving scenario",
|
| 30 |
+
"the scene must include an outdoor road, street, highway, intersection, curbside, parking, or traffic environment",
|
| 31 |
+
"integrate all listed subjects as road users, vehicles, roadside objects, traffic infrastructure, or driving-context objects",
|
| 32 |
+
"do not render an office, kitchen, studio, product catalog, indoor room, or unrelated non-driving scene"
|
| 33 |
+
]
|
| 34 |
+
},
|
| 35 |
+
"people": [
|
| 36 |
+
{
|
| 37 |
+
"name": "pedestrian_walking",
|
| 38 |
+
"source_index": 0,
|
| 39 |
+
"source_image_id": "BDD100K:c5d864fa-b0b2380b:person:2",
|
| 40 |
+
"source_name": "pedestrian",
|
| 41 |
+
"description": "Person walking away from the camera on the right sidewalk, wearing dark clothing.",
|
| 42 |
+
"role_in_scene": "walking along the sidewalk on the right side of the street"
|
| 43 |
+
},
|
| 44 |
+
{
|
| 45 |
+
"name": "shop_pedestrian",
|
| 46 |
+
"source_index": 2,
|
| 47 |
+
"source_image_id": "BDD100K:b714a088-861a043b:person:2",
|
| 48 |
+
"source_name": "pedestrian",
|
| 49 |
+
"description": "Person standing near a shop entrance on the right, partially obscured.",
|
| 50 |
+
"role_in_scene": "standing on the sidewalk near the storefronts on the right"
|
| 51 |
+
}
|
| 52 |
+
],
|
| 53 |
+
"objects": [
|
| 54 |
+
{
|
| 55 |
+
"name": "city_buildings",
|
| 56 |
+
"source_index": 1,
|
| 57 |
+
"source_image_id": "CrowdHuman:data/data_9/283554,31eeb000e9237b31.jpg:object:9",
|
| 58 |
+
"source_name": "building",
|
| 59 |
+
"description": "Various city buildings of different heights forming the skyline and lining the street.",
|
| 60 |
+
"role_in_scene": "framing the street and forming the background skyline"
|
| 61 |
+
},
|
| 62 |
+
{
|
| 63 |
+
"name": "street_signs",
|
| 64 |
+
"source_index": 6,
|
| 65 |
+
"source_image_id": "BDD100K:b5ab0e46-8eab4733:object:8",
|
| 66 |
+
"source_name": "street signs",
|
| 67 |
+
"description": "Various blank street signs attached to a pole on the right side of the street.",
|
| 68 |
+
"role_in_scene": "mounted on a pole next to the right sidewalk"
|
| 69 |
+
},
|
| 70 |
+
{
|
| 71 |
+
"name": "storefront_sign",
|
| 72 |
+
"source_index": 7,
|
| 73 |
+
"source_image_id": "CrowdHuman:data/data_4/273275,46a6f0005d04fc24.jpg:object:7",
|
| 74 |
+
"source_name": "storefront sign",
|
| 75 |
+
"description": "A dark hanging sign framework attached to a building on the right, devoid of readable text.",
|
| 76 |
+
"role_in_scene": "hanging above the shop entrance on the right side of the road"
|
| 77 |
+
},
|
| 78 |
+
{
|
| 79 |
+
"name": "parked_suv_right",
|
| 80 |
+
"source_index": 11,
|
| 81 |
+
"source_image_id": "BDD100K:c54441e6-400c221e:object:4",
|
| 82 |
+
"source_name": "parked SUV",
|
| 83 |
+
"description": "Dark-colored SUV parked on the right side of the road.",
|
| 84 |
+
"role_in_scene": "parked alongside the right curb"
|
| 85 |
+
},
|
| 86 |
+
{
|
| 87 |
+
"name": "parked_car_left",
|
| 88 |
+
"source_index": 12,
|
| 89 |
+
"source_image_id": "BDD100K:bb2e43e4-5e7a7129:object:6",
|
| 90 |
+
"source_name": "car",
|
| 91 |
+
"description": "A dark car parked along the left curb further ahead.",
|
| 92 |
+
"role_in_scene": "parked alongside the left curb"
|
| 93 |
+
},
|
| 94 |
+
{
|
| 95 |
+
"name": "traveling_dark_suv",
|
| 96 |
+
"source_index": 14,
|
| 97 |
+
"source_image_id": "BDD100K:c889c950-865ca5b6:object:0",
|
| 98 |
+
"source_name": "dark SUV",
|
| 99 |
+
"description": "A dark SUV traveling in the left lane, with visible red taillights reflecting the twilight.",
|
| 100 |
+
"role_in_scene": "driving in the adjacent lane"
|
| 101 |
+
},
|
| 102 |
+
{
|
| 103 |
+
"name": "street_light",
|
| 104 |
+
"source_index": 15,
|
| 105 |
+
"source_image_id": "BDD100K:c84f848e-2a5e0737:object:2",
|
| 106 |
+
"source_name": "street light",
|
| 107 |
+
"description": "Tall pole with a bright light on top, illuminating the road from the right side.",
|
| 108 |
+
"role_in_scene": "providing illumination from the right sidewalk"
|
| 109 |
+
},
|
| 110 |
+
{
|
| 111 |
+
"name": "vehicle_dashboard",
|
| 112 |
+
"source_index": 16,
|
| 113 |
+
"source_image_id": "BDD100K:b5032e1d-dad95b60:object:9",
|
| 114 |
+
"source_name": "dashboard",
|
| 115 |
+
"description": "The dark, reflective dashboard and lower windshield area of the camera vehicle in the foreground.",
|
| 116 |
+
"role_in_scene": "anchoring the bottom of the frame to establish a driver's perspective"
|
| 117 |
+
},
|
| 118 |
+
{
|
| 119 |
+
"name": "drainage_grate",
|
| 120 |
+
"source_index": 17,
|
| 121 |
+
"source_image_id": "BDD100K:b4d0e72d-3b208072:object:16",
|
| 122 |
+
"source_name": "drainage grate",
|
| 123 |
+
"description": "A metal drainage grate on the edge of the road on the right.",
|
| 124 |
+
"role_in_scene": "embedded in the road surface near the right curb"
|
| 125 |
+
},
|
| 126 |
+
{
|
| 127 |
+
"name": "white_car",
|
| 128 |
+
"source_index": 20,
|
| 129 |
+
"source_image_id": "BDD100K:b3a102ed-6ef54f5e:object:3",
|
| 130 |
+
"source_name": "white car",
|
| 131 |
+
"description": "A white car visible further down the road in the right lane.",
|
| 132 |
+
"role_in_scene": "driving ahead in the same lane"
|
| 133 |
+
},
|
| 134 |
+
{
|
| 135 |
+
"name": "yellow_lines",
|
| 136 |
+
"source_index": 22,
|
| 137 |
+
"source_image_id": "BDD100K:c417a291-7802692d:object:8",
|
| 138 |
+
"source_name": "yellow lines",
|
| 139 |
+
"description": "Double yellow painted lines separating opposite directions of traffic.",
|
| 140 |
+
"role_in_scene": "painted down the center of the road"
|
| 141 |
+
},
|
| 142 |
+
{
|
| 143 |
+
"name": "street_trees",
|
| 144 |
+
"source_index": 23,
|
| 145 |
+
"source_image_id": "BDD100K:c4891df0-24371ae1:object:3",
|
| 146 |
+
"source_name": "trees",
|
| 147 |
+
"description": "Numerous trees with dense green foliage lining both sides of the road.",
|
| 148 |
+
"role_in_scene": "growing along the sidewalks, adding greenery"
|
| 149 |
+
},
|
| 150 |
+
{
|
| 151 |
+
"name": "twilight_sky",
|
| 152 |
+
"source_index": 25,
|
| 153 |
+
"source_image_id": "BDD100K:c13c0d1f-00dfd075:object:9",
|
| 154 |
+
"source_name": "sky",
|
| 155 |
+
"description": "Clear twilight sky transitioning from bright near the horizon to dark blue at the top.",
|
| 156 |
+
"role_in_scene": "visible above the buildings and trees at the end of the road"
|
| 157 |
+
}
|
| 158 |
+
]
|
| 159 |
+
}
|
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/crops/detect_refine_city_buildings.png
ADDED
|
Git LFS Details
|
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/crops/detect_refine_drainage_grate.png
ADDED
|
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/crops/detect_refine_parked_car_left.png
ADDED
|
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/crops/detect_refine_parked_suv_right.png
ADDED
|
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/crops/detect_refine_pedestrian_walking.png
ADDED
|
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/crops/detect_refine_shop_pedestrian.png
ADDED
|
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/crops/detect_refine_storefront_sign.png
ADDED
|
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/crops/detect_refine_street_light.png
ADDED
|
Git LFS Details
|
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/crops/detect_refine_street_signs.png
ADDED
|
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/crops/detect_refine_street_trees.png
ADDED
|
Git LFS Details
|
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/crops/detect_refine_traveling_dark_suv.png
ADDED
|
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/crops/detect_refine_twilight_sky.png
ADDED
|
Git LFS Details
|
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/crops/detect_refine_vehicle_dashboard.png
ADDED
|
Git LFS Details
|
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/crops/detect_refine_white_car.png
ADDED
|
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/crops/detect_refine_yellow_lines.png
ADDED
|
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/crops/diversify_input_city_buildings.png
ADDED
|
Git LFS Details
|
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/crops/diversify_input_drainage_grate.png
ADDED
|
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/crops/diversify_input_parked_car_left.png
ADDED
|
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/crops/diversify_input_parked_suv_right.png
ADDED
|
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/crops/diversify_input_pedestrian_walking.png
ADDED
|
samples_v8/driving/BDD100K_CityPersons_CrowdHuman_samples_clean/sample_000002/crops/diversify_input_shop_pedestrian.png
ADDED
|