diff --git a/src/components/DatasetMetadataModal.tsx b/src/components/DatasetMetadataModal.tsx index 9658992..d8d21b3 100644 --- a/src/components/DatasetMetadataModal.tsx +++ b/src/components/DatasetMetadataModal.tsx @@ -101,7 +101,13 @@ export function DatasetMetadataModal({ ['Annotation format', formatValue(dataset.annotation_format)], ['Number of images', formatImageCount(dataset.num_images)], ['Size', formatBytesDecimal(dataset.zip_size_bytes)], - ] as const; + ...(dataset.augmented_num_images != null + ? ([['Augmented images', formatImageCount(dataset.augmented_num_images)]] as const) + : []), + ...(dataset.augmented_zip_size_bytes != null + ? ([['Augmented size', formatBytesDecimal(dataset.augmented_zip_size_bytes)]] as const) + : []), + ] as [string, string][]; const loader = formatLoaderInstructions(dataset); return ( diff --git a/src/lib/datasets.ts b/src/lib/datasets.ts index a542f5d..f4056ff 100644 --- a/src/lib/datasets.ts +++ b/src/lib/datasets.ts @@ -17,6 +17,7 @@ export interface Dataset { annotation_format: string | null; num_images: number | null; augmented_num_images: number | null; + augmented_zip_size_bytes: number | null; documentation: string | null; classes: string | null; stats_mean: number[] | null; @@ -129,6 +130,7 @@ function normalizeDataset(raw: unknown): Dataset | null { annotation_format: firstString(raw.annotation_format), num_images: toNumber(raw.num_images ?? raw.n_images ?? raw.image_count), augmented_num_images: augmentedNumImages, + augmented_zip_size_bytes: toNumber(raw.augmented_zip_size_bytes ?? raw.augmentedZipSizeBytes), documentation: firstString(raw.documentation, raw.docs_url, raw.doc_url, raw.url), classes: toText(raw.classes), stats_mean: toNumberArray(raw.stats_mean ?? stats?.mean), @@ -158,6 +160,7 @@ function mergeDataset(current: Dataset, incoming: Dataset): Dataset { annotation_format: current.annotation_format ?? incoming.annotation_format, num_images: current.num_images ?? incoming.num_images, augmented_num_images: current.augmented_num_images ?? incoming.augmented_num_images, + augmented_zip_size_bytes: current.augmented_zip_size_bytes ?? incoming.augmented_zip_size_bytes, documentation: current.documentation ?? incoming.documentation, classes: current.classes ?? incoming.classes, stats_mean: current.stats_mean ?? incoming.stats_mean, diff --git a/static/data/hf_datasets.json b/static/data/hf_datasets.json index 13b9232..e7ab61e 100644 --- a/static/data/hf_datasets.json +++ b/static/data/hf_datasets.json @@ -84,6 +84,89 @@ "citation": null, "parent_dataset": null, "zip_size_bytes": 246700000, + "augmented_zip_size_bytes": 6020000000, + "source": "huggingface" + }, + { + "name": "synthetic_cowpea_pod_detection", + "machine_learning_task": "object_detection", + "agricultural_task": "crop_detection", + "environment": "field", + "real_or_synthetic": "synthetic", + "crop_types": [ + "cowpea" + ], + "sensor_modality": "rgb", + "platform": "ground", + "input_data_format": "image_folder", + "annotation_format": "coco_json", + "num_images": 1440, + "augmented_num_images": 7200, + "classes": [ + "Pod" + ], + "stats_mean": null, + "stats_std": null, + "examples_image_url": null, + "license": null, + "citation": null, + "parent_dataset": null, + "zip_size_bytes": 222000000, + "augmented_zip_size_bytes": 5440000000, + "source": "huggingface" + }, + { + "name": "GEMINI_cowpea_pod_detection", + "machine_learning_task": "object_detection", + "agricultural_task": "crop_detection", + "environment": "field", + "location": "California", + "real_or_synthetic": "real", + "crop_types": [ + "cowpea" + ], + "sensor_modality": "rgb", + "platform": "ground", + "input_data_format": "image_folder", + "annotation_format": "coco_json", + "num_images": 569, + "classes": [ + "Pod" + ], + "stats_mean": null, + "stats_std": null, + "examples_image_url": null, + "license": null, + "citation": null, + "parent_dataset": null, + "zip_size_bytes": 45600000, + "source": "huggingface" + }, + { + "name": "GEMINI_cowpea_flower_detection", + "machine_learning_task": "object_detection", + "agricultural_task": "crop_detection", + "location": "California", + "environment": "field", + "real_or_synthetic": "real", + "crop_types": [ + "cowpea" + ], + "sensor_modality": "rgb", + "platform": "ground", + "input_data_format": "image_folder", + "annotation_format": "coco_json", + "num_images": 990, + "classes": [ + "Flower" + ], + "stats_mean": null, + "stats_std": null, + "examples_image_url": null, + "license": null, + "citation": null, + "parent_dataset": null, + "zip_size_bytes": 79700000, "source": "huggingface" } ] \ No newline at end of file