PyPI - megadetector - Versions diffs - 5.0.28__py3-none-any.whl → 10.0.0__py3-none-any.whl - Mend

megadetector 5.0.28__py3-none-any.whl → 10.0.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of megadetector might be problematic. Click here for more details.

Files changed (197)

megadetector/api/batch_processing/integration/digiKam/xmp_integration.py +2 -2
megadetector/api/batch_processing/integration/eMammal/test_scripts/push_annotations_to_emammal.py +1 -1
megadetector/api/batch_processing/integration/eMammal/test_scripts/select_images_for_testing.py +1 -1
megadetector/classification/aggregate_classifier_probs.py +3 -3
megadetector/classification/analyze_failed_images.py +5 -5
megadetector/classification/cache_batchapi_outputs.py +5 -5
megadetector/classification/create_classification_dataset.py +11 -12
megadetector/classification/crop_detections.py +10 -10
megadetector/classification/csv_to_json.py +8 -8
megadetector/classification/detect_and_crop.py +13 -15
megadetector/classification/efficientnet/model.py +8 -8
megadetector/classification/efficientnet/utils.py +6 -5
megadetector/classification/evaluate_model.py +7 -7
megadetector/classification/identify_mislabeled_candidates.py +6 -6
megadetector/classification/json_to_azcopy_list.py +1 -1
megadetector/classification/json_validator.py +29 -32
megadetector/classification/map_classification_categories.py +9 -9
megadetector/classification/merge_classification_detection_output.py +12 -9
megadetector/classification/prepare_classification_script.py +19 -19
megadetector/classification/prepare_classification_script_mc.py +26 -26
megadetector/classification/run_classifier.py +4 -4
megadetector/classification/save_mislabeled.py +6 -6
megadetector/classification/train_classifier.py +1 -1
megadetector/classification/train_classifier_tf.py +9 -9
megadetector/classification/train_utils.py +10 -10
megadetector/data_management/annotations/annotation_constants.py +1 -2
megadetector/data_management/camtrap_dp_to_coco.py +79 -46
megadetector/data_management/cct_json_utils.py +103 -103
megadetector/data_management/cct_to_md.py +49 -49
megadetector/data_management/cct_to_wi.py +33 -33
megadetector/data_management/coco_to_labelme.py +75 -75
megadetector/data_management/coco_to_yolo.py +210 -193
megadetector/data_management/databases/add_width_and_height_to_db.py +86 -12
megadetector/data_management/databases/combine_coco_camera_traps_files.py +40 -40
megadetector/data_management/databases/integrity_check_json_db.py +228 -200
megadetector/data_management/databases/subset_json_db.py +33 -33
megadetector/data_management/generate_crops_from_cct.py +88 -39
megadetector/data_management/get_image_sizes.py +54 -49
megadetector/data_management/labelme_to_coco.py +133 -125
megadetector/data_management/labelme_to_yolo.py +159 -73
megadetector/data_management/lila/create_lila_blank_set.py +81 -83
megadetector/data_management/lila/create_lila_test_set.py +32 -31
megadetector/data_management/lila/create_links_to_md_results_files.py +18 -18
megadetector/data_management/lila/download_lila_subset.py +21 -24
megadetector/data_management/lila/generate_lila_per_image_labels.py +365 -107
megadetector/data_management/lila/get_lila_annotation_counts.py +35 -33
megadetector/data_management/lila/get_lila_image_counts.py +22 -22
megadetector/data_management/lila/lila_common.py +73 -70
megadetector/data_management/lila/test_lila_metadata_urls.py +28 -19
megadetector/data_management/mewc_to_md.py +344 -340
megadetector/data_management/ocr_tools.py +262 -255
megadetector/data_management/read_exif.py +249 -227
megadetector/data_management/remap_coco_categories.py +90 -28
megadetector/data_management/remove_exif.py +81 -21
megadetector/data_management/rename_images.py +187 -187
megadetector/data_management/resize_coco_dataset.py +588 -120
megadetector/data_management/speciesnet_to_md.py +41 -41
megadetector/data_management/wi_download_csv_to_coco.py +55 -55
megadetector/data_management/yolo_output_to_md_output.py +248 -122
megadetector/data_management/yolo_to_coco.py +333 -191
megadetector/detection/change_detection.py +832 -0
megadetector/detection/process_video.py +340 -337
megadetector/detection/pytorch_detector.py +358 -278
megadetector/detection/run_detector.py +399 -186
megadetector/detection/run_detector_batch.py +404 -377
megadetector/detection/run_inference_with_yolov5_val.py +340 -327
megadetector/detection/run_tiled_inference.py +257 -249
megadetector/detection/tf_detector.py +24 -24
megadetector/detection/video_utils.py +332 -295
megadetector/postprocessing/add_max_conf.py +19 -11
megadetector/postprocessing/categorize_detections_by_size.py +45 -45
megadetector/postprocessing/classification_postprocessing.py +468 -433
megadetector/postprocessing/combine_batch_outputs.py +23 -23
megadetector/postprocessing/compare_batch_results.py +590 -525
megadetector/postprocessing/convert_output_format.py +106 -102
megadetector/postprocessing/create_crop_folder.py +347 -147
megadetector/postprocessing/detector_calibration.py +173 -168
megadetector/postprocessing/generate_csv_report.py +508 -499
megadetector/postprocessing/load_api_results.py +48 -27
megadetector/postprocessing/md_to_coco.py +133 -102
megadetector/postprocessing/md_to_labelme.py +107 -90
megadetector/postprocessing/md_to_wi.py +40 -40
megadetector/postprocessing/merge_detections.py +92 -114
megadetector/postprocessing/postprocess_batch_results.py +319 -301
megadetector/postprocessing/remap_detection_categories.py +91 -38
megadetector/postprocessing/render_detection_confusion_matrix.py +214 -205
megadetector/postprocessing/repeat_detection_elimination/find_repeat_detections.py +57 -57
megadetector/postprocessing/repeat_detection_elimination/remove_repeat_detections.py +27 -28
megadetector/postprocessing/repeat_detection_elimination/repeat_detections_core.py +704 -679
megadetector/postprocessing/separate_detections_into_folders.py +226 -211
megadetector/postprocessing/subset_json_detector_output.py +265 -262
megadetector/postprocessing/top_folders_to_bottom.py +45 -45
megadetector/postprocessing/validate_batch_results.py +70 -70
megadetector/taxonomy_mapping/map_lila_taxonomy_to_wi_taxonomy.py +52 -52
megadetector/taxonomy_mapping/map_new_lila_datasets.py +18 -19
megadetector/taxonomy_mapping/prepare_lila_taxonomy_release.py +54 -33
megadetector/taxonomy_mapping/preview_lila_taxonomy.py +67 -67
megadetector/taxonomy_mapping/retrieve_sample_image.py +16 -16
megadetector/taxonomy_mapping/simple_image_download.py +8 -8
megadetector/taxonomy_mapping/species_lookup.py +156 -74
megadetector/taxonomy_mapping/taxonomy_csv_checker.py +14 -14
megadetector/taxonomy_mapping/taxonomy_graph.py +10 -10
megadetector/taxonomy_mapping/validate_lila_category_mappings.py +13 -13
megadetector/utils/ct_utils.py +1049 -211
megadetector/utils/directory_listing.py +21 -77
megadetector/utils/gpu_test.py +22 -22
megadetector/utils/md_tests.py +632 -529
megadetector/utils/path_utils.py +1520 -431
megadetector/utils/process_utils.py +41 -41
megadetector/utils/split_locations_into_train_val.py +62 -62
megadetector/utils/string_utils.py +148 -27
megadetector/utils/url_utils.py +489 -176
megadetector/utils/wi_utils.py +2658 -2526
megadetector/utils/write_html_image_list.py +137 -137
megadetector/visualization/plot_utils.py +34 -30
megadetector/visualization/render_images_with_thumbnails.py +39 -74
megadetector/visualization/visualization_utils.py +487 -435
megadetector/visualization/visualize_db.py +232 -198
megadetector/visualization/visualize_detector_output.py +82 -76
{megadetector-5.0.28.dist-info → megadetector-10.0.0.dist-info}/METADATA +5 -2
megadetector-10.0.0.dist-info/RECORD +139 -0
{megadetector-5.0.28.dist-info → megadetector-10.0.0.dist-info}/WHEEL +1 -1
megadetector/api/batch_processing/api_core/__init__.py +0 -0
megadetector/api/batch_processing/api_core/batch_service/__init__.py +0 -0
megadetector/api/batch_processing/api_core/batch_service/score.py +0 -439
megadetector/api/batch_processing/api_core/server.py +0 -294
megadetector/api/batch_processing/api_core/server_api_config.py +0 -97
megadetector/api/batch_processing/api_core/server_app_config.py +0 -55
megadetector/api/batch_processing/api_core/server_batch_job_manager.py +0 -220
megadetector/api/batch_processing/api_core/server_job_status_table.py +0 -149
megadetector/api/batch_processing/api_core/server_orchestration.py +0 -360
megadetector/api/batch_processing/api_core/server_utils.py +0 -88
megadetector/api/batch_processing/api_core_support/__init__.py +0 -0
megadetector/api/batch_processing/api_core_support/aggregate_results_manually.py +0 -46
megadetector/api/batch_processing/api_support/__init__.py +0 -0
megadetector/api/batch_processing/api_support/summarize_daily_activity.py +0 -152
megadetector/api/batch_processing/data_preparation/__init__.py +0 -0
megadetector/api/synchronous/__init__.py +0 -0
megadetector/api/synchronous/api_core/animal_detection_api/__init__.py +0 -0
megadetector/api/synchronous/api_core/animal_detection_api/api_backend.py +0 -151
megadetector/api/synchronous/api_core/animal_detection_api/api_frontend.py +0 -263
megadetector/api/synchronous/api_core/animal_detection_api/config.py +0 -35
megadetector/api/synchronous/api_core/tests/__init__.py +0 -0
megadetector/api/synchronous/api_core/tests/load_test.py +0 -110
megadetector/data_management/importers/add_nacti_sizes.py +0 -52
megadetector/data_management/importers/add_timestamps_to_icct.py +0 -79
megadetector/data_management/importers/animl_results_to_md_results.py +0 -158
megadetector/data_management/importers/auckland_doc_test_to_json.py +0 -373
megadetector/data_management/importers/auckland_doc_to_json.py +0 -201
megadetector/data_management/importers/awc_to_json.py +0 -191
megadetector/data_management/importers/bellevue_to_json.py +0 -272
megadetector/data_management/importers/cacophony-thermal-importer.py +0 -793
megadetector/data_management/importers/carrizo_shrubfree_2018.py +0 -269
megadetector/data_management/importers/carrizo_trail_cam_2017.py +0 -289
megadetector/data_management/importers/cct_field_adjustments.py +0 -58
megadetector/data_management/importers/channel_islands_to_cct.py +0 -913
megadetector/data_management/importers/eMammal/copy_and_unzip_emammal.py +0 -180
megadetector/data_management/importers/eMammal/eMammal_helpers.py +0 -249
megadetector/data_management/importers/eMammal/make_eMammal_json.py +0 -223
megadetector/data_management/importers/ena24_to_json.py +0 -276
megadetector/data_management/importers/filenames_to_json.py +0 -386
megadetector/data_management/importers/helena_to_cct.py +0 -283
megadetector/data_management/importers/idaho-camera-traps.py +0 -1407
megadetector/data_management/importers/idfg_iwildcam_lila_prep.py +0 -294
megadetector/data_management/importers/import_desert_lion_conservation_camera_traps.py +0 -387
megadetector/data_management/importers/jb_csv_to_json.py +0 -150
megadetector/data_management/importers/mcgill_to_json.py +0 -250
megadetector/data_management/importers/missouri_to_json.py +0 -490
megadetector/data_management/importers/nacti_fieldname_adjustments.py +0 -79
megadetector/data_management/importers/noaa_seals_2019.py +0 -181
megadetector/data_management/importers/osu-small-animals-to-json.py +0 -364
megadetector/data_management/importers/pc_to_json.py +0 -365
megadetector/data_management/importers/plot_wni_giraffes.py +0 -123
megadetector/data_management/importers/prepare_zsl_imerit.py +0 -131
megadetector/data_management/importers/raic_csv_to_md_results.py +0 -416
megadetector/data_management/importers/rspb_to_json.py +0 -356
megadetector/data_management/importers/save_the_elephants_survey_A.py +0 -320
megadetector/data_management/importers/save_the_elephants_survey_B.py +0 -329
megadetector/data_management/importers/snapshot_safari_importer.py +0 -758
megadetector/data_management/importers/snapshot_serengeti_lila.py +0 -1067
megadetector/data_management/importers/snapshotserengeti/make_full_SS_json.py +0 -150
megadetector/data_management/importers/snapshotserengeti/make_per_season_SS_json.py +0 -153
megadetector/data_management/importers/sulross_get_exif.py +0 -65
megadetector/data_management/importers/timelapse_csv_set_to_json.py +0 -490
megadetector/data_management/importers/ubc_to_json.py +0 -399
megadetector/data_management/importers/umn_to_json.py +0 -507
megadetector/data_management/importers/wellington_to_json.py +0 -263
megadetector/data_management/importers/wi_to_json.py +0 -442
megadetector/data_management/importers/zamba_results_to_md_results.py +0 -180
megadetector/data_management/lila/add_locations_to_island_camera_traps.py +0 -101
megadetector/data_management/lila/add_locations_to_nacti.py +0 -151
megadetector/utils/azure_utils.py +0 -178
megadetector/utils/sas_blob_utils.py +0 -509
megadetector-5.0.28.dist-info/RECORD +0 -209
/megadetector/{api/batch_processing/__init__.py → __init__.py} +0 -0
{megadetector-5.0.28.dist-info → megadetector-10.0.0.dist-info}/licenses/LICENSE +0 -0
{megadetector-5.0.28.dist-info → megadetector-10.0.0.dist-info}/top_level.txt +0 -0

megadetector/classification/save_mislabeled.py CHANGED Viewed

@@ -1,4 +1,4 @@
-"""
+r"""
 save_mislabeled.py
@@ -10,7 +10,7 @@ List of known mislabeled images is stored in Azure Blob Storage.
 * blob: megadb_mislabeled/{dataset}.csv, one file per dataset
 Each file megadb_mislabeled/{dataset}.csv has two columns:
 * 'file': str, blob name
 * 'correct_class': optional str, correct dataset class
@@ -41,7 +41,7 @@ import pandas as pd
 #%% Main function
 def update_mislabeled_images(container_path: str, input_csv_path: str) -> None:
     df = pd.read_csv(input_csv_path, index_col=False)
     # error checking
@@ -62,7 +62,7 @@ def update_mislabeled_images(container_path: str, input_csv_path: str) -> None:
     df['file'] = df['blob_dirname'] + '/' + df['File']
     for ds, ds_df in df.groupby('dataset'):
         sr_path = os.path.join(container_path, 'megadb_mislabeled', f'{ds}.csv')
         if os.path.exists(sr_path):
             old_sr = pd.read_csv(sr_path, index_col='file', squeeze=True)
@@ -89,7 +89,7 @@ def update_mislabeled_images(container_path: str, input_csv_path: str) -> None:
 #%% Command-line driver
 def _parse_args() -> argparse.Namespace:
     parser = argparse.ArgumentParser(
         formatter_class=argparse.ArgumentDefaultsHelpFormatter,
         description='Merges classification results with Batch Detection API '
@@ -104,7 +104,7 @@ def _parse_args() -> argparse.Namespace:
 if __name__ == '__main__':
     args = _parse_args()
     update_mislabeled_images(container_path=args.container_path,
                              input_csv_path=args.input_csv)

megadetector/classification/train_classifier.py CHANGED Viewed

@@ -44,7 +44,7 @@ from megadetector.visualization import plot_utils
 #%% Example usage
-"""
+"""
     python train_classifier.py run_idfg /ssd/crops_sq \
         -m "efficientnet-b0" --pretrained --finetune --label-weighted \
         --epochs 50 --batch-size 512 --lr 1e-4 \

megadetector/classification/train_classifier_tf.py CHANGED Viewed

@@ -54,7 +54,7 @@ EFFICIENTNET_MODELS: Mapping[str, Mapping[str, Any]] = {
 #%% Example usage
-"""
+"""
     python train_classifier_tf.py run_idfg /ssd/crops_sq \
         -m "efficientnet-b0" --pretrained --finetune --label-weighted \
         --epochs 50 --batch-size 512 --lr 1e-4 \
@@ -97,7 +97,7 @@ def create_dataset(
     Returns: tf.data.Dataset
     """
     # images dataset
     img_ds = tf.data.Dataset.from_tensor_slices(img_files)
     img_ds = img_ds.map(lambda p: tf.io.read_file(img_base_dir + os.sep + p),
@@ -162,7 +162,7 @@ def create_dataloaders(
         datasets: dict, maps split to DataLoader
         label_names: list of str, label names in order of label id
     """
     df, label_names, split_to_locs = load_dataset_csv(
         dataset_csv_path, label_index_json_path, splits_json_path,
         multilabel=multilabel, label_weighted=label_weighted,
@@ -238,7 +238,7 @@ def build_model(model_name: str, num_classes: int, img_size: int,
     """
     Creates a model with an EfficientNet base.
     """
     class_name = EFFICIENTNET_MODELS[model_name]['cls']
     dropout = EFFICIENTNET_MODELS[model_name]['dropout']
@@ -279,7 +279,7 @@ def log_images_with_confidence(
         epoch: int
         tag: str
     """
     for label_id, heap in heap_dict.items():
         label_name = label_names[label_id]
@@ -319,7 +319,7 @@ def track_extreme_examples(tp_heaps: dict[int, list[HeapItem]],
         img_files: tf.Tensor, shape [batch_size], type tf.string
         logits: tf.Tensor, shape [batch_size, num_classes]
     """
     labels = labels.numpy().tolist()
     inputs = inputs.numpy().astype(np.uint8)
     img_files = img_files.numpy().astype(str).tolist()
@@ -480,7 +480,7 @@ def log_run(split: str, epoch: int, writer: tf.summary.SummaryWriter,
     Args:
         metrics: dict, keys already prefixed with {split}/
     """
     per_class_recall = recall_from_confusion_matrix(cm, label_names)
     metrics.update(prefix_all_keys(per_class_recall, f'{split}/label_recall/'))
@@ -518,7 +518,7 @@ def main(dataset_dir: str,
          seed: Optional[int] = None,
          logdir: str = '',
          cache_splits: Sequence[str] = ()) -> None:
     # input validation
     assert os.path.exists(dataset_dir)
     assert os.path.exists(cropped_images_dir)
@@ -597,7 +597,7 @@ def main(dataset_dir: str,
             model.base_model.trainable = True
         print('- train:')
         train_metrics, train_heaps, train_cm = run_epoch(
             model, loader=loaders['train'], weighted=label_weighted,
             loss_fn=loss_fn, weight_decay=weight_decay, optimizer=optimizer,

megadetector/classification/train_utils.py CHANGED Viewed

@@ -35,7 +35,7 @@ class HeapItem:
     """
     A wrapper over non-comparable data with a comparable priority value.
     """
     priority: Any
     data: Any = dataclasses.field(compare=False, repr=False)
@@ -53,7 +53,7 @@ def add_to_heap(h: list[Any], item: HeapItem, k: Optional[int] = None) -> None:
         item: HeapItem
         k: int, desired capacity of the heap, or None for no limit
     """
     if k is None or len(h) < k:
         heapq.heappush(h, item)
     else:
@@ -66,17 +66,17 @@ def prefix_all_keys(d: Mapping[str, Any], prefix: str) -> dict[str, Any]:
     """
     Returns a new dict where the keys are prefixed by <prefix>.
     """
     return {f'{prefix}{k}': v for k, v in d.items()}
 def fig_to_img(fig: matplotlib.figure.Figure) -> np.ndarray:
     """
     Converts a matplotlib figure to an image represented by a numpy array.
     Returns: np.ndarray, type uint8, shape [H, W, 3]
     """
     with io.BytesIO() as b:
         fig.savefig(b, transparent=False, bbox_inches='tight', pad_inches=0,
                     format='png')
@@ -103,7 +103,7 @@ def imgs_with_confidences(imgs_list: list[tuple[Any, ...]],
         fig: matplotlib.figure.Figure
         img_files: list of str
     """
     imgs, img_files, tags, titles = [], [], [], []
     for img, label_id, topk_conf, topk_preds, img_file in imgs_list:
         imgs.append(img)
@@ -140,7 +140,7 @@ def plot_img_grid(imgs: Sequence[Any], row_h: float, col_w: float,
     Returns: matplotlib.figure.Figure
     """
     # input validation
     num_images = len(imgs)
     if tags is not None:
@@ -186,7 +186,7 @@ def load_splits(splits_json_path: str) -> dict[str, set[tuple[str, str]]]:
     Returns: dict, maps split to set of (dataset, location) tuples
     """
     with open(splits_json_path, 'r') as f:
         split_to_locs_js = json.load(f)
     split_to_locs = {
@@ -235,7 +235,7 @@ def load_dataset_csv(dataset_csv_path: str,
         label_names: list of str, label names in order of label id
         split_to_locs: dict, maps split to set of (dataset, location) tuples
     """
     # read in dataset CSV and create merged (dataset, location) col
     df = pd.read_csv(dataset_csv_path, index_col=False, float_precision='high')
     df['dataset_location'] = list(zip(df['dataset'], df['location']))
@@ -315,7 +315,7 @@ def recall_from_confusion_matrix(
     Returns: dict, label_name => recall
     """
     result = {
         label_name: confusion_matrix[i, i] / (confusion_matrix[i].sum() + 1e-8)
         for i, label_name in enumerate(label_names)

megadetector/data_management/annotations/annotation_constants.py CHANGED Viewed

@@ -4,7 +4,7 @@ annotation_constants.py
 Defines default categories for MegaDetector output boxes.
-Used throughout the repo; do not change unless you are Dan or Siyu.  In fact, do not change unless
+Used throughout the repo; do not change unless you are Dan or Siyu.  In fact, do not change unless
 you are both Dan *and* Siyu.
 We use integer IDs here; this is different from the MD .json file format,
@@ -31,4 +31,3 @@ detector_bbox_category_name_to_id = {}
 for cat in detector_bbox_categories:
     detector_bbox_category_id_to_name[cat['id']] = cat['name']
     detector_bbox_category_name_to_id[cat['name']] = cat['id']

megadetector/data_management/camtrap_dp_to_coco.py CHANGED Viewed

@@ -19,6 +19,8 @@ Currently supports only sequence-level labeling.
 import os
 import json
+import argparse
 import pandas as pd
 from dateutil import parser as dateparser
@@ -31,22 +33,26 @@ from collections import defaultdict
 def camtrap_dp_to_coco(camtrap_dp_folder,output_file=None):
     """
     Convert the Camtrap DP package in [camtrap_dp_folder] to COCO.
     Does not validate images, just converts.  Use integrity_check_json_db to validate
-    the resulting COCO file.
+    the resulting COCO file.
     Optionally writes the results to [output_file]
+    Args:
+        camtrap_dp_folder (str): input folder, containing a CamtrapDP package
+        output_file (str, optional): COCO-formatted output file
     """
     required_files = ('datapackage.json','deployments.csv','events.csv','media.csv','observations.csv')
     for fn in required_files:
         fn_abs = os.path.join(camtrap_dp_folder,fn)
         assert os.path.isfile(fn_abs), 'Could not find required file {}'.format(fn_abs)
     with open(os.path.join(camtrap_dp_folder,'datapackage.json'),'r') as f:
         datapackage = json.load(f)
     assert datapackage['profile'] == 'https://raw.githubusercontent.com/tdwg/camtrap-dp/1.0/camtrap-dp-profile.json', \
         'I only know how to parse Camtrap DP 1.0 packages'
@@ -54,7 +60,7 @@ def camtrap_dp_to_coco(camtrap_dp_folder,output_file=None):
     events_file = None
     media_file = None
     observations_file = None
     resources = datapackage['resources']
     for r in resources:
         if r['name'] == 'deployments':
@@ -70,19 +76,19 @@ def camtrap_dp_to_coco(camtrap_dp_folder,output_file=None):
     assert events_file is not None, 'No events file specified'
     assert media_file is not None, 'No media file specified'
     assert observations_file is not None, 'No observation file specified'
     deployments_df = pd.read_csv(os.path.join(camtrap_dp_folder,deployments_file))
     events_df = pd.read_csv(os.path.join(camtrap_dp_folder,events_file))
     media_df = pd.read_csv(os.path.join(camtrap_dp_folder,media_file))
     observations_df = pd.read_csv(os.path.join(camtrap_dp_folder,observations_file))
     print('Read {} deployment lines'.format(len(deployments_df)))
     print('Read {} events lines'.format(len(events_df)))
     print('Read {} media lines'.format(len(media_df)))
     print('Read {} observation lines'.format(len(observations_df)))
     media_id_to_media_info = {}
     # i_row = 0; row = media_df.iloc[i_row]
     for i_row,row in media_df.iterrows():
         media_info = {}
@@ -94,23 +100,23 @@ def camtrap_dp_to_coco(camtrap_dp_folder,output_file=None):
         media_info['frame_num'] = -1
         media_info['seq_num_frames'] = -1
         media_id_to_media_info[row['mediaID']] = media_info
     event_id_to_media_ids = defaultdict(list)
     # i_row = 0; row = events_df.iloc[i_row]
     for i_row,row in events_df.iterrows():
         media_id = row['mediaID']
         assert media_id in media_id_to_media_info
         event_id_to_media_ids[row['eventID']].append(media_id)
     event_id_to_category_names = defaultdict(set)
     # i_row = 0; row = observations_df.iloc[i_row]
     for i_row,row in observations_df.iterrows():
         if row['observationLevel'] != 'event':
             raise ValueError("I don't know how to parse image-level events yet")
         if row['observationType'] == 'blank':
             event_id_to_category_names[row['eventID']].add('empty')
         elif row['observationType'] == 'unknown':
@@ -122,7 +128,7 @@ def camtrap_dp_to_coco(camtrap_dp_folder,output_file=None):
             assert row['observationType'] == 'animal'
             assert isinstance(row['scientificName'],str)
             event_id_to_category_names[row['eventID']].add(row['scientificName'])
     # Sort images within an event into frame numbers
     #
     # event_id = next(iter(event_id_to_media_ids))
@@ -134,7 +140,7 @@ def camtrap_dp_to_coco(camtrap_dp_folder,output_file=None):
             media_info['frame_num'] = i_media
             media_info['seq_num_frames'] = len(media_info_this_event)
             media_info['seq_id'] = event_id
     # Create category names
     category_name_to_category_id = {'empty':0}
     for event_id in event_id_to_category_names:
@@ -142,18 +148,18 @@ def camtrap_dp_to_coco(camtrap_dp_folder,output_file=None):
         for name in category_names_this_event:
             if name not in category_name_to_category_id:
                 category_name_to_category_id[name] = len(category_name_to_category_id)
     # Move everything into COCO format
     images = list(media_id_to_media_info.values())
     categories = []
     for name in category_name_to_category_id:
         categories.append({'name':name,'id':category_name_to_category_id[name]})
     info = {'version':1.0,'description':datapackage['name']}
     # Create annotations
     annotations = []
     for event_id in event_id_to_media_ids.keys():
         i_ann = 0
         media_ids_this_event = event_id_to_media_ids[event_id]
@@ -168,23 +174,23 @@ def camtrap_dp_to_coco(camtrap_dp_folder,output_file=None):
                 ann['category_id'] = category_name_to_category_id[category_name]
                 ann['sequence_level_annotation'] = True
                 annotations.append(ann)
     coco_data = {}
     coco_data['images'] = images
     coco_data['annotations'] = annotations
     coco_data['categories'] = categories
     coco_data['info'] = info
     for im in coco_data['images']:
         im['datetime'] = str(im['datetime'] )
     if output_file is not None:
         with open(output_file,'w') as f:
             json.dump(coco_data,f,indent=1)
     return coco_data
 #%% Interactive driver
 if False:
@@ -192,19 +198,19 @@ if False:
     pass
     #%%
     camtrap_dp_folder = r'C:\temp\pilot2\pilot2'
     coco_file = os.path.join(camtrap_dp_folder,'test-coco.json')
     coco_data = camtrap_dp_to_coco(camtrap_dp_folder,
                                    output_file=coco_file)
     #%% Validate
     from megadetector.data_management.databases.integrity_check_json_db import \
         integrity_check_json_db, IntegrityCheckOptions
     options = IntegrityCheckOptions()
     options.baseDir = camtrap_dp_folder
     options.bCheckImageSizes = False
     options.bCheckImageExistence = True
@@ -213,25 +219,52 @@ if False:
     options.iMaxNumImages = -1
     options.nThreads = 1
     options.verbose = True
-    sortedCategories, data, errorInfo = integrity_check_json_db(coco_file,options)
+    sorted_categories, data, error_info = integrity_check_json_db(coco_file,options)
     #%% Preview
     from megadetector.visualization.visualize_db import DbVizOptions, visualize_db
     options = DbVizOptions()
     options.parallelize_rendering = True
     options.parallelize_rendering_with_threads = True
     options.parallelize_rendering_n_cores = 10
     preview_dir = r'c:\temp\camtrapdp-preview'
-    htmlOutputFile,image_db = visualize_db(coco_file, preview_dir, camtrap_dp_folder, options=options)
+    html_output_file, image_db = visualize_db(coco_file, preview_dir, camtrap_dp_folder, options=options)
     from megadetector.utils.path_utils import open_file
-    open_file(htmlOutputFile)
+    open_file(html_output_file)
 #%% Command-line driver
-# TODO
+def main():
+    """
+    Command-line interface to convert Camtrap DP to COCO.
+    """
+    parser = argparse.ArgumentParser(description='Convert Camtrap DP to COCO format')
+    parser.add_argument('camtrap_dp_folder', type=str,
+                        help='Input folder, containing a CamtrapDP package')
+    parser.add_argument('--output_file', type=str, default=None,
+                        help='COCO-formatted output file (defaults to [camtrap_dp_folder]_coco.json)')
+    args = parser.parse_args()
+    if args.output_file is None:
+        # Default output file name: [camtrap_dp_folder]_coco.json
+        #
+        # Remove trailing slash if present
+        folder_name = args.camtrap_dp_folder.rstrip(os.sep)
+        output_file = folder_name + '_coco.json'
+    else:
+        output_file = args.output_file
+    camtrap_dp_to_coco(camtrap_dp_folder=args.camtrap_dp_folder, output_file=output_file)
+    print(f"Successfully converted Camtrap DP package at '{args.camtrap_dp_folder}' to " + \
+          f"COCO format at '{output_file}'")
+if __name__ == '__main__':
+    main()

megadetector 5.0.28__py3-none-any.whl → 10.0.0__py3-none-any.whl

Potentially problematic release.

megadetector 5.0.28__py3-none-any.whl → 10.0.0__py3-none-any.whl