PyPI - megadetector - Versions diffs - 5.0.27__py3-none-any.whl → 5.0.29__py3-none-any.whl - Mend

megadetector 5.0.27-py3-none-any.whl → 5.0.29-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of megadetector might be problematic. Click here for more details.

Files changed (176) hide show

megadetector/api/batch_processing/api_core/batch_service/score.py +4 -5
megadetector/api/batch_processing/api_core_support/aggregate_results_manually.py +1 -1
megadetector/api/batch_processing/api_support/summarize_daily_activity.py +1 -1
megadetector/api/batch_processing/integration/digiKam/xmp_integration.py +2 -2
megadetector/api/batch_processing/integration/eMammal/test_scripts/push_annotations_to_emammal.py +1 -1
megadetector/api/batch_processing/integration/eMammal/test_scripts/select_images_for_testing.py +1 -1
megadetector/api/synchronous/api_core/tests/load_test.py +2 -3
megadetector/classification/aggregate_classifier_probs.py +3 -3
megadetector/classification/analyze_failed_images.py +5 -5
megadetector/classification/cache_batchapi_outputs.py +5 -5
megadetector/classification/create_classification_dataset.py +11 -12
megadetector/classification/crop_detections.py +10 -10
megadetector/classification/csv_to_json.py +8 -8
megadetector/classification/detect_and_crop.py +13 -15
megadetector/classification/evaluate_model.py +7 -7
megadetector/classification/identify_mislabeled_candidates.py +6 -6
megadetector/classification/json_to_azcopy_list.py +1 -1
megadetector/classification/json_validator.py +29 -32
megadetector/classification/map_classification_categories.py +9 -9
megadetector/classification/merge_classification_detection_output.py +12 -9
megadetector/classification/prepare_classification_script.py +19 -19
megadetector/classification/prepare_classification_script_mc.py +23 -23
megadetector/classification/run_classifier.py +4 -4
megadetector/classification/save_mislabeled.py +6 -6
megadetector/classification/train_classifier.py +1 -1
megadetector/classification/train_classifier_tf.py +9 -9
megadetector/classification/train_utils.py +10 -10
megadetector/data_management/annotations/annotation_constants.py +1 -1
megadetector/data_management/camtrap_dp_to_coco.py +45 -45
megadetector/data_management/cct_json_utils.py +101 -101
megadetector/data_management/cct_to_md.py +49 -49
megadetector/data_management/cct_to_wi.py +33 -33
megadetector/data_management/coco_to_labelme.py +75 -75
megadetector/data_management/coco_to_yolo.py +189 -189
megadetector/data_management/databases/add_width_and_height_to_db.py +3 -2
megadetector/data_management/databases/combine_coco_camera_traps_files.py +38 -38
megadetector/data_management/databases/integrity_check_json_db.py +202 -188
megadetector/data_management/databases/subset_json_db.py +33 -33
megadetector/data_management/generate_crops_from_cct.py +38 -38
megadetector/data_management/get_image_sizes.py +54 -49
megadetector/data_management/labelme_to_coco.py +130 -124
megadetector/data_management/labelme_to_yolo.py +78 -72
megadetector/data_management/lila/create_lila_blank_set.py +81 -83
megadetector/data_management/lila/create_lila_test_set.py +32 -31
megadetector/data_management/lila/create_links_to_md_results_files.py +18 -18
megadetector/data_management/lila/download_lila_subset.py +21 -24
megadetector/data_management/lila/generate_lila_per_image_labels.py +91 -91
megadetector/data_management/lila/get_lila_annotation_counts.py +30 -30
megadetector/data_management/lila/get_lila_image_counts.py +22 -22
megadetector/data_management/lila/lila_common.py +70 -70
megadetector/data_management/lila/test_lila_metadata_urls.py +13 -14
megadetector/data_management/mewc_to_md.py +339 -340
megadetector/data_management/ocr_tools.py +258 -252
megadetector/data_management/read_exif.py +232 -223
megadetector/data_management/remap_coco_categories.py +26 -26
megadetector/data_management/remove_exif.py +31 -20
megadetector/data_management/rename_images.py +187 -187
megadetector/data_management/resize_coco_dataset.py +41 -41
megadetector/data_management/speciesnet_to_md.py +41 -41
megadetector/data_management/wi_download_csv_to_coco.py +55 -55
megadetector/data_management/yolo_output_to_md_output.py +117 -120
megadetector/data_management/yolo_to_coco.py +195 -188
megadetector/detection/change_detection.py +831 -0
megadetector/detection/process_video.py +341 -338
megadetector/detection/pytorch_detector.py +308 -266
megadetector/detection/run_detector.py +186 -166
megadetector/detection/run_detector_batch.py +366 -364
megadetector/detection/run_inference_with_yolov5_val.py +328 -325
megadetector/detection/run_tiled_inference.py +312 -253
megadetector/detection/tf_detector.py +24 -24
megadetector/detection/video_utils.py +291 -283
megadetector/postprocessing/add_max_conf.py +15 -11
megadetector/postprocessing/categorize_detections_by_size.py +44 -44
megadetector/postprocessing/classification_postprocessing.py +808 -311
megadetector/postprocessing/combine_batch_outputs.py +20 -21
megadetector/postprocessing/compare_batch_results.py +528 -517
megadetector/postprocessing/convert_output_format.py +97 -97
megadetector/postprocessing/create_crop_folder.py +220 -147
megadetector/postprocessing/detector_calibration.py +173 -168
megadetector/postprocessing/generate_csv_report.py +508 -0
megadetector/postprocessing/load_api_results.py +25 -22
megadetector/postprocessing/md_to_coco.py +129 -98
megadetector/postprocessing/md_to_labelme.py +89 -83
megadetector/postprocessing/md_to_wi.py +40 -40
megadetector/postprocessing/merge_detections.py +87 -114
megadetector/postprocessing/postprocess_batch_results.py +319 -302
megadetector/postprocessing/remap_detection_categories.py +36 -36
megadetector/postprocessing/render_detection_confusion_matrix.py +205 -199
megadetector/postprocessing/repeat_detection_elimination/find_repeat_detections.py +57 -57
megadetector/postprocessing/repeat_detection_elimination/remove_repeat_detections.py +27 -28
megadetector/postprocessing/repeat_detection_elimination/repeat_detections_core.py +702 -677
megadetector/postprocessing/separate_detections_into_folders.py +226 -211
megadetector/postprocessing/subset_json_detector_output.py +265 -262
megadetector/postprocessing/top_folders_to_bottom.py +45 -45
megadetector/postprocessing/validate_batch_results.py +70 -70
megadetector/taxonomy_mapping/map_lila_taxonomy_to_wi_taxonomy.py +52 -52
megadetector/taxonomy_mapping/map_new_lila_datasets.py +15 -15
megadetector/taxonomy_mapping/prepare_lila_taxonomy_release.py +14 -14
megadetector/taxonomy_mapping/preview_lila_taxonomy.py +66 -69
megadetector/taxonomy_mapping/retrieve_sample_image.py +16 -16
megadetector/taxonomy_mapping/simple_image_download.py +8 -8
megadetector/taxonomy_mapping/species_lookup.py +33 -33
megadetector/taxonomy_mapping/taxonomy_csv_checker.py +14 -14
megadetector/taxonomy_mapping/taxonomy_graph.py +11 -11
megadetector/taxonomy_mapping/validate_lila_category_mappings.py +13 -13
megadetector/utils/azure_utils.py +22 -22
megadetector/utils/ct_utils.py +1019 -200
megadetector/utils/directory_listing.py +21 -77
megadetector/utils/gpu_test.py +22 -22
megadetector/utils/md_tests.py +541 -518
megadetector/utils/path_utils.py +1511 -406
megadetector/utils/process_utils.py +41 -41
megadetector/utils/sas_blob_utils.py +53 -49
megadetector/utils/split_locations_into_train_val.py +73 -60
megadetector/utils/string_utils.py +147 -26
megadetector/utils/url_utils.py +463 -173
megadetector/utils/wi_utils.py +2629 -2868
megadetector/utils/write_html_image_list.py +137 -137
megadetector/visualization/plot_utils.py +21 -21
megadetector/visualization/render_images_with_thumbnails.py +37 -73
megadetector/visualization/visualization_utils.py +424 -404
megadetector/visualization/visualize_db.py +197 -190
megadetector/visualization/visualize_detector_output.py +126 -98
{megadetector-5.0.27.dist-info → megadetector-5.0.29.dist-info}/METADATA +6 -3
megadetector-5.0.29.dist-info/RECORD +163 -0
{megadetector-5.0.27.dist-info → megadetector-5.0.29.dist-info}/WHEEL +1 -1
megadetector/data_management/importers/add_nacti_sizes.py +0 -52
megadetector/data_management/importers/add_timestamps_to_icct.py +0 -79
megadetector/data_management/importers/animl_results_to_md_results.py +0 -158
megadetector/data_management/importers/auckland_doc_test_to_json.py +0 -373
megadetector/data_management/importers/auckland_doc_to_json.py +0 -201
megadetector/data_management/importers/awc_to_json.py +0 -191
megadetector/data_management/importers/bellevue_to_json.py +0 -272
megadetector/data_management/importers/cacophony-thermal-importer.py +0 -793
megadetector/data_management/importers/carrizo_shrubfree_2018.py +0 -269
megadetector/data_management/importers/carrizo_trail_cam_2017.py +0 -289
megadetector/data_management/importers/cct_field_adjustments.py +0 -58
megadetector/data_management/importers/channel_islands_to_cct.py +0 -913
megadetector/data_management/importers/eMammal/copy_and_unzip_emammal.py +0 -180
megadetector/data_management/importers/eMammal/eMammal_helpers.py +0 -249
megadetector/data_management/importers/eMammal/make_eMammal_json.py +0 -223
megadetector/data_management/importers/ena24_to_json.py +0 -276
megadetector/data_management/importers/filenames_to_json.py +0 -386
megadetector/data_management/importers/helena_to_cct.py +0 -283
megadetector/data_management/importers/idaho-camera-traps.py +0 -1407
megadetector/data_management/importers/idfg_iwildcam_lila_prep.py +0 -294
megadetector/data_management/importers/import_desert_lion_conservation_camera_traps.py +0 -387
megadetector/data_management/importers/jb_csv_to_json.py +0 -150
megadetector/data_management/importers/mcgill_to_json.py +0 -250
megadetector/data_management/importers/missouri_to_json.py +0 -490
megadetector/data_management/importers/nacti_fieldname_adjustments.py +0 -79
megadetector/data_management/importers/noaa_seals_2019.py +0 -181
megadetector/data_management/importers/osu-small-animals-to-json.py +0 -364
megadetector/data_management/importers/pc_to_json.py +0 -365
megadetector/data_management/importers/plot_wni_giraffes.py +0 -123
megadetector/data_management/importers/prepare_zsl_imerit.py +0 -131
megadetector/data_management/importers/raic_csv_to_md_results.py +0 -416
megadetector/data_management/importers/rspb_to_json.py +0 -356
megadetector/data_management/importers/save_the_elephants_survey_A.py +0 -320
megadetector/data_management/importers/save_the_elephants_survey_B.py +0 -329
megadetector/data_management/importers/snapshot_safari_importer.py +0 -758
megadetector/data_management/importers/snapshot_serengeti_lila.py +0 -1067
megadetector/data_management/importers/snapshotserengeti/make_full_SS_json.py +0 -150
megadetector/data_management/importers/snapshotserengeti/make_per_season_SS_json.py +0 -153
megadetector/data_management/importers/sulross_get_exif.py +0 -65
megadetector/data_management/importers/timelapse_csv_set_to_json.py +0 -490
megadetector/data_management/importers/ubc_to_json.py +0 -399
megadetector/data_management/importers/umn_to_json.py +0 -507
megadetector/data_management/importers/wellington_to_json.py +0 -263
megadetector/data_management/importers/wi_to_json.py +0 -442
megadetector/data_management/importers/zamba_results_to_md_results.py +0 -180
megadetector/data_management/lila/add_locations_to_island_camera_traps.py +0 -101
megadetector/data_management/lila/add_locations_to_nacti.py +0 -151
megadetector-5.0.27.dist-info/RECORD +0 -208
{megadetector-5.0.27.dist-info → megadetector-5.0.29.dist-info}/licenses/LICENSE +0 -0
{megadetector-5.0.27.dist-info → megadetector-5.0.29.dist-info}/top_level.txt +0 -0

megadetector/postprocessing/separate_detections_into_folders.py CHANGED Viewed

@@ -5,7 +5,7 @@ separate_detections_into_folders.py
 **Overview**
 Given a .json file with batch processing results, separate the files in that
-set of results into folders that contain animals/people/vehicles/nothing,
+set of results into folders that contain animals/people/vehicles/nothing,
 according to per-class thresholds.
 Image files are copied, not moved.
@@ -63,15 +63,15 @@ In this scenario, the folders within "animals" will be:
 deer, cow, multiple, unclassified
-"multiple" in this case only means "deer and cow"; if an image is classified as containing a
+"multiple" in this case only means "deer and cow"; if an image is classified as containing a
 bird and a bear, that would end up in "unclassified", since the folder separation is based only
 on the categories you provide at the command line.
-No classification-based separation is done within the animal_person, animal_vehicle, or
+No classification-based separation is done within the animal_person, animal_vehicle, or
 animal_person_vehicle folders.
 """
 #%% Constants and imports
 import argparse
@@ -108,13 +108,13 @@ class SeparateDetectionsIntoFoldersOptions:
     """
     Options used to parameterize separate_detections_into_folders()
     """
     def __init__(self,threshold=None):
         #: Default threshold for categories not specified in category_name_to_threshold
         self.threshold = None
-        #: Dict mapping category names to thresholds; for example, an image with only a detection of class
+        #: Dict mapping category names to thresholds; for example, an image with only a detection of class
         #: "animal" whose confidence is greater than or equal to category_name_to_threshold['animal']
         #: will be put in the "animal" folder.
         self.category_name_to_threshold = {
@@ -122,130 +122,130 @@ class SeparateDetectionsIntoFoldersOptions:
             'person': self.threshold,
             'vehicle': self.threshold
         }
         #: Number of workers to use, set to <= 1 to disable parallelization
         self.n_threads = 1
         #: By default, this function errors if you try to output to an existing folder
         self.allow_existing_directory = False
         #: By default, this function errors if any of the images specified in the results file don't
         #: exist in the source folder.
         self.allow_missing_files = False
         #: Whether to overwrite images that already exist in the target folder; only relevant if
         #: [allow_existing_directory] is True
         self.overwrite = True
         #: Whether to skip empty images; if this is False, empty images (i.e., images with no detections
         #: above the corresponding threshold) will be copied to an "empty" folder.
         self.skip_empty_images = False
         #: The MD results .json file to process
         self.results_file = None
         #: The folder containing source images; filenames in [results_file] should be relative to this
         #: folder.
         self.base_input_folder = None
         #: The folder to which we should write output images; see the module header comment for information
         #: about how that folder will be structured.
         self.base_output_folder = None
         #: Should we move rather than copy?
         self.move_images = False
         #: Should we render boxes on the output images?  Makes everything a lot slower.
         self.render_boxes = False
         #: Line thickness in pixels; only relevant if [render_boxes] is True
         self.line_thickness = default_line_thickness
         #: Box expansion in pixels; only relevant if [render_boxes] is True
         self.box_expansion = default_box_expansion
         #: Originally specified as a string that looks like this:
         #:
         #: deer=0.75,cow=0.75
         #:
-        #: String, converted internally to a dict mapping name:threshold
+        #: String, converted internally to a dict mapping name:threshold
         self.classification_thresholds = None
         ## Debug or internal attributes
         #: Do not set explicitly; populated from data when using classification results
         self.classification_category_id_to_name = None
         #: Do not set explicitly; populated from data when using classification results
         self.classification_categories = None
         #: Used to test this script; sets a limit on the number of images to process.
         self.debug_max_images = None
         #: Do not set explicitly; this gets created based on [results_file]
         #:
         #:Dictionary mapping categories (plus combinations of categories, and 'empty') to output folders
         self.category_name_to_folder = None
         #: Do not set explicitly; this gets loaded from [results_file]
         self.category_id_to_category_name = None
         #: List of category names for which we should blur detections, most commonly ['person']
         #:
-        #: Can also be a comma-separated list.
+        #: Can also be a comma-separated list.
         self.category_names_to_blur = None
         #: Remove all empty folders from the target folder at the end of the process,
         #: whether or not they were created by this script
         self.remove_empty_folders = False
     # ...__init__()
-# ...class SeparateDetectionsIntoFoldersOptions
+# ...class SeparateDetectionsIntoFoldersOptions
 #%% Support functions
 def _path_is_abs(p): return (len(p) > 1) and (p[0] == '/' or p[1] == ':')
 printed_missing_file_warning = False
 def _process_detections(im,options):
     """
     Process all detections for a single image
     May modify *im*.
     """
     global printed_missing_file_warning
     relative_filename = im['file']
-    detections = None
+    detections = None
     if 'detections' in im:
         detections = im['detections']
     categories_above_threshold = None
     if detections is None:
         assert im['failure'] is not None and len(im['failure']) > 0
         target_folder = options.category_name_to_folder['failure']
     else:
         category_name_to_max_confidence = {}
         category_names = options.category_id_to_category_name.values()
         for category_name in category_names:
             category_name_to_max_confidence[category_name] = 0.0
         # Find the maximum confidence for each category
         #
         # det = detections[0]
         for det in detections:
             category_id = det['category']
             # For zero-confidence detections, we occasionally have leftover goop
             # from COCO classes
             if category_id not in options.category_id_to_category_name:
@@ -253,79 +253,79 @@ def _process_detections(im,options):
                     category_id,relative_filename))
                 # assert det['conf'] < invalid_category_epsilon
                 continue
             category_name = options.category_id_to_category_name[category_id]
             if det['conf'] > category_name_to_max_confidence[category_name]:
                 category_name_to_max_confidence[category_name] = det['conf']
         # ...for each detection on this image
         # Count the number of thresholds exceeded
         categories_above_threshold = []
         for category_name in category_names:
             threshold = options.category_name_to_threshold[category_name]
             assert threshold is not None
             max_confidence_this_category = category_name_to_max_confidence[category_name]
             if max_confidence_this_category >= threshold:
                 categories_above_threshold.append(category_name)
         # ...for each category
         categories_above_threshold.sort()
         using_classification_folders = (options.classification_thresholds is not None and \
                                         len(options.classification_thresholds) > 0)
         # If this is above multiple thresholds
         if len(categories_above_threshold) > 1:
             # Currently "animal_person" images get put into the "animal_person" folder, even if we're
             # doing species-based separation.  Ideally, we would optionally put these in either the "deer"
             # folder or a "deer_person" folder, but this is pretty esoteric, so not worrying about this
             # for now.
             target_folder = options.category_name_to_folder['_'.join(categories_above_threshold)]
         elif len(categories_above_threshold) == 0:
             target_folder = options.category_name_to_folder['empty']
         else:
             assert len(categories_above_threshold) == 1
             target_folder = options.category_name_to_folder[categories_above_threshold[0]]
             # Are we making species classification folders, and is this an animal?
             if ('animal' in categories_above_threshold) and (using_classification_folders):
                 # Do we need to put this into a specific species folder?
                 # Find the animal-class detections that are above threshold
                 category_name_to_id = {v: k for k, v in options.category_id_to_category_name.items()}
                 animal_category_id = category_name_to_id['animal']
                 valid_animal_detections = [d for d in detections if \
                                            (d['category'] == animal_category_id and \
                                            d['conf'] >= options.category_name_to_threshold['animal'])]
                 # Count the number of classification categories that are above threshold for at
                 # least one detection
                 classification_categories_above_threshold = set()
                 # d = valid_animal_detections[0]
                 for d in valid_animal_detections:
                     if 'classifications' not in d or d['classifications'] is None:
                         continue
                     # classification = d['classifications'][0]
                     for classification in d['classifications']:
                         classification_category_id = classification[0]
                         classification_confidence = classification[1]
-                        # Do we have a threshold for this category, and if so, is
+                        # Do we have a threshold for this category, and if so, is
                         # this classification above threshold?
                         assert options.classification_category_id_to_name is not None
                         classification_category_name = \
@@ -334,78 +334,78 @@ def _process_detections(im,options):
                             (classification_confidence > \
                              options.classification_thresholds[classification_category_name]):
                             classification_categories_above_threshold.add(classification_category_name)
                     # ...for each classification
                 # ...for each detection
                 if len(classification_categories_above_threshold) == 0:
                     classification_folder_name = 'unclassified'
                 elif len(classification_categories_above_threshold) > 1:
                     classification_folder_name = 'multiple'
                 else:
                     assert len(classification_categories_above_threshold) == 1
-                    classification_folder_name = list(classification_categories_above_threshold)[0]
+                    classification_folder_name = list(classification_categories_above_threshold)[0]
                 target_folder = os.path.join(target_folder,classification_folder_name)
-            # ...if we have to deal with classification subfolders
+            # ...if we have to deal with classification subfolders
         # ...if we have 0/1/more categories above threshold
     # ...if this is/isn't a failure case
     source_path = os.path.join(options.base_input_folder,relative_filename)
     if not os.path.isfile(source_path):
         if not options.allow_missing_files:
             raise ValueError('Cannot find file {}'.format(source_path))
         else:
             if not printed_missing_file_warning:
-                print('Warning: cannot find at least one file ({})'.format(source_path))
+                print('Warning: cannot find at least one file ({})'.format(source_path))
                 printed_missing_file_warning = True
             return
     target_path = os.path.join(target_folder,relative_filename)
     if (not options.overwrite) and (os.path.isfile(target_path)):
         return
     target_dir = os.path.dirname(target_path)
     os.makedirs(target_dir,exist_ok=True)
     # Skip this image if it's empty and we're not processing empty images
     if ((categories_above_threshold is None) or (len(categories_above_threshold) == 0)) and \
         options.skip_empty_images:
         return
     # At this point, this image is getting copied; we may or may not also need to
     # draw bounding boxes or blur pixels.
     # Do a simple copy operation if we don't need to manipulate the images (render boxes, blur pixels)
     if (not options.render_boxes and (options.category_names_to_blur is None)) or \
         (categories_above_threshold is None) or \
         (len(categories_above_threshold) == 0):
         if options.move_images:
             shutil.move(source_path,target_path)
         else:
             shutil.copyfile(source_path,target_path)
     else:
         # Open the source image
         pil_image = vis_utils.load_image(source_path)
         # Blur regions in the image if necessary
         category_names_to_blur = options.category_names_to_blur
         if category_names_to_blur is not None:
             if isinstance(category_names_to_blur,str):
                 category_names_to_blur = category_names_to_blur.split(',')
                 category_names_to_blur = [s.strip() for s in category_names_to_blur]
             detections_to_blur = []
             for d in detections:
                 category_name = options.category_id_to_category_name[d['category']]
@@ -414,74 +414,74 @@ def _process_detections(im,options):
                     detections_to_blur.append(d)
             if len(detections_to_blur) > 0:
                 blur_detections(pil_image,detections_to_blur)
         # Render bounding boxes for each category separately, because
         # we allow different thresholds for each category.
         category_name_to_id = {v: k for k, v in options.category_id_to_category_name.items()}
         assert len(category_name_to_id) == len(options.category_id_to_category_name)
         classification_label_map = None
         if using_classification_folders:
             classification_label_map = options.classification_categories
         for category_name in categories_above_threshold:
             category_id = category_name_to_id[category_name]
             category_threshold = options.category_name_to_threshold[category_name]
             assert category_threshold is not None
             category_detections = [d for d in detections if d['category'] == category_id]
             # When we're not using classification folders, remove classification
             # information to maintain standard detection colors.
             if not using_classification_folders:
                 for d in category_detections:
                     if 'classifications' in d:
                         del d['classifications']
             vis_utils.render_detection_bounding_boxes(
-                category_detections,
+                category_detections,
                 pil_image,
-                label_map=options.detection_categories,
+                label_map=options.detection_categories,
                 classification_label_map=classification_label_map,
                 confidence_threshold=category_threshold,
                 thickness=options.line_thickness,
                 expansion=options.box_expansion)
         # ...for each category
         # Try to preserve EXIF data and image quality when saving
-        vis_utils.exif_preserving_save(pil_image,target_path)
+        vis_utils.exif_preserving_save(pil_image,target_path)
     # ...if we don't/do need to render boxes
 # ...def _process_detections()
 #%% Main function
 def separate_detections_into_folders(options):
     """
     Given a .json file with batch processing results, separate the files in that
-    set of results into folders that contain animals/people/vehicles/nothing,
-    according to per-class thresholds.  See the header comment of this module for
+    set of results into folders that contain animals/people/vehicles/nothing,
+    according to per-class thresholds.  See the header comment of this module for
     more details about the output folder structure.
     Args:
         options (SeparateDetectionsIntoFoldersOptions): parameters guiding image
         separation, see the SeparateDetectionsIntoFoldersOptions documentation for specific
         options.
     """
     # Input validation
     # Currently we don't support moving (instead of copying) when we're also rendering
     # bounding boxes or blurring humans.
     assert not (options.render_boxes and options.move_images), \
         'Cannot specify both render_boxes and move_images'
     assert not ((options.category_names_to_blur is not None) and options.move_images), \
         'Cannot specify both category_names_to_blur and move_images'
     # Create output folder if necessary
     if (os.path.isdir(options.base_output_folder)) and \
         (len(os.listdir(options.base_output_folder) ) > 0):
@@ -490,113 +490,113 @@ def separate_detections_into_folders(options):
                   'you mean to delete an old version?')
         else:
             raise ValueError('Target folder exists and is not empty')
-    os.makedirs(options.base_output_folder,exist_ok=True)
-    # Load detection results
+    os.makedirs(options.base_output_folder,exist_ok=True)
+    # Load detection results
     print('Loading detection results')
     results = json.load(open(options.results_file))
     images = results['images']
     for im in images:
         fn = im['file']
         assert not _path_is_abs(fn), 'Cannot process results with absolute image paths'
     print('Processing detections for {} images'.format(len(images)))
     default_threshold = options.threshold
-    if default_threshold is None:
-        default_threshold = get_typical_confidence_threshold_from_results(results)
-    detection_categories = results['detection_categories']
+    if default_threshold is None:
+        default_threshold = get_typical_confidence_threshold_from_results(results)
+    detection_categories = results['detection_categories']
     options.detection_categories = detection_categories
     options.category_id_to_category_name = detection_categories
     # Map class names to output folders
     options.category_name_to_folder = {}
     options.category_name_to_folder['empty'] = os.path.join(options.base_output_folder,'empty')
     options.category_name_to_folder['failure'] =\
         os.path.join(options.base_output_folder,'processing_failure')
     # Create all combinations of categories
     category_names = list(detection_categories.values())
     category_names.sort()
     # category_name = category_names[0]
-    for category_name in category_names:
+    for category_name in category_names:
         # Do we have a custom threshold for this category?
         if category_name not in options.category_name_to_threshold:
             print('Warning: category {} in detection file, but not in threshold mapping'.format(
                 category_name))
             options.category_name_to_threshold[category_name] = None
         if options.category_name_to_threshold[category_name] is None:
             options.category_name_to_threshold[category_name] = default_threshold
         category_threshold = options.category_name_to_threshold[category_name]
         print('Processing category {} at threshold {}'.format(category_name,category_threshold))
     target_category_names = []
     for c in category_names:
         target_category_names.append(c)
     for combination_length in range(2,len(category_names)+1):
         combined_category_names = list(itertools.combinations(category_names,combination_length))
-        for combination in combined_category_names:
+        for combination in combined_category_names:
             combined_name = '_'.join(combination)
             target_category_names.append(combined_name)
     # Create folder mappings for each category
     for category_name in target_category_names:
         folder_name = category_name
-        if category_name in friendly_folder_names:
+        if category_name in friendly_folder_names:
             folder_name = friendly_folder_names[category_name]
         options.category_name_to_folder[category_name] = \
             os.path.join(options.base_output_folder,folder_name)
     # Create the actual folders
     for folder in options.category_name_to_folder.values():
-        os.makedirs(folder,exist_ok=True)
+        os.makedirs(folder,exist_ok=True)
     # Handle species classification thresholds, if specified
     if options.classification_thresholds is not None:
         assert 'classification_categories' in results and \
             results['classification_categories'] is not None, \
             'Classification thresholds specified, but no classification results available'
         classification_categories = results['classification_categories']
         classification_category_name_to_id = {v: k for k, v in classification_categories.items()}
         classification_category_id_to_name = {k: v for k, v in classification_categories.items()}
         options.classification_category_id_to_name = classification_category_id_to_name
         options.classification_categories = classification_categories
         if isinstance(options.classification_thresholds,str):
             # E.g. deer=0.75,cow=0.75
             tokens = options.classification_thresholds.split(',')
             classification_thresholds = {}
             # token = tokens[0]
             for token in tokens:
                 subtokens = token.split('=')
                 assert len(subtokens) == 2 and is_float(subtokens[1]), \
-                    'Illegal classification threshold {}'.format(token)
+                    'Illegal classification threshold {}'.format(token)
                 classification_thresholds[subtokens[0]] = float(subtokens[1])
             # ...for each token
-            options.classification_thresholds = classification_thresholds
+            options.classification_thresholds = classification_thresholds
         # ...if classification thresholds are still in string format
         # Validate the classes in the threshold list
         for class_name in options.classification_thresholds.keys():
             assert class_name in classification_category_name_to_id, \
@@ -604,40 +604,40 @@ def separate_detections_into_folders(options):
                     class_name)
     # ...if we need to deal with classification categories
     if options.n_threads <= 1 or options.debug_max_images is not None:
         # i_image = 14; im = images[i_image]; im
         for i_image,im in enumerate(tqdm(images)):
             if options.debug_max_images is not None and i_image > options.debug_max_images:
                 break
             _process_detections(im,options)
         # ...for each image
     else:
         print('Starting a pool with {} threads'.format(options.n_threads))
         pool = ThreadPool(options.n_threads)
         process_detections_with_options = partial(_process_detections, options=options)
         _ = list(tqdm(pool.imap(process_detections_with_options, images), total=len(images)))
     if options.remove_empty_folders:
         print('Removing empty folders from {}'.format(options.base_output_folder))
         remove_empty_folders(options.base_output_folder)
 #  ...def separate_detections_into_folders
 #%% Interactive driver
 if False:
     pass
     #%%
     options = SeparateDetectionsIntoFoldersOptions()
     options.results_file = os.path.expanduser(
         '~/data/snapshot-safari-2022-08-16-KRU-v5a.0.0_detections.json')
     options.base_input_folder = os.path.expanduser('~/data/KRU/KRU_public')
@@ -645,11 +645,11 @@ if False:
     options.n_threads = 100
     options.render_boxes = True
     options.allow_existing_directory = True
     #%%
     options = SeparateDetectionsIntoFoldersOptions()
     options.results_file = os.path.expanduser('~/data/ena24-2022-06-15-v5a.0.0_megaclassifier.json')
     options.base_input_folder = os.path.expanduser('~/data/ENA24/images')
     options.base_output_folder = os.path.expanduser('~/data/ENA24-separated')
@@ -657,31 +657,45 @@ if False:
     options.classification_thresholds = 'deer=0.75,cow=0.75,bird=0.75'
     options.render_boxes = True
     options.allow_existing_directory = True
     #%%
     separate_detections_into_folders(options)
     #%% Testing various command-line invocations
     """
     # With boxes, no classification
-    python separate_detections_into_folders.py ~/data/ena24-2022-06-15-v5a.0.0_megaclassifier.json ~/data/ENA24/images ~/data/ENA24-separated --threshold 0.17 --animal_threshold 0.2 --n_threads 10 --allow_existing_directory --render_boxes --line_thickness 10 --box_expansion 10
+    python separate_detections_into_folders.py \
+        ~/data/ena24-2022-06-15-v5a.0.0_megaclassifier.json \
+        ~/data/ENA24/images ~/data/ENA24-separated \
+        --threshold 0.17 --animal_threshold 0.2 --n_threads 10 \
+        --allow_existing_directory --render_boxes --line_thickness 10 --box_expansion 10
     # No boxes, no classification (default)
-    python separate_detections_into_folders.py ~/data/ena24-2022-06-15-v5a.0.0_megaclassifier.json ~/data/ENA24/images ~/data/ENA24-separated --threshold 0.17 --animal_threshold 0.2 --n_threads 10 --allow_existing_directory
+    python separate_detections_into_folders.py \
+        ~/data/ena24-2022-06-15-v5a.0.0_megaclassifier.json \
+        ~/data/ENA24/images ~/data/ENA24-separated \
+        --threshold 0.17 --animal_threshold 0.2 --n_threads 10 --allow_existing_directory
     # With boxes, with classification
-    python separate_detections_into_folders.py ~/data/ena24-2022-06-15-v5a.0.0_megaclassifier.json ~/data/ENA24/images ~/data/ENA24-separated --threshold 0.17 --animal_threshold 0.2 --n_threads 10 --allow_existing_directory --render_boxes --line_thickness 10 --box_expansion 10 --classification_thresholds "deer=0.75,cow=0.75,bird=0.75"
+    python separate_detections_into_folders.py \
+        ~/data/ena24-2022-06-15-v5a.0.0_megaclassifier.json ~/data/ENA24/images ~/data/ENA24-separated \
+        --threshold 0.17 --animal_threshold 0.2 --n_threads 10 --allow_existing_directory \
+        --render_boxes --line_thickness 10 --box_expansion 10 \
+        --classification_thresholds "deer=0.75,cow=0.75,bird=0.75"
     # No boxes, with classification
-    python separate_detections_into_folders.py ~/data/ena24-2022-06-15-v5a.0.0_megaclassifier.json ~/data/ENA24/images ~/data/ENA24-separated --threshold 0.17 --animal_threshold 0.2 --n_threads 10 --allow_existing_directory --classification_thresholds "deer=0.75,cow=0.75,bird=0.75"
-    """
+    python separate_detections_into_folders.py \
+        ~/data/ena24-2022-06-15-v5a.0.0_megaclassifier.json ~/data/ENA24/images ~/data/ENA24-separated \
+        --threshold 0.17 --animal_threshold 0.2 --n_threads 10 --allow_existing_directory \
+        --classification_thresholds "deer=0.75,cow=0.75,bird=0.75"
+    """
 #%% Command-line driver
-def main():
+def main(): # noqa
     parser = argparse.ArgumentParser()
     parser.add_argument('results_file', type=str, help='Input .json filename')
     parser.add_argument('base_input_folder', type=str, help='Input image folder')
@@ -690,7 +704,7 @@ def main():
     parser.add_argument('--threshold', type=float, default=None,
                         help='Default confidence threshold for all categories (defaults to ' + \
                             'selection based on model version, other options may override this ' + \
-                            'for specific categories)')
+                            'for specific categories)')
     parser.add_argument('--animal_threshold', type=float, default=None,
                         help='Confidence threshold for the animal category')
     parser.add_argument('--human_threshold', type=float, default=None,
@@ -700,21 +714,21 @@ def main():
     parser.add_argument('--classification_thresholds', type=str, default=None,
                         help='List of classification thresholds to use for species-based folder ' + \
                              'separation, formatted as, e.g., "deer=0.75,cow=0.75"')
     parser.add_argument('--n_threads', type=int, default=1,
                         help='Number of threads to use for parallel operation (default=1)')
-    parser.add_argument('--allow_existing_directory', action='store_true',
+    parser.add_argument('--allow_existing_directory', action='store_true',
                         help='Proceed even if the target directory exists and is not empty')
-    parser.add_argument('--no_overwrite', action='store_true',
+    parser.add_argument('--no_overwrite', action='store_true',
                         help='Skip images that already exist in the target folder, must also ' + \
-                             'specify --allow_existing_directory')
+                             'specify --allow_existing_directory')
     parser.add_argument('--skip_empty_images', action='store_true',
                         help='Do not copy empty images to the output folder')
     parser.add_argument('--move_images', action='store_true',
                         help='Move images (rather than copying) (not recommended this if you have not ' + \
                              'backed up your data!)')
     parser.add_argument('--render_boxes', action='store_true',
                         help='Render bounding boxes on output images; may result in some ' + \
                              'metadata not being transferred')
@@ -727,20 +741,21 @@ def main():
                              'using render_boxes (defaults to {})'.format(
                              default_box_expansion))
     parser.add_argument('--category_names_to_blur', type=str, default=None,
-                        help='Comma-separated list of category names to blur (or a single category name, e.g. "person")')
+                        help='Comma-separated list of category names to blur ' + \
+                             '(or a single category name, e.g. "person")')
     parser.add_argument('--remove_empty_folders', action='store_true',
                         help='Remove all empty folders from the target folder at the end of the process, ' + \
                              'whether or not they were created by this script')
     if len(sys.argv[1:])==0:
         parser.print_help()
         parser.exit()
-    args = parser.parse_args()
+    args = parser.parse_args()
     # Convert to an options object
     options = SeparateDetectionsIntoFoldersOptions()
     args_to_object(args, options)
     def validate_threshold(v,name):
@@ -748,27 +763,27 @@ def main():
         if v is not None:
             assert v >= 0.0 and v <= 1.0, \
                 'Illegal {} threshold {}'.format(name,v)
     validate_threshold(args.threshold,'default')
     validate_threshold(args.animal_threshold,'animal')
     validate_threshold(args.vehicle_threshold,'vehicle')
     validate_threshold(args.human_threshold,'human')
     if args.threshold is not None:
         if args.animal_threshold is not None \
             and args.human_threshold is not None \
             and args.vehicle_threshold is not None:
                 raise ValueError('Default threshold specified, but all category thresholds ' + \
                                  'also specified... not exactly wrong, but it\'s likely that you ' + \
-                                 'meant something else.')
+                                 'meant something else.')
     options.category_name_to_threshold['animal'] = args.animal_threshold
     options.category_name_to_threshold['person'] = args.human_threshold
     options.category_name_to_threshold['vehicle'] = args.vehicle_threshold
     options.overwrite = (not args.no_overwrite)
     separate_detections_into_folders(options)
-if __name__ == '__main__':
+if __name__ == '__main__':
     main()

megadetector 5.0.27__py3-none-any.whl → 5.0.29__py3-none-any.whl

Potentially problematic release.

megadetector 5.0.27__py3-none-any.whl → 5.0.29__py3-none-any.whl