PyPI - megadetector - Versions diffs - 5.0.28__py3-none-any.whl → 10.0.0__py3-none-any.whl - Mend

megadetector 5.0.28py3-none-any.whl → 10.0.0py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of megadetector might be problematic. Click here for more details.

Files changed (197) hide show

megadetector/api/batch_processing/integration/digiKam/xmp_integration.py +2 -2
megadetector/api/batch_processing/integration/eMammal/test_scripts/push_annotations_to_emammal.py +1 -1
megadetector/api/batch_processing/integration/eMammal/test_scripts/select_images_for_testing.py +1 -1
megadetector/classification/aggregate_classifier_probs.py +3 -3
megadetector/classification/analyze_failed_images.py +5 -5
megadetector/classification/cache_batchapi_outputs.py +5 -5
megadetector/classification/create_classification_dataset.py +11 -12
megadetector/classification/crop_detections.py +10 -10
megadetector/classification/csv_to_json.py +8 -8
megadetector/classification/detect_and_crop.py +13 -15
megadetector/classification/efficientnet/model.py +8 -8
megadetector/classification/efficientnet/utils.py +6 -5
megadetector/classification/evaluate_model.py +7 -7
megadetector/classification/identify_mislabeled_candidates.py +6 -6
megadetector/classification/json_to_azcopy_list.py +1 -1
megadetector/classification/json_validator.py +29 -32
megadetector/classification/map_classification_categories.py +9 -9
megadetector/classification/merge_classification_detection_output.py +12 -9
megadetector/classification/prepare_classification_script.py +19 -19
megadetector/classification/prepare_classification_script_mc.py +26 -26
megadetector/classification/run_classifier.py +4 -4
megadetector/classification/save_mislabeled.py +6 -6
megadetector/classification/train_classifier.py +1 -1
megadetector/classification/train_classifier_tf.py +9 -9
megadetector/classification/train_utils.py +10 -10
megadetector/data_management/annotations/annotation_constants.py +1 -2
megadetector/data_management/camtrap_dp_to_coco.py +79 -46
megadetector/data_management/cct_json_utils.py +103 -103
megadetector/data_management/cct_to_md.py +49 -49
megadetector/data_management/cct_to_wi.py +33 -33
megadetector/data_management/coco_to_labelme.py +75 -75
megadetector/data_management/coco_to_yolo.py +210 -193
megadetector/data_management/databases/add_width_and_height_to_db.py +86 -12
megadetector/data_management/databases/combine_coco_camera_traps_files.py +40 -40
megadetector/data_management/databases/integrity_check_json_db.py +228 -200
megadetector/data_management/databases/subset_json_db.py +33 -33
megadetector/data_management/generate_crops_from_cct.py +88 -39
megadetector/data_management/get_image_sizes.py +54 -49
megadetector/data_management/labelme_to_coco.py +133 -125
megadetector/data_management/labelme_to_yolo.py +159 -73
megadetector/data_management/lila/create_lila_blank_set.py +81 -83
megadetector/data_management/lila/create_lila_test_set.py +32 -31
megadetector/data_management/lila/create_links_to_md_results_files.py +18 -18
megadetector/data_management/lila/download_lila_subset.py +21 -24
megadetector/data_management/lila/generate_lila_per_image_labels.py +365 -107
megadetector/data_management/lila/get_lila_annotation_counts.py +35 -33
megadetector/data_management/lila/get_lila_image_counts.py +22 -22
megadetector/data_management/lila/lila_common.py +73 -70
megadetector/data_management/lila/test_lila_metadata_urls.py +28 -19
megadetector/data_management/mewc_to_md.py +344 -340
megadetector/data_management/ocr_tools.py +262 -255
megadetector/data_management/read_exif.py +249 -227
megadetector/data_management/remap_coco_categories.py +90 -28
megadetector/data_management/remove_exif.py +81 -21
megadetector/data_management/rename_images.py +187 -187
megadetector/data_management/resize_coco_dataset.py +588 -120
megadetector/data_management/speciesnet_to_md.py +41 -41
megadetector/data_management/wi_download_csv_to_coco.py +55 -55
megadetector/data_management/yolo_output_to_md_output.py +248 -122
megadetector/data_management/yolo_to_coco.py +333 -191
megadetector/detection/change_detection.py +832 -0
megadetector/detection/process_video.py +340 -337
megadetector/detection/pytorch_detector.py +358 -278
megadetector/detection/run_detector.py +399 -186
megadetector/detection/run_detector_batch.py +404 -377
megadetector/detection/run_inference_with_yolov5_val.py +340 -327
megadetector/detection/run_tiled_inference.py +257 -249
megadetector/detection/tf_detector.py +24 -24
megadetector/detection/video_utils.py +332 -295
megadetector/postprocessing/add_max_conf.py +19 -11
megadetector/postprocessing/categorize_detections_by_size.py +45 -45
megadetector/postprocessing/classification_postprocessing.py +468 -433
megadetector/postprocessing/combine_batch_outputs.py +23 -23
megadetector/postprocessing/compare_batch_results.py +590 -525
megadetector/postprocessing/convert_output_format.py +106 -102
megadetector/postprocessing/create_crop_folder.py +347 -147
megadetector/postprocessing/detector_calibration.py +173 -168
megadetector/postprocessing/generate_csv_report.py +508 -499
megadetector/postprocessing/load_api_results.py +48 -27
megadetector/postprocessing/md_to_coco.py +133 -102
megadetector/postprocessing/md_to_labelme.py +107 -90
megadetector/postprocessing/md_to_wi.py +40 -40
megadetector/postprocessing/merge_detections.py +92 -114
megadetector/postprocessing/postprocess_batch_results.py +319 -301
megadetector/postprocessing/remap_detection_categories.py +91 -38
megadetector/postprocessing/render_detection_confusion_matrix.py +214 -205
megadetector/postprocessing/repeat_detection_elimination/find_repeat_detections.py +57 -57
megadetector/postprocessing/repeat_detection_elimination/remove_repeat_detections.py +27 -28
megadetector/postprocessing/repeat_detection_elimination/repeat_detections_core.py +704 -679
megadetector/postprocessing/separate_detections_into_folders.py +226 -211
megadetector/postprocessing/subset_json_detector_output.py +265 -262
megadetector/postprocessing/top_folders_to_bottom.py +45 -45
megadetector/postprocessing/validate_batch_results.py +70 -70
megadetector/taxonomy_mapping/map_lila_taxonomy_to_wi_taxonomy.py +52 -52
megadetector/taxonomy_mapping/map_new_lila_datasets.py +18 -19
megadetector/taxonomy_mapping/prepare_lila_taxonomy_release.py +54 -33
megadetector/taxonomy_mapping/preview_lila_taxonomy.py +67 -67
megadetector/taxonomy_mapping/retrieve_sample_image.py +16 -16
megadetector/taxonomy_mapping/simple_image_download.py +8 -8
megadetector/taxonomy_mapping/species_lookup.py +156 -74
megadetector/taxonomy_mapping/taxonomy_csv_checker.py +14 -14
megadetector/taxonomy_mapping/taxonomy_graph.py +10 -10
megadetector/taxonomy_mapping/validate_lila_category_mappings.py +13 -13
megadetector/utils/ct_utils.py +1049 -211
megadetector/utils/directory_listing.py +21 -77
megadetector/utils/gpu_test.py +22 -22
megadetector/utils/md_tests.py +632 -529
megadetector/utils/path_utils.py +1520 -431
megadetector/utils/process_utils.py +41 -41
megadetector/utils/split_locations_into_train_val.py +62 -62
megadetector/utils/string_utils.py +148 -27
megadetector/utils/url_utils.py +489 -176
megadetector/utils/wi_utils.py +2658 -2526
megadetector/utils/write_html_image_list.py +137 -137
megadetector/visualization/plot_utils.py +34 -30
megadetector/visualization/render_images_with_thumbnails.py +39 -74
megadetector/visualization/visualization_utils.py +487 -435
megadetector/visualization/visualize_db.py +232 -198
megadetector/visualization/visualize_detector_output.py +82 -76
{megadetector-5.0.28.dist-info → megadetector-10.0.0.dist-info}/METADATA +5 -2
megadetector-10.0.0.dist-info/RECORD +139 -0
{megadetector-5.0.28.dist-info → megadetector-10.0.0.dist-info}/WHEEL +1 -1
megadetector/api/batch_processing/api_core/__init__.py +0 -0
megadetector/api/batch_processing/api_core/batch_service/__init__.py +0 -0
megadetector/api/batch_processing/api_core/batch_service/score.py +0 -439
megadetector/api/batch_processing/api_core/server.py +0 -294
megadetector/api/batch_processing/api_core/server_api_config.py +0 -97
megadetector/api/batch_processing/api_core/server_app_config.py +0 -55
megadetector/api/batch_processing/api_core/server_batch_job_manager.py +0 -220
megadetector/api/batch_processing/api_core/server_job_status_table.py +0 -149
megadetector/api/batch_processing/api_core/server_orchestration.py +0 -360
megadetector/api/batch_processing/api_core/server_utils.py +0 -88
megadetector/api/batch_processing/api_core_support/__init__.py +0 -0
megadetector/api/batch_processing/api_core_support/aggregate_results_manually.py +0 -46
megadetector/api/batch_processing/api_support/__init__.py +0 -0
megadetector/api/batch_processing/api_support/summarize_daily_activity.py +0 -152
megadetector/api/batch_processing/data_preparation/__init__.py +0 -0
megadetector/api/synchronous/__init__.py +0 -0
megadetector/api/synchronous/api_core/animal_detection_api/__init__.py +0 -0
megadetector/api/synchronous/api_core/animal_detection_api/api_backend.py +0 -151
megadetector/api/synchronous/api_core/animal_detection_api/api_frontend.py +0 -263
megadetector/api/synchronous/api_core/animal_detection_api/config.py +0 -35
megadetector/api/synchronous/api_core/tests/__init__.py +0 -0
megadetector/api/synchronous/api_core/tests/load_test.py +0 -110
megadetector/data_management/importers/add_nacti_sizes.py +0 -52
megadetector/data_management/importers/add_timestamps_to_icct.py +0 -79
megadetector/data_management/importers/animl_results_to_md_results.py +0 -158
megadetector/data_management/importers/auckland_doc_test_to_json.py +0 -373
megadetector/data_management/importers/auckland_doc_to_json.py +0 -201
megadetector/data_management/importers/awc_to_json.py +0 -191
megadetector/data_management/importers/bellevue_to_json.py +0 -272
megadetector/data_management/importers/cacophony-thermal-importer.py +0 -793
megadetector/data_management/importers/carrizo_shrubfree_2018.py +0 -269
megadetector/data_management/importers/carrizo_trail_cam_2017.py +0 -289
megadetector/data_management/importers/cct_field_adjustments.py +0 -58
megadetector/data_management/importers/channel_islands_to_cct.py +0 -913
megadetector/data_management/importers/eMammal/copy_and_unzip_emammal.py +0 -180
megadetector/data_management/importers/eMammal/eMammal_helpers.py +0 -249
megadetector/data_management/importers/eMammal/make_eMammal_json.py +0 -223
megadetector/data_management/importers/ena24_to_json.py +0 -276
megadetector/data_management/importers/filenames_to_json.py +0 -386
megadetector/data_management/importers/helena_to_cct.py +0 -283
megadetector/data_management/importers/idaho-camera-traps.py +0 -1407
megadetector/data_management/importers/idfg_iwildcam_lila_prep.py +0 -294
megadetector/data_management/importers/import_desert_lion_conservation_camera_traps.py +0 -387
megadetector/data_management/importers/jb_csv_to_json.py +0 -150
megadetector/data_management/importers/mcgill_to_json.py +0 -250
megadetector/data_management/importers/missouri_to_json.py +0 -490
megadetector/data_management/importers/nacti_fieldname_adjustments.py +0 -79
megadetector/data_management/importers/noaa_seals_2019.py +0 -181
megadetector/data_management/importers/osu-small-animals-to-json.py +0 -364
megadetector/data_management/importers/pc_to_json.py +0 -365
megadetector/data_management/importers/plot_wni_giraffes.py +0 -123
megadetector/data_management/importers/prepare_zsl_imerit.py +0 -131
megadetector/data_management/importers/raic_csv_to_md_results.py +0 -416
megadetector/data_management/importers/rspb_to_json.py +0 -356
megadetector/data_management/importers/save_the_elephants_survey_A.py +0 -320
megadetector/data_management/importers/save_the_elephants_survey_B.py +0 -329
megadetector/data_management/importers/snapshot_safari_importer.py +0 -758
megadetector/data_management/importers/snapshot_serengeti_lila.py +0 -1067
megadetector/data_management/importers/snapshotserengeti/make_full_SS_json.py +0 -150
megadetector/data_management/importers/snapshotserengeti/make_per_season_SS_json.py +0 -153
megadetector/data_management/importers/sulross_get_exif.py +0 -65
megadetector/data_management/importers/timelapse_csv_set_to_json.py +0 -490
megadetector/data_management/importers/ubc_to_json.py +0 -399
megadetector/data_management/importers/umn_to_json.py +0 -507
megadetector/data_management/importers/wellington_to_json.py +0 -263
megadetector/data_management/importers/wi_to_json.py +0 -442
megadetector/data_management/importers/zamba_results_to_md_results.py +0 -180
megadetector/data_management/lila/add_locations_to_island_camera_traps.py +0 -101
megadetector/data_management/lila/add_locations_to_nacti.py +0 -151
megadetector/utils/azure_utils.py +0 -178
megadetector/utils/sas_blob_utils.py +0 -509
megadetector-5.0.28.dist-info/RECORD +0 -209
/megadetector/{api/batch_processing/__init__.py → __init__.py} +0 -0
{megadetector-5.0.28.dist-info → megadetector-10.0.0.dist-info}/licenses/LICENSE +0 -0
{megadetector-5.0.28.dist-info → megadetector-10.0.0.dist-info}/top_level.txt +0 -0

megadetector/visualization/visualization_utils.py CHANGED Viewed

@@ -96,7 +96,7 @@ DEFAULT_COLORS = [
 def open_image(input_file, ignore_exif_rotation=False):
     """
     Opens an image in binary format using PIL.Image and converts to RGB mode.
     Supports local files or URLs.
     This operation is lazy; image will not be actually loaded until the first
@@ -112,7 +112,7 @@ def open_image(input_file, ignore_exif_rotation=False):
     Returns:
         PIL.Image.Image: A PIL Image object in RGB mode
     """
     if (isinstance(input_file, str)
             and input_file.startswith(('http://', 'https://'))):
         try:
@@ -124,7 +124,7 @@ def open_image(input_file, ignore_exif_rotation=False):
                 for i_retry in range(0,n_retries):
                     try:
                         time.sleep(retry_sleep_time)
-                        response = requests.get(input_file)
+                        response = requests.get(input_file)
                     except Exception as e:
                         print(f'Error retrieving image {input_file} on retry {i_retry}: {e}')
                         continue
@@ -141,7 +141,7 @@ def open_image(input_file, ignore_exif_rotation=False):
     else:
         image = Image.open(input_file)
     # Convert to RGB if necessary
     if image.mode not in ('RGBA', 'RGB', 'L', 'I;16'):
         raise AttributeError(
@@ -158,11 +158,11 @@ def open_image(input_file, ignore_exif_rotation=False):
         #
         try:
             exif = image._getexif()
-            orientation: int = exif.get(274, None)
+            orientation: int = exif.get(274, None)
             if (orientation is not None) and (orientation != EXIF_IMAGE_NO_ROTATION):
                 assert orientation in EXIF_IMAGE_ROTATIONS, \
                     'Mirrored rotations are not supported'
-                image = image.rotate(EXIF_IMAGE_ROTATIONS[orientation], expand=True)
+                image = image.rotate(EXIF_IMAGE_ROTATIONS[orientation], expand=True)
         except Exception:
             pass
@@ -175,90 +175,95 @@ def exif_preserving_save(pil_image,output_file,quality='keep',default_quality=85
     """
     Saves [pil_image] to [output_file], making a moderate attempt to preserve EXIF
     data and JPEG quality.  Neither is guaranteed.
     Also see:
     https://discuss.dizzycoding.com/determining-jpg-quality-in-python-pil/
     ...for more ways to preserve jpeg quality if quality='keep' doesn't do the trick.
     Args:
         pil_image (Image): the PIL Image object to save
         output_file (str): the destination file
-        quality (str or int, optional): can be "keep" (default), or an integer from 0 to 100.
+        quality (str or int, optional): can be "keep" (default), or an integer from 0 to 100.
             This is only used if PIL thinks the the source image is a JPEG.  If you load a JPEG
             and resize it in memory, for example, it's no longer a JPEG.
-        default_quality (int, optional): determines output quality when quality == 'keep' and we are
+        default_quality (int, optional): determines output quality when quality == 'keep' and we are
             saving a non-JPEG source to a JPEG file
         verbose (bool, optional): enable additional debug console output
     """
     # Read EXIF metadata
     exif = pil_image.info['exif'] if ('exif' in pil_image.info) else None
     # Quality preservation is only supported for JPEG sources.
     if pil_image.format != "JPEG":
         if quality == 'keep':
             if verbose:
                 print('Warning: quality "keep" passed when saving a non-JPEG source (during save to {})'.format(
                     output_file))
-            quality = default_quality
-    # Some output formats don't support the quality parameter, so we try once with,
+            quality = default_quality
+    # Some output formats don't support the quality parameter, so we try once with,
     # and once without.  This is a horrible cascade of if's, but it's a consequence of
     # the fact that "None" is not supported for either "exif" or "quality".
     try:
         if exif is not None:
             pil_image.save(output_file, exif=exif, quality=quality)
         else:
             pil_image.save(output_file, quality=quality)
     except Exception:
         if verbose:
             print('Warning: failed to write {}, trying again without quality parameter'.format(output_file))
         if exif is not None:
-            pil_image.save(output_file, exif=exif)
+            pil_image.save(output_file, exif=exif)
         else:
             pil_image.save(output_file)
 # ...def exif_preserving_save(...)
 def load_image(input_file, ignore_exif_rotation=False):
     """
-    Loads an image file.  This is the non-lazy version of open_file(); i.e.,
+    Loads an image file.  This is the non-lazy version of open_file(); i.e.,
     it forces image decoding before returning.
     Args:
         input_file (str or BytesIO): can be a path to an image file (anything
             that PIL can open), a URL, or an image as a stream of bytes
         ignore_exif_rotation (bool, optional): don't rotate the loaded pixels,
             even if we are loading a JPEG and that JPEG says it should be rotated
-    Returns:
+    Returns:
         PIL.Image.Image: a PIL Image object in RGB mode
     """
     image = open_image(input_file, ignore_exif_rotation=ignore_exif_rotation)
     image.load()
     return image
-def resize_image(image, target_width=-1, target_height=-1, output_file=None,
-                 no_enlarge_width=False, verbose=False, quality='keep'):
+def resize_image(image,
+                 target_width=-1,
+                 target_height=-1,
+                 output_file=None,
+                 no_enlarge_width=False,
+                 verbose=False,
+                 quality='keep'):
     """
     Resizes a PIL Image object to the specified width and height; does not resize
     in place. If either width or height are -1, resizes with aspect ratio preservation.
-    If target_width and target_height are both -1, does not modify the image, but
+    If target_width and target_height are both -1, does not modify the image, but
     will write to output_file if supplied.
-    If no resizing is required, and an Image object is supplied, returns the original Image
+    If no resizing is required, and an Image object is supplied, returns the original Image
     object (i.e., does not copy).
     Args:
         image (Image or str): PIL Image object or a filename (local file or URL)
         target_width (int, optional): width to which we should resize this image, or -1
@@ -267,14 +272,14 @@ def resize_image(image, target_width=-1, target_height=-1, output_file=None,
             to let target_width determine the size
         output_file (str, optional): file to which we should save this image; if None,
             just returns the image without saving
-        no_enlarge_width (bool, optional): if [no_enlarge_width] is True, and
-            [target width] is larger than the original image width, does not modify the image,
+        no_enlarge_width (bool, optional): if [no_enlarge_width] is True, and
+            [target width] is larger than the original image width, does not modify the image,
             but will write to output_file if supplied
         verbose (bool, optional): enable additional debug output
         quality (str or int, optional): passed to exif_preserving_save, see docs for more detail
-    returns:
-        PIL.Image.Image: the resized image, which may be the original image if no resizing is
+    Returns:
+        PIL.Image.Image: the resized image, which may be the original image if no resizing is
             required
     """
@@ -282,20 +287,20 @@ def resize_image(image, target_width=-1, target_height=-1, output_file=None,
     if isinstance(image,str):
         image_fn = image
         image = load_image(image)
     if target_width is None:
         target_width = -1
     if target_height is None:
         target_height = -1
     resize_required = True
     # No resize was requested, this is always a no-op
     if target_width == -1 and target_height == -1:
         resize_required = False
     # Does either dimension need to scale according to the other?
     elif target_width == -1 or target_height == -1:
@@ -309,42 +314,42 @@ def resize_image(image, target_width=-1, target_height=-1, output_file=None,
         else:
             # w = ar * h
             target_width = int(aspect_ratio * target_height)
     # If we're not enlarging images and this would be an enlarge operation
     if (no_enlarge_width) and (target_width > image.size[0]):
         if verbose:
             print('Bypassing image enlarge for {} --> {}'.format(
                 image_fn,str(output_file)))
         resize_required = False
     # If the target size is the same as the original size
     if (target_width == image.size[0]) and (target_height == image.size[1]):
-        resize_required = False
+        resize_required = False
     if not resize_required:
         if output_file is not None:
             if verbose:
                 print('No resize required for resize {} --> {}'.format(
                     image_fn,str(output_file)))
             exif_preserving_save(image,output_file,quality=quality,verbose=verbose)
         return image
     assert target_width > 0 and target_height > 0, \
         'Invalid image resize target {},{}'.format(target_width,target_height)
-    # The antialiasing parameter changed between Pillow versions 9 and 10, and for a bit,
+    # The antialiasing parameter changed between Pillow versions 9 and 10, and for a bit,
     # I'd like to support both.
     try:
         resized_image = image.resize((target_width, target_height), Image.ANTIALIAS)
-    except:
+    except Exception:
         resized_image = image.resize((target_width, target_height), Image.Resampling.LANCZOS)
     if output_file is not None:
         exif_preserving_save(resized_image,output_file,quality=quality,verbose=verbose)
     return resized_image
 # ...def resize_image(...)
@@ -357,28 +362,28 @@ def crop_image(detections, image, confidence_threshold=0.15, expansion=0):
     Args:
         detections (list): a list of dictionaries with keys 'conf' and 'bbox';
-            boxes are length-four arrays formatted as [x,y,w,h], normalized,
+            boxes are length-four arrays formatted as [x,y,w,h], normalized,
             upper-left origin (this is the standard MD detection format)
         image (Image or str): the PIL Image object from which we should crop detections,
             or an image filename
         confidence_threshold (float, optional): only crop detections above this threshold
         expansion (int, optional): a number of pixels to include on each side of a cropped
             detection
     Returns:
-        list: a possibly-empty list of PIL Image objects
+        list: a possibly-empty list of PIL Image objects
     """
     ret_images = []
     if isinstance(image,str):
         image = load_image(image)
     for detection in detections:
         score = float(detection['conf'])
-        if score >= confidence_threshold:
+        if (confidence_threshold is None) or (score >= confidence_threshold):
             x1, y1, w_box, h_box = detection['bbox']
             ymin,xmin,ymax,xmax = y1, x1, y1 + h_box, x1 + w_box
@@ -417,17 +422,18 @@ def blur_detections(image,detections,blur_radius=40):
     """
     Blur the regions in [image] corresponding to the MD-formatted list [detections].
     [image] is modified in place.
     Args:
         image (PIL.Image.Image): image in which we should blur specific regions
         detections (list): list of detections in the MD output format, see render
             detection_bounding_boxes for more detail.
+        blur_radius (int, optional): radius of blur kernel in pixels
     """
     img_width, img_height = image.size
     for d in detections:
         bbox = d['bbox']
         x_norm, y_norm, width_norm, height_norm = bbox
@@ -436,29 +442,29 @@ def blur_detections(image,detections,blur_radius=40):
         y = int(y_norm * img_height)
         width = int(width_norm * img_width)
         height = int(height_norm * img_height)
         # Calculate box boundaries
         left = max(0, x)
         top = max(0, y)
         right = min(img_width, x + width)
         bottom = min(img_height, y + height)
         # Crop the region, blur it, and paste it back
         region = image.crop((left, top, right, bottom))
         blurred_region = region.filter(ImageFilter.GaussianBlur(radius=blur_radius))
         image.paste(blurred_region, (left, top))
     # ...for each detection
 # ...def blur_detections(...)
-def render_detection_bounding_boxes(detections,
+def render_detection_bounding_boxes(detections,
                                     image,
                                     label_map='show_categories',
-                                    classification_label_map=None,
-                                    confidence_threshold=0,
-                                    thickness=DEFAULT_BOX_THICKNESS,
+                                    classification_label_map=None,
+                                    confidence_threshold=0.0,
+                                    thickness=DEFAULT_BOX_THICKNESS,
                                     expansion=0,
                                     classification_confidence_threshold=0.3,
                                     max_classifications=3,
@@ -472,17 +478,16 @@ def render_detection_bounding_boxes(detections,
     """
     Renders bounding boxes (with labels and confidence values) on an image for all
     detections above a threshold.
     Renders classification labels if present.
     [image] is modified in place.
     Args:
         detections (list): list of detections in the MD output format, for example:
             .. code-block::none
                 [
                     {
                         "category": "2",
@@ -495,15 +500,15 @@ def render_detection_bounding_boxes(detections,
                         ]
                     }
                 ]
                 ...where the bbox coordinates are [x, y, box_width, box_height].
                 (0, 0) is the upper-left.  Coordinates are normalized.
             Supports classification results, in the standard format:
             .. code-block::none
                 [
                     {
                         "category": "2",
@@ -523,30 +528,30 @@ def render_detection_bounding_boxes(detections,
                 ]
         image (PIL.Image.Image): image on which we should render detections
-        label_map (dict, optional): optional, mapping the numeric label to a string name. The type of the
-            numeric label (typically strings) needs to be consistent with the keys in label_map; no casting is
-            carried out. If [label_map] is None, no labels are shown (not even numbers and confidence values).
-            If you want category numbers and confidence values without class labels, use the default value,
+        label_map (dict, optional): optional, mapping the numeric label to a string name. The type of the
+            numeric label (typically strings) needs to be consistent with the keys in label_map; no casting is
+            carried out. If [label_map] is None, no labels are shown (not even numbers and confidence values).
+            If you want category numbers and confidence values without class labels, use the default value,
             the string 'show_categories'.
-        classification_label_map (dict, optional): optional, mapping of the string class labels to the actual
-            class names. The type of the numeric label (typically strings) needs to be consistent with the keys
-            in label_map; no casting is  carried out. If [label_map] is None, no labels are shown (not even numbers
+        classification_label_map (dict, optional): optional, mapping of the string class labels to the actual
+            class names. The type of the numeric label (typically strings) needs to be consistent with the keys
+            in label_map; no casting is  carried out. If [label_map] is None, no labels are shown (not even numbers
             and confidence values).
-        confidence_threshold (float or dict, optional), threshold above which boxes are rendered.  Can also be a
-            dictionary mapping category IDs to thresholds.
-        thickness (int, optional): line thickness in pixels
-        expansion (int, optional): number of pixels to expand bounding boxes on each side
-        classification_confidence_threshold (float, optional): confidence above which classification results
-            are displayed
-        max_classifications (int, optional): maximum number of classification results rendered for one image
+        confidence_threshold (float or dict, optional): threshold above which boxes are rendered.  Can also be a
+            dictionary mapping category IDs to thresholds.
+        thickness (int, optional): line thickness in pixels
+        expansion (int, optional): number of pixels to expand bounding boxes on each side
+        classification_confidence_threshold (float, optional): confidence above which classification results
+            are displayed
+        max_classifications (int, optional): maximum number of classification results rendered for one image
         colormap (list, optional): list of color names, used to choose colors for categories by
-            indexing with the values in [classes]; defaults to a reasonable set of colors
-        textalign (int, optional): TEXTALIGN_LEFT, TEXTALIGN_CENTER, or TEXTALIGN_RIGHT
-        vtextalign (int, optional): VTEXTALIGN_TOP or VTEXTALIGN_BOTTOM
-        label_font_size (float, optional): font size for labels
-        custom_strings: optional set of strings to append to detection labels, should have the
-            same length as [detections].  Appended before any classification labels.
-        box_sort_order (str, optional): sorting scheme for detection boxes, can be None, "confidence", or
+            indexing with the values in [classes]; defaults to a reasonable set of colors
+        textalign (int, optional): TEXTALIGN_LEFT, TEXTALIGN_CENTER, or TEXTALIGN_RIGHT
+        vtextalign (int, optional): VTEXTALIGN_TOP or VTEXTALIGN_BOTTOM
+        label_font_size (float, optional): font size for labels
+        custom_strings (list of str, optional): optional set of strings to append to detection labels, should
+            have the same length as [detections].  Appended before any classification labels.
+        box_sort_order (str, optional): sorting scheme for detection boxes, can be None, "confidence", or
             "reverse_confidence".
         verbose (bool, optional): enable additional debug output
     """
@@ -554,52 +559,52 @@ def render_detection_bounding_boxes(detections,
     # Input validation
     if (label_map is not None) and (isinstance(label_map,str)) and (label_map == 'show_categories'):
         label_map = {}
     if custom_strings is not None:
         assert len(custom_strings) == len(detections), \
             '{} custom strings provided for {} detections'.format(
                 len(custom_strings),len(detections))
     display_boxes = []
     # list of lists, one list of strings for each bounding box (to accommodate multiple labels)
-    display_strs = []
+    display_strs = []
     # for color selection
-    classes = []
+    classes = []
     if box_sort_order is not None:
-        if box_sort_order == 'confidence':
+        if box_sort_order == 'confidence':
             detections = sort_list_of_dicts_by_key(detections,k='conf',reverse=False)
         elif box_sort_order == 'reverse_confidence':
             detections = sort_list_of_dicts_by_key(detections,k='conf',reverse=True)
         else:
             raise ValueError('Unrecognized sorting scheme {}'.format(box_sort_order))
     for i_detection,detection in enumerate(detections):
         score = detection['conf']
         if isinstance(confidence_threshold,dict):
             rendering_threshold = confidence_threshold[detection['category']]
         else:
-            rendering_threshold = confidence_threshold
+            rendering_threshold = confidence_threshold
         # Always render objects with a confidence of "None", this is typically used
-        # for ground truth data.
-        if score is None or score >= rendering_threshold:
+        # for ground truth data.
+        if (score is None) or (rendering_threshold is None) or (score >= rendering_threshold):
             x1, y1, w_box, h_box = detection['bbox']
             display_boxes.append([y1, x1, y1 + h_box, x1 + w_box])
             # The class index to use for coloring this box, which may be based on the detection
             # category or on the most confident classification category.
             clss = detection['category']
-            # This will be a list of strings that should be rendered above/below this box
+            # This will be a list of strings that should be rendered above/below this box
             displayed_label = []
             if label_map is not None:
                 label = label_map[clss] if clss in label_map else clss
                 if score is not None:
@@ -618,27 +623,27 @@ def render_detection_bounding_boxes(detections,
             if ('classifications' in detection) and len(detection['classifications']) > 0:
                 classifications = detection['classifications']
                 if len(classifications) > max_classifications:
                     classifications = classifications[0:max_classifications]
                 max_classification_category = 0
                 max_classification_conf = -100
                 for classification in classifications:
                     classification_conf = classification[1]
                     if classification_conf is None or \
                        classification_conf < classification_confidence_threshold:
                         continue
                     class_key = classification[0]
                     # Is this the most confident classification for this detection?
                     if classification_conf > max_classification_conf:
                         max_classification_conf = classification_conf
                         max_classification_category = int(class_key)
                     if (classification_label_map is not None) and (class_key in classification_label_map):
                         class_name = classification_label_map[class_key]
                     else:
@@ -647,15 +652,15 @@ def render_detection_bounding_boxes(detections,
                         displayed_label += ['{}: {:5.1%}'.format(class_name.lower(), classification_conf)]
                     else:
                         displayed_label += ['{}'.format(class_name.lower())]
                 # ...for each classification
                 # To avoid duplicate colors with detection-only visualization, offset
                 # the classification class index by the number of detection classes
                 clss = annotation_constants.NUM_DETECTOR_CATEGORIES + max_classification_category
             # ...if we have classification results
             # display_strs is a list of labels for each box
             display_strs.append(displayed_label)
             classes.append(clss)
@@ -663,16 +668,21 @@ def render_detection_bounding_boxes(detections,
         # ...if the confidence of this detection is above threshold
     # ...for each detection
     display_boxes = np.array(display_boxes)
     if verbose:
         print('Rendering {} of {} detections'.format(len(display_boxes),len(detections)))
-    draw_bounding_boxes_on_image(image, display_boxes, classes,
-                                 display_strs=display_strs, thickness=thickness,
-                                 expansion=expansion, colormap=colormap,
-                                 textalign=textalign, vtextalign=vtextalign,
+    draw_bounding_boxes_on_image(image,
+                                 display_boxes,
+                                 classes,
+                                 display_strs=display_strs,
+                                 thickness=thickness,
+                                 expansion=expansion,
+                                 colormap=colormap,
+                                 textalign=textalign,
+                                 vtextalign=vtextalign,
                                  label_font_size=label_font_size)
 # ...render_detection_bounding_boxes(...)
@@ -693,13 +703,12 @@ def draw_bounding_boxes_on_image(image,
     Draws bounding boxes on an image.  Modifies the image in place.
     Args:
         image (PIL.Image): the image on which we should draw boxes
-        boxes (np.array): a two-dimensional numpy array of size [N, 4], where N is the
+        boxes (np.array): a two-dimensional numpy array of size [N, 4], where N is the
             number of boxes, and each row is (ymin, xmin, ymax, xmax).  Coordinates should be
             normalized to image height/width.
         classes (list): a list of ints or string-formatted ints corresponding to the
-             class labels of the boxes. This is only used for color selection.  Should have the same
+             class labels of the boxes. This is only used for color selection.  Should have the same
              length as [boxes].
         thickness (int, optional): line thickness in pixels
         expansion (int, optional): number of pixels to expand bounding boxes on each side
@@ -741,29 +750,29 @@ def get_text_size(font,s):
     """
     Get the expected width and height when rendering the string [s] in the font
     [font].
     Args:
         font (PIL.ImageFont): the font whose size we should query
         s (str): the string whose size we should query
     Returns:
-        tuple: (w,h), both floats in pixel coordinates
+        tuple: (w,h), both floats in pixel coordinates
     """
     # This is what we did w/Pillow 9
     # w,h = font.getsize(s)
     # I would *think* this would be the equivalent for Pillow 10
     # l,t,r,b = font.getbbox(s); w = r-l; h=b-t
     # ...but this actually produces the most similar results to Pillow 9
     # l,t,r,b = font.getbbox(s); w = r; h=b
     try:
-        l,t,r,b = font.getbbox(s); w = r; h=b
+        l,t,r,b = font.getbbox(s); w = r; h=b # noqa
     except Exception:
         w,h = font.getsize(s)
     return w,h
@@ -779,7 +788,7 @@ def draw_bounding_box_on_image(image,
                                use_normalized_coordinates=True,
                                label_font_size=DEFAULT_LABEL_FONT_SIZE,
                                colormap=None,
-                               textalign=TEXTALIGN_LEFT,
+                               textalign=TEXTALIGN_LEFT,
                                vtextalign=VTEXTALIGN_TOP,
                                text_rotation=None):
     """
@@ -794,9 +803,9 @@ def draw_bounding_box_on_image(image,
     are displayed below the bounding box.
     Adapted from:
     https://github.com/tensorflow/models/blob/master/research/object_detection/utils/visualization_utils.py
     Args:
         image (PIL.Image.Image): the image on which we should draw a box
         ymin (float): ymin of bounding box
@@ -807,24 +816,24 @@ def draw_bounding_box_on_image(image,
             a color; should be either an integer or a string-formatted integer
         thickness (int, optional): line thickness in pixels
         expansion (int, optional): number of pixels to expand bounding boxes on each side
-        display_str_list (list, optional): list of strings to display above the box (each to be shown on its
+        display_str_list (list, optional): list of strings to display above the box (each to be shown on its
             own line)
-        use_normalized_coordinates (bool, optional): if True (default), treat coordinates
+        use_normalized_coordinates (bool, optional): if True (default), treat coordinates
             ymin, xmin, ymax, xmax as relative to the image, otherwise coordinates as absolute pixel values
-        label_font_size (float, optional): font size
+        label_font_size (float, optional): font size
         colormap (list, optional): list of color names, used to choose colors for categories by
             indexing with the values in [classes]; defaults to a reasonable set of colors
-        textalign (int, optional): TEXTALIGN_LEFT, TEXTALIGN_CENTER, or TEXTALIGN_RIGHT
+        textalign (int, optional): TEXTALIGN_LEFT, TEXTALIGN_CENTER, or TEXTALIGN_RIGHT
         vtextalign (int, optional): VTEXTALIGN_TOP or VTEXTALIGN_BOTTOM
         text_rotation (float, optional): rotation to apply to text
     """
     if colormap is None:
         colormap = DEFAULT_COLORS
     if display_str_list is None:
         display_str_list = []
     if clss is None:
         # Default to the MegaDetector animal class ID (1)
         color = colormap[1]
@@ -840,12 +849,12 @@ def draw_bounding_box_on_image(image,
         (left, right, top, bottom) = (xmin, xmax, ymin, ymax)
     if expansion > 0:
         left -= expansion
         right += expansion
         top -= expansion
         bottom += expansion
         # Deliberately trimming to the width of the image only in the case where
         # box expansion is turned on.  There's not an obvious correct behavior here,
         # but the thinking is that if the caller provided an out-of-range bounding
@@ -861,9 +870,9 @@ def draw_bounding_box_on_image(image,
         left = min(left,im_width-1); right = min(right,im_width-1)
         top = min(top,im_height-1); bottom = min(bottom,im_height-1)
     # ...if we need to expand boxes
     draw.line([(left, top), (left, bottom), (right, bottom),
                (right, top), (left, top)], width=thickness, fill=color)
@@ -871,52 +880,52 @@ def draw_bounding_box_on_image(image,
         try:
             font = ImageFont.truetype('arial.ttf', label_font_size)
-        except IOError:
+        except OSError:
             font = ImageFont.load_default()
         display_str_heights = [get_text_size(font,ds)[1] for ds in display_str_list]
         # Each display_str has a top and bottom margin of 0.05x.
         total_display_str_height = (1 + 2 * 0.05) * sum(display_str_heights)
         # Reverse list and print from bottom to top
         for i_str,display_str in enumerate(display_str_list[::-1]):
             # Skip empty strings
             if len(display_str) == 0:
                 continue
-            text_width, text_height = get_text_size(font,display_str)
+            text_width, text_height = get_text_size(font,display_str)
             margin = int(np.ceil(0.05 * text_height))
             if text_rotation is not None and text_rotation != 0:
                 assert text_rotation == -90, \
                     'Only -90-degree text rotation is supported'
                 image_tmp = Image.new('RGB',(text_width+2*margin,text_height+2*margin))
                 image_tmp_draw = ImageDraw.Draw(image_tmp)
                 image_tmp_draw.rectangle([0,0,text_width+2*margin,text_height+2*margin],fill=color)
                 image_tmp_draw.text( (margin,margin), display_str, font=font, fill='black')
                 rotated_text = image_tmp.rotate(text_rotation,expand=1)
                 if textalign == TEXTALIGN_RIGHT:
                     text_left = right
                 else:
                     text_left = left
                 text_left = int(text_left + (text_height) * i_str)
                 if vtextalign == VTEXTALIGN_BOTTOM:
                     text_top = bottom - text_width
                 else:
                     text_top = top
                 text_left = int(text_left)
-                text_top = int(text_top)
+                text_top = int(text_top)
                 image.paste(rotated_text,[text_left,text_top])
             else:
                 # If the total height of the display strings added to the top of the bounding
                 # box exceeds the top of the image, stack the strings below the bounding box
                 # instead of above, and vice-versa if we're bottom-aligning.
@@ -933,32 +942,32 @@ def draw_bounding_box_on_image(image,
                     text_bottom = bottom + total_display_str_height
                     if (text_bottom + total_display_str_height) > im_height:
                         text_bottom = top
                 text_bottom = int(text_bottom) - i_str * (int(text_height + (2 * margin)))
                 text_left = left
                 if textalign == TEXTALIGN_RIGHT:
                     text_left = right - text_width
                 elif textalign == TEXTALIGN_CENTER:
                     text_left = ((right + left) / 2.0) - (text_width / 2.0)
-                text_left = int(text_left)
+                text_left = int(text_left)
                 draw.rectangle(
                     [(text_left, (text_bottom - text_height) - (2 * margin)),
                      (text_left + text_width, text_bottom)],
                     fill=color)
                 draw.text(
                     (text_left + margin, text_bottom - text_height - margin),
                     display_str,
                     fill='black',
                     font=font)
-            # ...if we're rotating text
+            # ...if we're rotating text
     # ...if we're rendering text
 # ...def draw_bounding_box_on_image(...)
@@ -966,9 +975,9 @@ def render_megadb_bounding_boxes(boxes_info, image):
     """
     Render bounding boxes to an image, where those boxes are in the mostly-deprecated
     MegaDB format, which looks like:
     .. code-block::none
         {
             "category": "animal",
             "bbox": [
@@ -977,16 +986,16 @@ def render_megadb_bounding_boxes(boxes_info, image):
                 0.187,
                 0.198
             ]
-        }
+        }
     Args:
         boxes_info (list): list of dicts, each dict represents a single detection
             where bbox coordinates are normalized [x_min, y_min, width, height]
         image (PIL.Image.Image): image to modify
     :meta private:
     """
     display_boxes = []
     display_strs = []
     classes = []  # ints, for selecting colors
@@ -1006,32 +1015,34 @@ def render_megadb_bounding_boxes(boxes_info, image):
 def render_db_bounding_boxes(boxes,
-                             classes,
-                             image,
+                             classes,
+                             image,
                              original_size=None,
-                             label_map=None,
-                             thickness=DEFAULT_BOX_THICKNESS,
+                             label_map=None,
+                             thickness=DEFAULT_BOX_THICKNESS,
                              expansion=0,
                              colormap=None,
                              textalign=TEXTALIGN_LEFT,
                              vtextalign=VTEXTALIGN_TOP,
                              text_rotation=None,
                              label_font_size=DEFAULT_LABEL_FONT_SIZE,
-                             tags=None):
+                             tags=None,
+                             boxes_are_normalized=False):
     """
     Render bounding boxes (with class labels) on an image.  This is a wrapper for
     draw_bounding_boxes_on_image, allowing the caller to operate on a resized image
     by providing the original size of the image; boxes will be scaled accordingly.
     This function assumes that bounding boxes are in absolute coordinates, typically
-    because they come from COCO camera traps .json files.
+    because they come from COCO camera traps .json files, unless boxes_are_normalized
+    is True.
     Args:
         boxes (list): list of length-4 tuples, foramtted as (x,y,w,h) (in pixels)
         classes (list): list of ints (or string-formatted ints), used to choose labels (either
             by literally rendering the class labels, or by indexing into [label_map])
         image (PIL.Image.Image): image object to modify
-        original_size (tuple, optional): if this is not None, and the size is different than
+        original_size (tuple, optional): if this is not None, and the size is different than
             the size of [image], we assume that [boxes] refer to the original size, and we scale
             them accordingly before rendering
         label_map (dict, optional): int --> str dictionary, typically mapping category IDs to
@@ -1047,6 +1058,7 @@ def render_db_bounding_boxes(boxes,
         label_font_size (float, optional): font size for labels
         tags (list, optional): list of strings of length len(boxes) that should be appended
             after each class name (e.g. to show scores)
+        boxes_are_normalized (bool, optional): whether boxes have already been normalized
     """
     display_boxes = []
@@ -1063,38 +1075,48 @@ def render_db_bounding_boxes(boxes,
         box = boxes[i_box]
         clss = classes[i_box]
         x_min_abs, y_min_abs, width_abs, height_abs = box[0:4]
-        ymin = y_min_abs / img_height
-        ymax = ymin + height_abs / img_height
+        # Normalize boxes if necessary
+        if boxes_are_normalized:
-        xmin = x_min_abs / img_width
-        xmax = xmin + width_abs / img_width
+            xmin = x_min_abs
+            xmax = x_min_abs + width_abs
+            ymin = y_min_abs
+            ymax = y_min_abs + height_abs
+        else:
+            ymin = y_min_abs / img_height
+            ymax = ymin + height_abs / img_height
+            xmin = x_min_abs / img_width
+            xmax = xmin + width_abs / img_width
         display_boxes.append([ymin, xmin, ymax, xmax])
         if label_map:
             clss = label_map[int(clss)]
         display_str = str(clss)
         # Do we have a tag to append to the class string?
         if tags is not None and tags[i_box] is not None and len(tags[i_box]) > 0:
             display_str += ' ' + tags[i_box]
         # need to be a string here because PIL needs to iterate through chars
         display_strs.append([display_str])
     # ...for each box
     display_boxes = np.array(display_boxes)
-    draw_bounding_boxes_on_image(image,
-                                 display_boxes,
-                                 classes,
+    draw_bounding_boxes_on_image(image,
+                                 display_boxes,
+                                 classes,
                                  display_strs=display_strs,
-                                 thickness=thickness,
+                                 thickness=thickness,
                                  expansion=expansion,
                                  colormap=colormap,
                                  textalign=textalign,
@@ -1105,12 +1127,12 @@ def render_db_bounding_boxes(boxes,
 # ...def render_db_bounding_boxes(...)
-def draw_bounding_boxes_on_file(input_file,
-                                output_file,
-                                detections,
+def draw_bounding_boxes_on_file(input_file,
+                                output_file,
+                                detections,
                                 confidence_threshold=0.0,
                                 detector_label_map=DEFAULT_DETECTOR_LABEL_MAP,
-                                thickness=DEFAULT_BOX_THICKNESS,
+                                thickness=DEFAULT_BOX_THICKNESS,
                                 expansion=0,
                                 colormap=None,
                                 label_font_size=DEFAULT_LABEL_FONT_SIZE,
@@ -1118,17 +1140,19 @@ def draw_bounding_boxes_on_file(input_file,
                                 target_size=None,
                                 ignore_exif_rotation=False):
     """
-    Renders detection bounding boxes on an image loaded from file, optionally writing the results to
+    Renders detection bounding boxes on an image loaded from file, optionally writing the results to
     a new image file.
     Args:
         input_file (str): filename or URL to load
-        output_file (str, optional): filename to which we should write the rendered image
+        output_file (str): filename to which we should write the rendered image
         detections (list): a list of dictionaries with keys 'conf', 'bbox', and 'category';
-            boxes are length-four arrays formatted as [x,y,w,h], normalized,
+            boxes are length-four arrays formatted as [x,y,w,h], normalized,
             upper-left origin (this is the standard MD detection format). 'category' is a string-int.
-        detector_label_map (dict, optional): a dict mapping category IDs to strings.  If this
-            is None, no confidence values or identifiers are shown.  If this is {}, just category
+        confidence_threshold (float, optional): only render detections with confidence above this
+            threshold
+        detector_label_map (dict, optional): a dict mapping category IDs to strings.  If this
+            is None, no confidence values or identifiers are shown.  If this is {}, just category
             indices and confidence values are shown.
         thickness (int, optional): line width in pixels for box rendering
         expansion (int, optional): box expansion in pixels
@@ -1141,45 +1165,50 @@ def draw_bounding_boxes_on_file(input_file,
             see resize_image() for documentation.  If None or (-1,-1), uses the original image size.
         ignore_exif_rotation (bool, optional): don't rotate the loaded pixels,
             even if we are loading a JPEG and that JPEG says it should be rotated.
     Returns:
         PIL.Image.Image: loaded and modified image
     """
     image = open_image(input_file, ignore_exif_rotation=ignore_exif_rotation)
     if target_size is not None:
         image = resize_image(image,target_size[0],target_size[1])
     render_detection_bounding_boxes(
-            detections, image, label_map=detector_label_map,
+            detections,
+            image,
+            label_map=detector_label_map,
             confidence_threshold=confidence_threshold,
-            thickness=thickness,expansion=expansion,colormap=colormap,
-            custom_strings=custom_strings,label_font_size=label_font_size)
+            thickness=thickness,
+            expansion=expansion,
+            colormap=colormap,
+            custom_strings=custom_strings,
+            label_font_size=label_font_size)
     if output_file is not None:
         image.save(output_file)
     return image
-def draw_db_boxes_on_file(input_file,
-                          output_file,
-                          boxes,
-                          classes=None,
-                          label_map=None,
-                          thickness=DEFAULT_BOX_THICKNESS,
+def draw_db_boxes_on_file(input_file,
+                          output_file,
+                          boxes,
+                          classes=None,
+                          label_map=None,
+                          thickness=DEFAULT_BOX_THICKNESS,
                           expansion=0,
                           ignore_exif_rotation=False):
     """
-    Render COCO-formatted bounding boxes (in absolute coordinates) on an image loaded from file,
+    Render COCO-formatted bounding boxes (in absolute coordinates) on an image loaded from file,
     writing the results to a new image file.
     Args:
         input_file (str): image file to read
         output_file (str): image file to write
         boxes (list): list of length-4 tuples, foramtted as (x,y,w,h) (in pixels)
-        classes (list, optional): list of ints (or string-formatted ints), used to choose
+        classes (list, optional): list of ints (or string-formatted ints), used to choose
             labels (either by literally rendering the class labels, or by indexing into [label_map])
         label_map (dict, optional): int --> str dictionary, typically mapping category IDs to
             species labels; if None, category labels are rendered verbatim (typically as numbers)
@@ -1188,90 +1217,95 @@ def draw_db_boxes_on_file(input_file,
             detection
         ignore_exif_rotation (bool, optional): don't rotate the loaded pixels,
             even if we are loading a JPEG and that JPEG says it should be rotated
     Returns:
         PIL.Image.Image: the loaded and modified image
     """
     image = open_image(input_file, ignore_exif_rotation=ignore_exif_rotation)
     if classes is None:
         classes = [0] * len(boxes)
-    render_db_bounding_boxes(boxes, classes, image, original_size=None,
-                             label_map=label_map, thickness=thickness, expansion=expansion)
+    render_db_bounding_boxes(boxes,
+                             classes,
+                             image,
+                             original_size=None,
+                             label_map=label_map,
+                             thickness=thickness,
+                             expansion=expansion)
     image.save(output_file)
     return image
 # ...def draw_bounding_boxes_on_file(...)
 def gray_scale_fraction(image,crop_size=(0.1,0.1)):
     """
-    Computes the fraction of the pixels in [image] that appear to be grayscale (R==G==B),
+    Computes the fraction of the pixels in [image] that appear to be grayscale (R==G==B),
     useful for approximating whether this is a night-time image when flash information is not
     available in EXIF data (or for video frames, where this information is often not available
     in structured metadata at all).
     Args:
         image (str or PIL.Image.Image): Image, filename, or URL to analyze
-        crop_size (optional): a 2-element list/tuple, representing the fraction of the
-            image to crop at the top and bottom, respectively, before analyzing (to minimize
+        crop_size (tuple of floats, optional): a 2-element list/tuple, representing the fraction of
+            the image to crop at the top and bottom, respectively, before analyzing (to minimize
             the possibility of including color elements in the image overlay)
     Returns:
         float: the fraction of pixels in [image] that appear to be grayscale (R==G==B)
     """
     if isinstance(image,str):
         image = Image.open(image)
     if image.mode == 'L':
         return 1.0
     if len(image.getbands()) == 1:
         return 1.0
     # Crop if necessary
     if crop_size[0] > 0 or crop_size[1] > 0:
         assert (crop_size[0] + crop_size[1]) < 1.0, \
             print('Illegal crop size: {}'.format(str(crop_size)))
         top_crop_pixels = int(image.height * crop_size[0])
         bottom_crop_pixels = int(image.height * crop_size[1])
         left = 0
         right = image.width
         # Remove pixels from the top
         first_crop_top = top_crop_pixels
-        first_crop_bottom = image.height
+        first_crop_bottom = image.height
         first_crop = image.crop((left, first_crop_top, right, first_crop_bottom))
         # Remove pixels from the bottom
         second_crop_top = 0
         second_crop_bottom = first_crop.height - bottom_crop_pixels
         second_crop = first_crop.crop((left, second_crop_top, right, second_crop_bottom))
         image = second_crop
     # It doesn't matter if these are actually R/G/B, they're just names
     r = np.array(image.getchannel(0))
     g = np.array(image.getchannel(1))
     b = np.array(image.getchannel(2))
     gray_pixels = np.logical_and(r == g, r == b)
     n_pixels = gray_pixels.size
     n_gray_pixels = gray_pixels.sum()
     return n_gray_pixels / n_pixels
     # Non-numpy way to do the same thing, briefly keeping this here for posterity
     if False:
         w, h = image.size
         n_pixels = w*h
         n_gray_pixels = 0
@@ -1279,25 +1313,25 @@ def gray_scale_fraction(image,crop_size=(0.1,0.1)):
             for j in range(h):
                 r, g, b = image.getpixel((i,j))
                 if r == g and r == b and g == b:
-                    n_gray_pixels += 1
+                    n_gray_pixels += 1
 # ...def gray_scale_fraction(...)
 def _resize_relative_image(fn_relative,
-                          input_folder,
-                          output_folder,
-                          target_width,
-                          target_height,
-                          no_enlarge_width,
-                          verbose,
-                          quality,
-                          overwrite=True):
+                           input_folder,
+                           output_folder,
+                           target_width,
+                           target_height,
+                           no_enlarge_width,
+                           verbose,
+                           quality,
+                           overwrite=True):
     """
     Internal function for resizing an image from one folder to another,
     maintaining relative path.
     """
     input_fn_abs = os.path.join(input_folder,fn_relative)
     output_fn_abs = os.path.join(output_folder,fn_relative)
@@ -1305,13 +1339,16 @@ def _resize_relative_image(fn_relative,
         status = 'skipped'
         error = None
         return {'fn_relative':fn_relative,'status':status,'error':error}
     os.makedirs(os.path.dirname(output_fn_abs),exist_ok=True)
     try:
-        _ = resize_image(input_fn_abs,
-                         output_file=output_fn_abs,
-                         target_width=target_width, target_height=target_height,
-                         no_enlarge_width=no_enlarge_width, verbose=verbose, quality=quality)
+        _ = resize_image(input_fn_abs,
+                         output_file=output_fn_abs,
+                         target_width=target_width,
+                         target_height=target_height,
+                         no_enlarge_width=no_enlarge_width,
+                         verbose=verbose,
+                         quality=quality)
         status = 'success'
         error = None
     except Exception as e:
@@ -1319,27 +1356,33 @@ def _resize_relative_image(fn_relative,
             print('Error resizing {}: {}'.format(fn_relative,str(e)))
         status = 'error'
         error = str(e)
     return {'fn_relative':fn_relative,'status':status,'error':error}
 # ...def _resize_relative_image(...)
 def _resize_absolute_image(input_output_files,
-                          target_width,target_height,no_enlarge_width,verbose,quality):
+                           target_width,
+                           target_height,
+                           no_enlarge_width,
+                           verbose,
+                           quality):
     """
     Internal wrapper for resize_image used in the context of a batch resize operation.
     """
     input_fn_abs = input_output_files[0]
     output_fn_abs = input_output_files[1]
     os.makedirs(os.path.dirname(output_fn_abs),exist_ok=True)
     try:
-        _ = resize_image(input_fn_abs,
-                         output_file=output_fn_abs,
-                         target_width=target_width, target_height=target_height,
-                         no_enlarge_width=no_enlarge_width, verbose=verbose, quality=quality)
+        _ = resize_image(input_fn_abs,
+                         output_file=output_fn_abs,
+                         target_width=target_width,
+                         target_height=target_height,
+                         no_enlarge_width=no_enlarge_width,
+                         verbose=verbose,
+                         quality=quality)
         status = 'success'
         error = None
     except Exception as e:
@@ -1347,7 +1390,7 @@ def _resize_absolute_image(input_output_files,
             print('Error resizing {}: {}'.format(input_fn_abs,str(e)))
         status = 'error'
         error = str(e)
     return {'input_fn':input_fn_abs,'output_fn':output_fn_abs,status:'status',
             'error':error}
@@ -1355,21 +1398,21 @@ def _resize_absolute_image(input_output_files,
 def resize_images(input_file_to_output_file,
-                  target_width=-1,
+                  target_width=-1,
                   target_height=-1,
-                  no_enlarge_width=False,
-                  verbose=False,
+                  no_enlarge_width=False,
+                  verbose=False,
                   quality='keep',
-                  pool_type='process',
+                  pool_type='process',
                   n_workers=10):
     """
     Resizes all images the dictionary [input_file_to_output_file].
     TODO: This is a little more redundant with resize_image_folder than I would like;
     refactor resize_image_folder to call resize_images.  Not doing that yet because
-    at the time I'm writing this comment, a lot of code depends on resize_image_folder
+    at the time I'm writing this comment, a lot of code depends on resize_image_folder
     and I don't want to rock the boat yet.
     Args:
         input_file_to_output_file (dict): dict mapping images that exist to the locations
             where the resized versions should be written
@@ -1377,8 +1420,8 @@ def resize_images(input_file_to_output_file,
             to let target_height determine the size
         target_height (int, optional): height to which we should resize this image, or -1
             to let target_width determine the size
-        no_enlarge_width (bool, optional): if [no_enlarge_width] is True, and
-            [target width] is larger than the original image width, does not modify the image,
+        no_enlarge_width (bool, optional): if [no_enlarge_width] is True, and
+            [target width] is larger than the original image width, does not modify the image,
             but will write to output_file if supplied
         verbose (bool, optional): enable additional debug output
         quality (str or int, optional): passed to exif_preserving_save, see docs for more detail
@@ -1389,20 +1432,20 @@ def resize_images(input_file_to_output_file,
     Returns:
         list: a list of dicts with keys 'input_fn', 'output_fn', 'status', and 'error'.
-        'status' will be 'success' or 'error'; 'error' will be None for successful cases,
+        'status' will be 'success' or 'error'; 'error' will be None for successful cases,
         otherwise will contain the image-specific error.
     """
     assert pool_type in ('process','thread'), 'Illegal pool type {}'.format(pool_type)
     input_output_file_pairs = []
     # Reformat input files as (input,output) tuples
     for input_fn in input_file_to_output_file:
         input_output_file_pairs.append((input_fn,input_file_to_output_file[input_fn]))
-    if n_workers == 1:
+    if n_workers == 1:
         results = []
         for i_o_file_pair in tqdm(input_output_file_pairs):
             results.append(_resize_absolute_image(i_o_file_pair,
@@ -1413,47 +1456,54 @@ def resize_images(input_file_to_output_file,
                             quality=quality))
     else:
-        if pool_type == 'thread':
-            pool = ThreadPool(n_workers); poolstring = 'threads'
-        else:
-            assert pool_type == 'process'
-            pool = Pool(n_workers); poolstring = 'processes'
-        if verbose:
-            print('Starting resizing pool with {} {}'.format(n_workers,poolstring))
-        p = partial(_resize_absolute_image,
-                target_width=target_width,
-                target_height=target_height,
-                no_enlarge_width=no_enlarge_width,
-                verbose=verbose,
-                quality=quality)
-        results = list(tqdm(pool.imap(p, input_output_file_pairs),total=len(input_output_file_pairs)))
+        pool = None
+        try:
+            if pool_type == 'thread':
+                pool = ThreadPool(n_workers); poolstring = 'threads'
+            else:
+                assert pool_type == 'process'
+                pool = Pool(n_workers); poolstring = 'processes'
+            if verbose:
+                print('Starting resizing pool with {} {}'.format(n_workers,poolstring))
+            p = partial(_resize_absolute_image,
+                    target_width=target_width,
+                    target_height=target_height,
+                    no_enlarge_width=no_enlarge_width,
+                    verbose=verbose,
+                    quality=quality)
+            results = list(tqdm(pool.imap(p, input_output_file_pairs),total=len(input_output_file_pairs)))
+        finally:
+            pool.close()
+            pool.join()
+            print("Pool closed and joined for image resizing")
     return results
 # ...def resize_images(...)
-def resize_image_folder(input_folder,
+def resize_image_folder(input_folder,
                         output_folder=None,
-                        target_width=-1,
+                        target_width=-1,
                         target_height=-1,
-                        no_enlarge_width=False,
-                        verbose=False,
+                        no_enlarge_width=False,
+                        verbose=False,
                         quality='keep',
-                        pool_type='process',
-                        n_workers=10,
+                        pool_type='process',
+                        n_workers=10,
                         recursive=True,
                         image_files_relative=None,
                         overwrite=True):
     """
     Resize all images in a folder (defaults to recursive).
     Defaults to in-place resizing (output_folder is optional).
     Args:
         input_folder (str): folder in which we should find images to resize
         output_folder (str, optional): folder in which we should write resized images.  If
@@ -1463,8 +1513,8 @@ def resize_image_folder(input_folder,
             to let target_height determine the size
         target_height (int, optional): height to which we should resize this image, or -1
             to let target_width determine the size
-        no_enlarge_width (bool, optional): if [no_enlarge_width] is True, and
-            [target width] is larger than the original image width, does not modify the image,
+        no_enlarge_width (bool, optional): if [no_enlarge_width] is True, and
+            [target width] is larger than the original image width, does not modify the image,
             but will write to output_file if supplied
         verbose (bool, optional): enable additional debug output
         quality (str or int, optional): passed to exif_preserving_save, see docs for more detail
@@ -1476,34 +1526,34 @@ def resize_image_folder(input_folder,
         image_files_relative (list, optional): if not None, skips any relative paths not
             in this list
         overwrite (bool, optional): whether to overwrite existing target images
     Returns:
         list: a list of dicts with keys 'input_fn', 'output_fn', 'status', and 'error'.
-        'status' will be 'success', 'skipped', or 'error'; 'error' will be None for successful
+        'status' will be 'success', 'skipped', or 'error'; 'error' will be None for successful
         cases, otherwise will contain the image-specific error.
     """
     assert os.path.isdir(input_folder), '{} is not a folder'.format(input_folder)
     if output_folder is None:
         output_folder = input_folder
     else:
         os.makedirs(output_folder,exist_ok=True)
     assert pool_type in ('process','thread'), 'Illegal pool type {}'.format(pool_type)
     if image_files_relative is None:
         if verbose:
             print('Enumerating images')
         image_files_relative = find_images(input_folder,recursive=recursive,
                                            return_relative_paths=True,convert_slashes=True)
         if verbose:
             print('Found {} images'.format(len(image_files_relative)))
-    if n_workers == 1:
+    if n_workers == 1:
         if verbose:
             print('Resizing images')
@@ -1520,16 +1570,16 @@ def resize_image_folder(input_folder,
                                   overwrite=overwrite))
     else:
         if pool_type == 'thread':
-            pool = ThreadPool(n_workers); poolstring = 'threads'
+            pool = ThreadPool(n_workers); poolstring = 'threads'
         else:
             assert pool_type == 'process'
             pool = Pool(n_workers); poolstring = 'processes'
         if verbose:
             print('Starting resizing pool with {} {}'.format(n_workers,poolstring))
         p = partial(_resize_relative_image,
                 input_folder=input_folder,
                 output_folder=output_folder,
@@ -1539,8 +1589,9 @@ def resize_image_folder(input_folder,
                 verbose=verbose,
                 quality=quality,
                 overwrite=overwrite)
-        results = list(tqdm(pool.imap(p, image_files_relative),total=len(image_files_relative)))
+        results = list(tqdm(pool.imap(p, image_files_relative),
+                            total=len(image_files_relative)))
     return results
@@ -1550,17 +1601,18 @@ def resize_image_folder(input_folder,
 def get_image_size(im,verbose=False):
     """
     Retrieve the size of an image.  Returns None if the image fails to load.
     Args:
         im (str or PIL.Image): filename or PIL image
+        verbose (bool, optional): enable additional debug output
     Returns:
         tuple (w,h), or None if the image fails to load.
     """
     image_name = '[in memory]'
-    try:
+    try:
         if isinstance(im,str):
             image_name = im
             im = load_image(im)
@@ -1577,66 +1629,66 @@ def get_image_size(im,verbose=False):
             print('Error reading width from image {}: {}'.format(
                 image_name,str(e)))
         return None
 # ...def get_image_size(...)
 def parallel_get_image_sizes(filenames,
-                             max_workers=16,
-                             use_threads=True,
+                             max_workers=16,
+                             use_threads=True,
                              recursive=True,
                              verbose=False):
     """
     Retrieve image sizes for a list or folder of images
     Args:
-        filenames (list or str): a list of image filenames or a folder.  Non-image files and
+        filenames (list or str): a list of image filenames or a folder.  Non-image files and
             unreadable images will be returned with a file size of None.
         max_workers (int, optional): the number of parallel workers to use; set to <=1 to disable
             parallelization
         use_threads (bool, optional): whether to use threads (True) or processes (False) for
             parallelization
-        recursive (bool, optional): if [filenames] is a folder, whether to search recursively for images.
-            Ignored if [filenames] is a list.
+        recursive (bool, optional): if [filenames] is a folder, whether to search recursively
+            for images. Ignored if [filenames] is a list.
         verbose (bool, optional): enable additional debug output
     Returns:
         dict: a dict mapping filenames to (w,h) tuples; the value will be None for images that fail
-        to load.
+        to load.  Filenames will always be absolute.
     """
     if isinstance(filenames,str) and os.path.isdir(filenames):
         if verbose:
             print('Enumerating images in {}'.format(filenames))
         filenames = find_images(filenames,recursive=recursive,return_relative_paths=False)
     n_workers = min(max_workers,len(filenames))
     if verbose:
         print('Getting image sizes for {} images'.format(len(filenames)))
     if n_workers <= 1:
         results = []
         for filename in filenames:
             results.append(get_image_size(filename,verbose=verbose))
     else:
         if use_threads:
             pool = ThreadPool(n_workers)
         else:
             pool = Pool(n_workers)
         results = list(tqdm(pool.imap(
             partial(get_image_size,verbose=verbose),filenames), total=len(filenames)))
     assert len(filenames) == len(results), 'Internal error in parallel_get_image_sizes'
     to_return = {}
     for i_file,filename in enumerate(filenames):
         to_return[filename] = results[i_file]
     return to_return
@@ -1645,30 +1697,30 @@ def parallel_get_image_sizes(filenames,
 def check_image_integrity(filename,modes=None):
     """
     Check whether we can successfully load an image via OpenCV and/or PIL.
-    Args:
+    Args:
         filename (str): the filename to evaluate
         modes (list, optional): a list containing one or more of:
             - 'cv'
             - 'pil'
             - 'skimage'
-            - 'jpeg_trailer'
+            - 'jpeg_trailer'
             'jpeg_trailer' checks that the binary data ends with ffd9.  It does not check whether
             the image is actually a jpeg, and even if it is, there are lots of reasons the image might not
             end with ffd9.  It's also true the JPEGs that cause "premature end of jpeg segment" issues
             don't end with ffd9, so this may be a useful diagnostic.  High precision, very low recall
             for corrupt jpegs.
             Set to None to use all modes.
     Returns:
         dict: a dict with a key called 'file' (the value of [filename]), one key for each string in
         [modes] (a success indicator for that mode, specifically a string starting with either
         'success' or 'error').
     """
     if modes is None:
         modes = ('cv','pil','skimage','jpeg_trailer')
     else:
@@ -1676,14 +1728,14 @@ def check_image_integrity(filename,modes=None):
             modes = [modes]
         for mode in modes:
             assert mode in ('cv','pil','skimage'), 'Unrecognized mode {}'.format(mode)
     assert os.path.isfile(filename), 'Could not find file {}'.format(filename)
     result = {}
     result['file'] = filename
     for mode in modes:
         result[mode] = 'unknown'
         if mode == 'pil':
             try:
@@ -1700,10 +1752,10 @@ def check_image_integrity(filename,modes=None):
                 result[mode] = 'success'
             except Exception as e:
                 result[mode] = 'error: {}'.format(str(e))
-        elif mode == 'skimage':
+        elif mode == 'skimage':
             try:
                 # This is not a standard dependency
-                from skimage import io as skimage_io # noqa
+                from skimage import io as skimage_io # type: ignore # noqa
             except Exception:
                 result[mode] = 'could not import skimage, run pip install scikit-image'
                 return result
@@ -1724,26 +1776,26 @@ def check_image_integrity(filename,modes=None):
                     result[mode] = 'success'
             except Exception as e:
                 result[mode] = 'error: {}'.format(str(e))
-    # ...for each mode
+    # ...for each mode
     return result
 # ...def check_image_integrity(...)
 def parallel_check_image_integrity(filenames,
-                                   modes=None,
-                                   max_workers=16,
-                                   use_threads=True,
+                                   modes=None,
+                                   max_workers=16,
+                                   use_threads=True,
                                    recursive=True,
                                    verbose=False):
     """
     Check whether we can successfully load a list of images via OpenCV and/or PIL.
     Args:
         filenames (list or str): a list of image filenames or a folder
-        mode (list): see check_image_integrity() for documentation on the [modes] parameter
+        modes (list, optional): see check_image_integrity() for documentation on the [modes] parameter
         max_workers (int, optional): the number of parallel workers to use; set to <=1 to disable
             parallelization
         use_threads (bool, optional): whether to use threads (True) or processes (False) for
@@ -1751,10 +1803,10 @@ def parallel_check_image_integrity(filenames,
         recursive (bool, optional): if [filenames] is a folder, whether to search recursively for images.
             Ignored if [filenames] is a list.
         verbose (bool, optional): enable additional debug output
     Returns:
-        list: a list of dicts, each with a key called 'file' (the value of [filename]), one key for
-        each string in [modes] (a success indicator for that mode, specifically a string starting
+        list: a list of dicts, each with a key called 'file' (the value of [filename]), one key for
+        each string in [modes] (a success indicator for that mode, specifically a string starting
         with either 'success' or 'error').
     """
@@ -1762,69 +1814,69 @@ def parallel_check_image_integrity(filenames,
         if verbose:
             print('Enumerating images in {}'.format(filenames))
         filenames = find_images(filenames,recursive=recursive,return_relative_paths=False)
     n_workers = min(max_workers,len(filenames))
     if verbose:
         print('Checking image integrity for {} filenames'.format(len(filenames)))
     if n_workers <= 1:
         results = []
         for filename in filenames:
             results.append(check_image_integrity(filename,modes=modes))
     else:
         if use_threads:
             pool = ThreadPool(n_workers)
         else:
             pool = Pool(n_workers)
         results = list(tqdm(pool.imap(
             partial(check_image_integrity,modes=modes),filenames), total=len(filenames)))
     return results
 #%% Test drivers
 if False:
     #%% Text rendering tests
     import os # noqa
     import numpy as np # noqa
     from megadetector.visualization.visualization_utils import \
         draw_bounding_boxes_on_image, exif_preserving_save, load_image, \
         TEXTALIGN_LEFT,TEXTALIGN_RIGHT,VTEXTALIGN_BOTTOM,VTEXTALIGN_TOP, \
         DEFAULT_LABEL_FONT_SIZE
     fn = os.path.expanduser('~/AppData/Local/Temp/md-tests/md-test-images/ena24_7904.jpg')
     output_fn = r'g:\temp\test.jpg'
     image = load_image(fn)
     w = 0.2; h = 0.2
     all_boxes = [[0.05, 0.05, 0.25, 0.25],
                  [0.05, 0.35, 0.25, 0.6],
                  [0.35, 0.05, 0.6, 0.25],
                  [0.35, 0.35, 0.6, 0.6]]
     alignments = [
         [TEXTALIGN_LEFT,VTEXTALIGN_TOP],
         [TEXTALIGN_LEFT,VTEXTALIGN_BOTTOM],
         [TEXTALIGN_RIGHT,VTEXTALIGN_TOP],
         [TEXTALIGN_RIGHT,VTEXTALIGN_BOTTOM]
         ]
     labels = ['left_top','left_bottom','right_top','right_bottom']
     text_rotation = -90
     n_label_copies = 2
     for i_box,box in enumerate(all_boxes):
         boxes = [box]
         boxes = np.array(boxes)
         classes = [i_box]
@@ -1846,30 +1898,30 @@ if False:
     exif_preserving_save(image,output_fn)
     from megadetector.utils.path_utils import open_file
     open_file(output_fn)
     #%% Recursive resize test
     from megadetector.visualization.visualization_utils import resize_image_folder # noqa
     input_folder = r"C:\temp\resize-test\in"
     output_folder = r"C:\temp\resize-test\out"
     resize_results = resize_image_folder(input_folder,output_folder,
                          target_width=1280,verbose=True,quality=85,no_enlarge_width=True,
                          pool_type='process',n_workers=10)
     #%% Integrity checking test
     from megadetector.utils import md_tests
     options = md_tests.download_test_data()
     folder = options.scratch_dir
     results = parallel_check_image_integrity(folder,max_workers=8)
     modes = ['cv','pil','skimage','jpeg_trailer']
     for r in results:
         for mode in modes:
             if r[mode] != 'success':

megadetector 5.0.28__py3-none-any.whl → 10.0.0__py3-none-any.whl

Potentially problematic release.

megadetector 5.0.28py3-none-any.whl → 10.0.0py3-none-any.whl