megadetector 5.0.28-py3-none-any.whl → 10.0.0-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (197)
  1. megadetector/api/batch_processing/integration/digiKam/xmp_integration.py +2 -2
  2. megadetector/api/batch_processing/integration/eMammal/test_scripts/push_annotations_to_emammal.py +1 -1
  3. megadetector/api/batch_processing/integration/eMammal/test_scripts/select_images_for_testing.py +1 -1
  4. megadetector/classification/aggregate_classifier_probs.py +3 -3
  5. megadetector/classification/analyze_failed_images.py +5 -5
  6. megadetector/classification/cache_batchapi_outputs.py +5 -5
  7. megadetector/classification/create_classification_dataset.py +11 -12
  8. megadetector/classification/crop_detections.py +10 -10
  9. megadetector/classification/csv_to_json.py +8 -8
  10. megadetector/classification/detect_and_crop.py +13 -15
  11. megadetector/classification/efficientnet/model.py +8 -8
  12. megadetector/classification/efficientnet/utils.py +6 -5
  13. megadetector/classification/evaluate_model.py +7 -7
  14. megadetector/classification/identify_mislabeled_candidates.py +6 -6
  15. megadetector/classification/json_to_azcopy_list.py +1 -1
  16. megadetector/classification/json_validator.py +29 -32
  17. megadetector/classification/map_classification_categories.py +9 -9
  18. megadetector/classification/merge_classification_detection_output.py +12 -9
  19. megadetector/classification/prepare_classification_script.py +19 -19
  20. megadetector/classification/prepare_classification_script_mc.py +26 -26
  21. megadetector/classification/run_classifier.py +4 -4
  22. megadetector/classification/save_mislabeled.py +6 -6
  23. megadetector/classification/train_classifier.py +1 -1
  24. megadetector/classification/train_classifier_tf.py +9 -9
  25. megadetector/classification/train_utils.py +10 -10
  26. megadetector/data_management/annotations/annotation_constants.py +1 -2
  27. megadetector/data_management/camtrap_dp_to_coco.py +79 -46
  28. megadetector/data_management/cct_json_utils.py +103 -103
  29. megadetector/data_management/cct_to_md.py +49 -49
  30. megadetector/data_management/cct_to_wi.py +33 -33
  31. megadetector/data_management/coco_to_labelme.py +75 -75
  32. megadetector/data_management/coco_to_yolo.py +210 -193
  33. megadetector/data_management/databases/add_width_and_height_to_db.py +86 -12
  34. megadetector/data_management/databases/combine_coco_camera_traps_files.py +40 -40
  35. megadetector/data_management/databases/integrity_check_json_db.py +228 -200
  36. megadetector/data_management/databases/subset_json_db.py +33 -33
  37. megadetector/data_management/generate_crops_from_cct.py +88 -39
  38. megadetector/data_management/get_image_sizes.py +54 -49
  39. megadetector/data_management/labelme_to_coco.py +133 -125
  40. megadetector/data_management/labelme_to_yolo.py +159 -73
  41. megadetector/data_management/lila/create_lila_blank_set.py +81 -83
  42. megadetector/data_management/lila/create_lila_test_set.py +32 -31
  43. megadetector/data_management/lila/create_links_to_md_results_files.py +18 -18
  44. megadetector/data_management/lila/download_lila_subset.py +21 -24
  45. megadetector/data_management/lila/generate_lila_per_image_labels.py +365 -107
  46. megadetector/data_management/lila/get_lila_annotation_counts.py +35 -33
  47. megadetector/data_management/lila/get_lila_image_counts.py +22 -22
  48. megadetector/data_management/lila/lila_common.py +73 -70
  49. megadetector/data_management/lila/test_lila_metadata_urls.py +28 -19
  50. megadetector/data_management/mewc_to_md.py +344 -340
  51. megadetector/data_management/ocr_tools.py +262 -255
  52. megadetector/data_management/read_exif.py +249 -227
  53. megadetector/data_management/remap_coco_categories.py +90 -28
  54. megadetector/data_management/remove_exif.py +81 -21
  55. megadetector/data_management/rename_images.py +187 -187
  56. megadetector/data_management/resize_coco_dataset.py +588 -120
  57. megadetector/data_management/speciesnet_to_md.py +41 -41
  58. megadetector/data_management/wi_download_csv_to_coco.py +55 -55
  59. megadetector/data_management/yolo_output_to_md_output.py +248 -122
  60. megadetector/data_management/yolo_to_coco.py +333 -191
  61. megadetector/detection/change_detection.py +832 -0
  62. megadetector/detection/process_video.py +340 -337
  63. megadetector/detection/pytorch_detector.py +358 -278
  64. megadetector/detection/run_detector.py +399 -186
  65. megadetector/detection/run_detector_batch.py +404 -377
  66. megadetector/detection/run_inference_with_yolov5_val.py +340 -327
  67. megadetector/detection/run_tiled_inference.py +257 -249
  68. megadetector/detection/tf_detector.py +24 -24
  69. megadetector/detection/video_utils.py +332 -295
  70. megadetector/postprocessing/add_max_conf.py +19 -11
  71. megadetector/postprocessing/categorize_detections_by_size.py +45 -45
  72. megadetector/postprocessing/classification_postprocessing.py +468 -433
  73. megadetector/postprocessing/combine_batch_outputs.py +23 -23
  74. megadetector/postprocessing/compare_batch_results.py +590 -525
  75. megadetector/postprocessing/convert_output_format.py +106 -102
  76. megadetector/postprocessing/create_crop_folder.py +347 -147
  77. megadetector/postprocessing/detector_calibration.py +173 -168
  78. megadetector/postprocessing/generate_csv_report.py +508 -499
  79. megadetector/postprocessing/load_api_results.py +48 -27
  80. megadetector/postprocessing/md_to_coco.py +133 -102
  81. megadetector/postprocessing/md_to_labelme.py +107 -90
  82. megadetector/postprocessing/md_to_wi.py +40 -40
  83. megadetector/postprocessing/merge_detections.py +92 -114
  84. megadetector/postprocessing/postprocess_batch_results.py +319 -301
  85. megadetector/postprocessing/remap_detection_categories.py +91 -38
  86. megadetector/postprocessing/render_detection_confusion_matrix.py +214 -205
  87. megadetector/postprocessing/repeat_detection_elimination/find_repeat_detections.py +57 -57
  88. megadetector/postprocessing/repeat_detection_elimination/remove_repeat_detections.py +27 -28
  89. megadetector/postprocessing/repeat_detection_elimination/repeat_detections_core.py +704 -679
  90. megadetector/postprocessing/separate_detections_into_folders.py +226 -211
  91. megadetector/postprocessing/subset_json_detector_output.py +265 -262
  92. megadetector/postprocessing/top_folders_to_bottom.py +45 -45
  93. megadetector/postprocessing/validate_batch_results.py +70 -70
  94. megadetector/taxonomy_mapping/map_lila_taxonomy_to_wi_taxonomy.py +52 -52
  95. megadetector/taxonomy_mapping/map_new_lila_datasets.py +18 -19
  96. megadetector/taxonomy_mapping/prepare_lila_taxonomy_release.py +54 -33
  97. megadetector/taxonomy_mapping/preview_lila_taxonomy.py +67 -67
  98. megadetector/taxonomy_mapping/retrieve_sample_image.py +16 -16
  99. megadetector/taxonomy_mapping/simple_image_download.py +8 -8
  100. megadetector/taxonomy_mapping/species_lookup.py +156 -74
  101. megadetector/taxonomy_mapping/taxonomy_csv_checker.py +14 -14
  102. megadetector/taxonomy_mapping/taxonomy_graph.py +10 -10
  103. megadetector/taxonomy_mapping/validate_lila_category_mappings.py +13 -13
  104. megadetector/utils/ct_utils.py +1049 -211
  105. megadetector/utils/directory_listing.py +21 -77
  106. megadetector/utils/gpu_test.py +22 -22
  107. megadetector/utils/md_tests.py +632 -529
  108. megadetector/utils/path_utils.py +1520 -431
  109. megadetector/utils/process_utils.py +41 -41
  110. megadetector/utils/split_locations_into_train_val.py +62 -62
  111. megadetector/utils/string_utils.py +148 -27
  112. megadetector/utils/url_utils.py +489 -176
  113. megadetector/utils/wi_utils.py +2658 -2526
  114. megadetector/utils/write_html_image_list.py +137 -137
  115. megadetector/visualization/plot_utils.py +34 -30
  116. megadetector/visualization/render_images_with_thumbnails.py +39 -74
  117. megadetector/visualization/visualization_utils.py +487 -435
  118. megadetector/visualization/visualize_db.py +232 -198
  119. megadetector/visualization/visualize_detector_output.py +82 -76
  120. {megadetector-5.0.28.dist-info → megadetector-10.0.0.dist-info}/METADATA +5 -2
  121. megadetector-10.0.0.dist-info/RECORD +139 -0
  122. {megadetector-5.0.28.dist-info → megadetector-10.0.0.dist-info}/WHEEL +1 -1
  123. megadetector/api/batch_processing/api_core/__init__.py +0 -0
  124. megadetector/api/batch_processing/api_core/batch_service/__init__.py +0 -0
  125. megadetector/api/batch_processing/api_core/batch_service/score.py +0 -439
  126. megadetector/api/batch_processing/api_core/server.py +0 -294
  127. megadetector/api/batch_processing/api_core/server_api_config.py +0 -97
  128. megadetector/api/batch_processing/api_core/server_app_config.py +0 -55
  129. megadetector/api/batch_processing/api_core/server_batch_job_manager.py +0 -220
  130. megadetector/api/batch_processing/api_core/server_job_status_table.py +0 -149
  131. megadetector/api/batch_processing/api_core/server_orchestration.py +0 -360
  132. megadetector/api/batch_processing/api_core/server_utils.py +0 -88
  133. megadetector/api/batch_processing/api_core_support/__init__.py +0 -0
  134. megadetector/api/batch_processing/api_core_support/aggregate_results_manually.py +0 -46
  135. megadetector/api/batch_processing/api_support/__init__.py +0 -0
  136. megadetector/api/batch_processing/api_support/summarize_daily_activity.py +0 -152
  137. megadetector/api/batch_processing/data_preparation/__init__.py +0 -0
  138. megadetector/api/synchronous/__init__.py +0 -0
  139. megadetector/api/synchronous/api_core/animal_detection_api/__init__.py +0 -0
  140. megadetector/api/synchronous/api_core/animal_detection_api/api_backend.py +0 -151
  141. megadetector/api/synchronous/api_core/animal_detection_api/api_frontend.py +0 -263
  142. megadetector/api/synchronous/api_core/animal_detection_api/config.py +0 -35
  143. megadetector/api/synchronous/api_core/tests/__init__.py +0 -0
  144. megadetector/api/synchronous/api_core/tests/load_test.py +0 -110
  145. megadetector/data_management/importers/add_nacti_sizes.py +0 -52
  146. megadetector/data_management/importers/add_timestamps_to_icct.py +0 -79
  147. megadetector/data_management/importers/animl_results_to_md_results.py +0 -158
  148. megadetector/data_management/importers/auckland_doc_test_to_json.py +0 -373
  149. megadetector/data_management/importers/auckland_doc_to_json.py +0 -201
  150. megadetector/data_management/importers/awc_to_json.py +0 -191
  151. megadetector/data_management/importers/bellevue_to_json.py +0 -272
  152. megadetector/data_management/importers/cacophony-thermal-importer.py +0 -793
  153. megadetector/data_management/importers/carrizo_shrubfree_2018.py +0 -269
  154. megadetector/data_management/importers/carrizo_trail_cam_2017.py +0 -289
  155. megadetector/data_management/importers/cct_field_adjustments.py +0 -58
  156. megadetector/data_management/importers/channel_islands_to_cct.py +0 -913
  157. megadetector/data_management/importers/eMammal/copy_and_unzip_emammal.py +0 -180
  158. megadetector/data_management/importers/eMammal/eMammal_helpers.py +0 -249
  159. megadetector/data_management/importers/eMammal/make_eMammal_json.py +0 -223
  160. megadetector/data_management/importers/ena24_to_json.py +0 -276
  161. megadetector/data_management/importers/filenames_to_json.py +0 -386
  162. megadetector/data_management/importers/helena_to_cct.py +0 -283
  163. megadetector/data_management/importers/idaho-camera-traps.py +0 -1407
  164. megadetector/data_management/importers/idfg_iwildcam_lila_prep.py +0 -294
  165. megadetector/data_management/importers/import_desert_lion_conservation_camera_traps.py +0 -387
  166. megadetector/data_management/importers/jb_csv_to_json.py +0 -150
  167. megadetector/data_management/importers/mcgill_to_json.py +0 -250
  168. megadetector/data_management/importers/missouri_to_json.py +0 -490
  169. megadetector/data_management/importers/nacti_fieldname_adjustments.py +0 -79
  170. megadetector/data_management/importers/noaa_seals_2019.py +0 -181
  171. megadetector/data_management/importers/osu-small-animals-to-json.py +0 -364
  172. megadetector/data_management/importers/pc_to_json.py +0 -365
  173. megadetector/data_management/importers/plot_wni_giraffes.py +0 -123
  174. megadetector/data_management/importers/prepare_zsl_imerit.py +0 -131
  175. megadetector/data_management/importers/raic_csv_to_md_results.py +0 -416
  176. megadetector/data_management/importers/rspb_to_json.py +0 -356
  177. megadetector/data_management/importers/save_the_elephants_survey_A.py +0 -320
  178. megadetector/data_management/importers/save_the_elephants_survey_B.py +0 -329
  179. megadetector/data_management/importers/snapshot_safari_importer.py +0 -758
  180. megadetector/data_management/importers/snapshot_serengeti_lila.py +0 -1067
  181. megadetector/data_management/importers/snapshotserengeti/make_full_SS_json.py +0 -150
  182. megadetector/data_management/importers/snapshotserengeti/make_per_season_SS_json.py +0 -153
  183. megadetector/data_management/importers/sulross_get_exif.py +0 -65
  184. megadetector/data_management/importers/timelapse_csv_set_to_json.py +0 -490
  185. megadetector/data_management/importers/ubc_to_json.py +0 -399
  186. megadetector/data_management/importers/umn_to_json.py +0 -507
  187. megadetector/data_management/importers/wellington_to_json.py +0 -263
  188. megadetector/data_management/importers/wi_to_json.py +0 -442
  189. megadetector/data_management/importers/zamba_results_to_md_results.py +0 -180
  190. megadetector/data_management/lila/add_locations_to_island_camera_traps.py +0 -101
  191. megadetector/data_management/lila/add_locations_to_nacti.py +0 -151
  192. megadetector/utils/azure_utils.py +0 -178
  193. megadetector/utils/sas_blob_utils.py +0 -509
  194. megadetector-5.0.28.dist-info/RECORD +0 -209
  195. /megadetector/{api/batch_processing/__init__.py → __init__.py} +0 -0
  196. {megadetector-5.0.28.dist-info → megadetector-10.0.0.dist-info}/licenses/LICENSE +0 -0
  197. {megadetector-5.0.28.dist-info → megadetector-10.0.0.dist-info}/top_level.txt +0 -0
megadetector/detection/run_detector_batch.py

@@ -10,8 +10,8 @@ https://github.com/agentmorris/MegaDetector/tree/main/megadetector/api/batch_pro
  This enables the results to be used in our post-processing pipeline; see postprocess_batch_results.py.

  This script can save results to checkpoints intermittently, in case disaster
- strikes. To enable this, set --checkpoint_frequency to n > 0, and results
- will be saved as a checkpoint every n images. Checkpoints will be written
+ strikes. To enable this, set --checkpoint_frequency to n > 0, and results
+ will be saved as a checkpoint every n images. Checkpoints will be written
  to a file in the same directory as the output_file, and after all images
  are processed and final results file written to output_file, the temporary
  checkpoint file will be deleted. If you want to resume from a checkpoint, set
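
As a concrete illustration of the checkpointing behavior described in this docstring, here is a minimal sketch using the Python API rather than the CLI; the paths are hypothetical, and it assumes the load_and_run_detector_batch() and write_results_to_file() signatures shown later in this diff, plus the {'images': [...]} checkpoint layout written by _write_checkpoint().

```python
# Hedged sketch: resume-from-checkpoint via the Python API.
# Paths are hypothetical placeholders.
import json
import os

from megadetector.detection.run_detector_batch import (
    load_and_run_detector_batch, write_results_to_file)

checkpoint_path = '/tmp/md_checkpoint.json'

# If a checkpoint exists, load the already-computed results from it
results = None
if os.path.isfile(checkpoint_path):
    with open(checkpoint_path, 'r') as f:
        results = json.load(f)['images']

# Checkpoint every 1000 images; previously-processed images are skipped
results = load_and_run_detector_batch('MDV5A',
                                      '/data/camera-trap-images',
                                      checkpoint_path=checkpoint_path,
                                      checkpoint_frequency=1000,
                                      results=results)

write_results_to_file(results, '/data/md_results.json', detector_file='MDV5A')
```
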
@@ -26,10 +26,10 @@ run a gazillion MegaDetector images on multiple GPUs using this script, we just
  one GPU *per invocation of this script*. Dividing a big batch of images into one chunk
  per GPU happens outside of this script.

- Does not have a command-line option to bind the process to a particular GPU, but you can
+ Does not have a command-line option to bind the process to a particular GPU, but you can
  prepend with "CUDA_VISIBLE_DEVICES=0 ", for example, to bind to GPU 0, e.g.:

- CUDA_VISIBLE_DEVICES=0 python detection/run_detector_batch.py md_v4.1.0.pb ~/data ~/mdv4test.json
+ CUDA_VISIBLE_DEVICES=0 python detection/run_detector_batch.py md_v4.1.0.pb ~/data ~/mdv4test.json

  You can disable GPU processing entirely by setting CUDA_VISIBLE_DEVICES=''.

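
The CUDA_VISIBLE_DEVICES convention above is standard CUDA behavior, so the same binding can be done from Python, as in this sketch (set the variable before any CUDA context is created, i.e. before the detector is loaded):

```python
# Sketch: bind this process to GPU 0, or disable the GPU entirely,
# before loading the model. Standard CUDA behavior, not specific
# to this script.
import os

os.environ['CUDA_VISIBLE_DEVICES'] = '0'   # bind to GPU 0
# os.environ['CUDA_VISIBLE_DEVICES'] = ''  # force CPU-only inference

from megadetector.detection.run_detector_batch import load_and_run_detector_batch

results = load_and_run_detector_batch('MDV5A', '/data/camera-trap-images')
```
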
@@ -70,6 +70,7 @@ from megadetector.detection.run_detector import \
  get_detector_metadata_from_version_string

  from megadetector.utils import path_utils
+ from megadetector.utils import ct_utils
  from megadetector.utils.ct_utils import parse_kvp_list
  from megadetector.utils.ct_utils import split_list_into_n_chunks
  from megadetector.utils.ct_utils import sort_list_of_dicts_by_key
@@ -92,7 +93,7 @@ max_queue_size = 10
  # How often should we print progress when using the image queue?
  n_queue_print = 1000

- # TODO: it's a little sloppy that these are module-level globals, but in practice it
+ # TODO: it's a little sloppy that these are module-level globals, but in practice it
  # doesn't really matter, so I'm not in a big rush to move these to options until I do
  # a larger cleanup of all the long argument lists in this module.
  #
@@ -116,40 +117,42 @@ def _producer_func(q,
  verbose=False,
  image_size=None,
  augment=None):
- """
+ """
  Producer function; only used when using the (optional) image queue.
-
- Reads up to images from disk and puts them on the blocking queue for
- processing. Each image is queued as a tuple of [filename,Image]. Sends
+
+ Reads up to images from disk and puts them on the blocking queue for
+ processing. Each image is queued as a tuple of [filename,Image]. Sends
  "None" to the queue when finished.
-
+
  The "detector" argument is only used for preprocessing.
  """
-
+
  if verbose:
  print('Producer starting: ID {}, preprocessor {}'.format(producer_id,preprocessor))
  sys.stdout.flush()
-
- if preprocessor is not None:
+
+ if preprocessor is not None:
  assert isinstance(preprocessor,str)
  detector_options = deepcopy(detector_options)
  detector_options['preprocess_only'] = True
- preprocessor = load_detector(preprocessor,detector_options=detector_options,verbose=verbose)
-
+ preprocessor = load_detector(preprocessor,
+ detector_options=detector_options,
+ verbose=verbose)
+
  for im_file in image_files:
-
+
  try:
  if verbose:
  print('Loading image {} on producer {}'.format(im_file,producer_id))
  sys.stdout.flush()
  image = vis_utils.load_image(im_file)
-
+
  if preprocessor is not None:
-
+
  image_info = preprocessor.generate_detections_one_image(
- image,
- im_file,
- detection_threshold=None,
+ image,
+ im_file,
+ detection_threshold=None,
  image_size=image_size,
  skip_image_resizing=False,
  augment=augment,
@@ -158,29 +161,29 @@ def _producer_func(q,
  if 'failure' in image_info:
  assert image_info['failure'] == run_detector.FAILURE_INFER
  raise
-
+
  image = image_info
-
+
  except Exception as e:
  print('Producer process: image {} cannot be loaded:\n{}'.format(im_file,str(e)))
- image = run_detector.FAILURE_IMAGE_OPEN
-
+ image = run_detector.FAILURE_IMAGE_OPEN
+
  if verbose:
  print('Queueing image {} from producer {}'.format(im_file,producer_id))
  sys.stdout.flush()
-
+
  q.put([im_file,image,producer_id])
-
+
  # This is a signal to the consumer function that a worker has finished
  q.put(None)
-
+
  if verbose:
  print('Loader worker {} finished'.format(producer_id))
  sys.stdout.flush()

  # ...def _producer_func(...)
-
-
+
+
  def _consumer_func(q,
  return_queue,
  model_file,
@@ -188,27 +191,29 @@ def _consumer_func(q,
  loader_workers,
  image_size=None,
  include_image_size=False,
- include_image_timestamp=False,
+ include_image_timestamp=False,
  include_exif_data=False,
  augment=False,
  detector_options=None,
  preprocess_on_image_queue=default_preprocess_on_image_queue,
  n_total_images=None
  ):
- """
+ """
  Consumer function; only used when using the (optional) image queue.
-
+
  Pulls images from a blocking queue and processes them. Returns when "None" has
  been read from each loader's queue.
  """
-
+
  if verbose:
  print('Consumer starting'); sys.stdout.flush()

  start_time = time.time()
-
+
  if isinstance(model_file,str):
- detector = load_detector(model_file,detector_options=detector_options,verbose=verbose)
+ detector = load_detector(model_file,
+ detector_options=detector_options,
+ verbose=verbose)
  elapsed = time.time() - start_time
  print('Loaded model (before queueing) in {}, printing updates every {} images'.format(
  humanfriendly.format_timespan(elapsed),n_queue_print))
216
221
  else:
217
222
  detector = model_file
218
223
  print('Detector of type {} passed to consumer function'.format(type(detector)))
219
-
224
+
220
225
  results = []
221
-
226
+
222
227
  n_images_processed = 0
223
228
  n_queues_finished = 0
224
-
229
+
225
230
  pbar = None
226
231
  if n_total_images is not None:
227
232
  # TODO: in principle I should close this pbar
228
233
  pbar = tqdm(total=n_total_images)
229
-
234
+
230
235
  while True:
231
-
236
+
232
237
  r = q.get()
233
-
238
+
234
239
  # Is this the last image in one of the producer queues?
235
240
  if r is None:
236
241
  n_queues_finished += 1
@@ -246,7 +251,7 @@ def _consumer_func(q,
246
251
  n_images_processed += 1
247
252
  im_file = r[0]
248
253
  image = r[1]
249
-
254
+
250
255
  """
251
256
  result['img_processed'] = img
252
257
  result['img_original'] = img_original
@@ -255,19 +260,19 @@ def _consumer_func(q,
  result['letterbox_ratio'] = letterbox_ratio
  result['letterbox_pad'] = letterbox_pad
  """
-
+
  if pbar is not None:
  pbar.update(1)
-
+
  if False:
  if verbose or ((n_images_processed % n_queue_print) == 1):
  elapsed = time.time() - start_time
  images_per_second = n_images_processed / elapsed
  print('De-queued image {} ({:.2f}/s) ({})'.format(n_images_processed,
  images_per_second,
- im_file));
+ im_file))
  sys.stdout.flush()
-
+
  if isinstance(image,str):
  # This is how the producer function communicates read errors
  results.append({'file': im_file,
@@ -276,7 +281,7 @@ def _consumer_func(q,
  print('Expected a dict, received an image of type {}'.format(type(image)))
  results.append({'file': im_file,
  'failure': 'illegal image type'})
-
+
  else:
  results.append(process_image(im_file=im_file,
  detector=detector,
@@ -285,14 +290,14 @@ def _consumer_func(q,
  quiet=True,
  image_size=image_size,
  include_image_size=include_image_size,
- include_image_timestamp=include_image_timestamp,
+ include_image_timestamp=include_image_timestamp,
  include_exif_data=include_exif_data,
  augment=augment,
  skip_image_resizing=preprocess_on_image_queue))
  if verbose:
  print('Processed image {}'.format(im_file)); sys.stdout.flush()
  q.task_done()
-
+
  # ...while True (consumer loop)

  # ...def _consumer_func(...)
@@ -303,7 +308,7 @@ def run_detector_with_image_queue(image_files,
  confidence_threshold,
  quiet=False,
  image_size=None,
- include_image_size=False,
+ include_image_size=False,
  include_image_timestamp=False,
  include_exif_data=False,
  augment=False,
@@ -311,54 +316,59 @@ def run_detector_with_image_queue(image_files,
  loader_workers=default_loaders,
  preprocess_on_image_queue=default_preprocess_on_image_queue):
  """
- Driver function for the (optional) multiprocessing-based image queue; only used
- when --use_image_queue is specified. Starts a reader process to read images from disk, but
+ Driver function for the (optional) multiprocessing-based image queue; only used
+ when --use_image_queue is specified. Starts a reader process to read images from disk, but
  processes images in the process from which this function is called (i.e., does not currently
  spawn a separate consumer process).
-
+
  Args:
  image_files (str): list of absolute paths to images
  model_file (str): filename or model identifier (e.g. "MDV5A")
  confidence_threshold (float): minimum confidence detection to include in
  output
  quiet (bool, optional): suppress per-image console printouts
- image_size (tuple, optional): image size to use for inference, only mess with this
+ image_size (int, optional): image size to use for inference, only mess with this
  if (a) you're using a model other than MegaDetector or (b) you know what you're
  doing
  include_image_size (bool, optional): should we include image size in the output for each image?
  include_image_timestamp (bool, optional): should we include image timestamps in the output for each image?
  include_exif_data (bool, optional): should we include EXIF data in the output for each image?
  augment (bool, optional): enable image augmentation
- detector_options (dict, optional): key/value pairs that are interpreted differently
+ detector_options (dict, optional): key/value pairs that are interpreted differently
  by different detectors
  loader_workers (int, optional): number of loaders to use
-
+ preprocess_on_image_queue (bool, optional): if the image queue is enabled, should it handle
+ image loading and preprocessing (True), or just image loading (False)?
+
  Returns:
  list: list of dicts in the format returned by process_image()
  """
-
+
  # Validate inputs
  assert isinstance(model_file,str)
-
+
  if loader_workers <= 0:
  loader_workers = 1
-
+
+ if detector_options is None:
+ detector_options = {}
+
  q = multiprocessing.JoinableQueue(max_queue_size)
  return_queue = multiprocessing.Queue(1)
-
+
  producers = []
-
+
  worker_string = 'thread' if use_threads_for_queue else 'process'
  print('Starting a {} pool with {} workers'.format(worker_string,loader_workers))
-
+
  preprocessor = None
-
+
  if preprocess_on_image_queue:
  print('Enabling image queue preprocessing')
  preprocessor = model_file
-
+
  n_total_images = len(image_files)
-
+
  chunks = split_list_into_n_chunks(image_files, loader_workers, chunk_strategy='greedy')
  for i_chunk,chunk in enumerate(chunks):
  if use_threads_for_queue:
@@ -379,11 +389,11 @@ def run_detector_with_image_queue(image_files,
  image_size,
  augment))
  producers.append(producer)
-
+
  for producer in producers:
  producer.daemon = False
  producer.start()
-
+
  if run_separate_consumer_process:
  if use_threads_for_queue:
  consumer = Thread(target=_consumer_func,args=(q,
@@ -393,7 +403,7 @@ def run_detector_with_image_queue(image_files,
  loader_workers,
  image_size,
  include_image_size,
- include_image_timestamp,
+ include_image_timestamp,
  include_exif_data,
  augment,
  detector_options,
@@ -407,7 +417,7 @@ def run_detector_with_image_queue(image_files,
  loader_workers,
  image_size,
  include_image_size,
- include_image_timestamp,
+ include_image_timestamp,
  include_exif_data,
  augment,
  detector_options,
@@ -423,7 +433,7 @@ def run_detector_with_image_queue(image_files,
  loader_workers,
  image_size,
  include_image_size,
- include_image_timestamp,
+ include_image_timestamp,
  include_exif_data,
  augment,
  detector_options,
@@ -434,21 +444,21 @@ def run_detector_with_image_queue(image_files,
  producer.join()
  if verbose:
  print('Producer {} finished'.format(i_producer))
-
+
  if verbose:
  print('All producers finished')
-
+
  if run_separate_consumer_process:
  consumer.join()
  if verbose:
  print('Consumer loop finished')
-
+
  q.join()
  if verbose:
  print('Queue joined')

  results = return_queue.get()
-
+
  return results

  # ...def run_detector_with_image_queue(...)
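
A sketch of calling this driver directly, using only arguments documented in the Args list above (paths are placeholders; most callers reach this code via load_and_run_detector_batch with use_image_queue=True):

```python
# Hedged sketch: direct use of the image-queue driver, per the
# docstring above. Paths and worker counts are illustrative.
from megadetector.detection.run_detector_batch import run_detector_with_image_queue
from megadetector.utils import path_utils

image_files = path_utils.find_images('/data/camera-trap-images', True)

results = run_detector_with_image_queue(image_files,
                                        'MDV5A',
                                        confidence_threshold=0.005,
                                        loader_workers=4,
                                        preprocess_on_image_queue=True)
print('Processed {} images'.format(len(results)))
```
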
@@ -459,29 +469,29 @@ def run_detector_with_image_queue(image_files,
  def _chunks_by_number_of_chunks(ls, n):
  """
  Splits a list into n even chunks.
-
+
  External callers should use ct_utils.split_list_into_n_chunks().

  Args:
  ls (list): list to break up into chunks
  n (int): number of chunks
  """
-
+
  for i in range(0, n):
  yield ls[i::n]


  #%% Image processing functions

- def process_images(im_files,
- detector,
- confidence_threshold,
- use_image_queue=False,
- quiet=False,
- image_size=None,
- checkpoint_queue=None,
- include_image_size=False,
- include_image_timestamp=False,
+ def process_images(im_files,
+ detector,
+ confidence_threshold,
+ use_image_queue=False,
+ quiet=False,
+ image_size=None,
+ checkpoint_queue=None,
+ include_image_size=False,
+ include_image_timestamp=False,
  include_exif_data=False,
  augment=False,
  detector_options=None,
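
Note that the ls[i::n] slice in _chunks_by_number_of_chunks() above deals elements out round-robin (element j lands in chunk j % n) rather than in contiguous blocks; a quick self-contained illustration:

```python
# Round-robin chunking, as in _chunks_by_number_of_chunks() above.
def chunks_by_number_of_chunks(ls, n):
    for i in range(0, n):
        yield ls[i::n]

print(list(chunks_by_number_of_chunks(list(range(7)), 3)))
# -> [[0, 3, 6], [1, 4], [2, 5]]
```
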
@@ -489,15 +499,15 @@ def process_images(im_files,
  preprocess_on_image_queue=default_preprocess_on_image_queue):
  """
  Runs a detector (typically MegaDetector) over a list of image files on a single thread.
-
+
  Args:
- im_files (list: paths to image files
+ im_files (list): paths to image files
  detector (str or detector object): loaded model or str; if this is a string, it can be a
  path to a .pb/.pt model file or a known model identifier (e.g. "MDV5A")
  confidence_threshold (float): only detections above this threshold are returned
  use_image_queue (bool, optional): separate image loading onto a dedicated worker process
  quiet (bool, optional): suppress per-image printouts
- image_size (tuple, optional): image size to use for inference, only mess with this
+ image_size (int, optional): image size to use for inference, only mess with this
  if (a) you're using a model other than MegaDetector or (b) you know what you're
  doing
  checkpoint_queue (Queue, optional): internal parameter used to pass image queues around
@@ -505,68 +515,75 @@ def process_images(im_files,
  include_image_timestamp (bool, optional): should we include image timestamps in the output for each image?
  include_exif_data (bool, optional): should we include EXIF data in the output for each image?
  augment (bool, optional): enable image augmentation
- detector_options (dict, optional): key/value pairs that are interpreted differently
+ detector_options (dict, optional): key/value pairs that are interpreted differently
  by different detectors
  loader_workers (int, optional): number of loaders to use (only relevant when using image queue)
+ preprocess_on_image_queue (bool, optional): if the image queue is enabled, should it handle
+ image loading and preprocessing (True), or just image loading (False)?

  Returns:
  list: list of dicts, in which each dict represents detections on one image,
  see the 'images' key in https://github.com/agentmorris/MegaDetector/tree/main/megadetector/api/batch_processing#batch-processing-api-output-format
  """
-
+
  if isinstance(detector, str):
-
+
  start_time = time.time()
- detector = load_detector(detector,detector_options=detector_options,verbose=verbose)
+ detector = load_detector(detector,
+ detector_options=detector_options,
+ verbose=verbose)
  elapsed = time.time() - start_time
  print('Loaded model (batch level) in {}'.format(humanfriendly.format_timespan(elapsed)))

+ if detector_options is None:
+ detector_options = {}
+
  if use_image_queue:
-
- run_detector_with_image_queue(im_files,
- detector,
- confidence_threshold,
- quiet=quiet,
+
+ run_detector_with_image_queue(im_files,
+ detector,
+ confidence_threshold,
+ quiet=quiet,
  image_size=image_size,
- include_image_size=include_image_size,
+ include_image_size=include_image_size,
  include_image_timestamp=include_image_timestamp,
  include_exif_data=include_exif_data,
  augment=augment,
  detector_options=detector_options,
  loader_workers=loader_workers,
  preprocess_on_image_queue=preprocess_on_image_queue)
-
- else:
-
+
+ else:
+
  results = []
  for im_file in im_files:
- result = process_image(im_file,
- detector,
+ result = process_image(im_file,
+ detector,
  confidence_threshold,
- quiet=quiet,
- image_size=image_size,
- include_image_size=include_image_size,
+ quiet=quiet,
+ image_size=image_size,
+ include_image_size=include_image_size,
  include_image_timestamp=include_image_timestamp,
  include_exif_data=include_exif_data,
  augment=augment)

  if checkpoint_queue is not None:
  checkpoint_queue.put(result)
- results.append(result)
-
+ results.append(result)
+
  return results

  # ...def process_images(...)


- def process_image(im_file,
- detector,
- confidence_threshold,
- image=None,
- quiet=False,
- image_size=None,
+ def process_image(im_file,
+ detector,
+ confidence_threshold,
+ image=None,
+ quiet=False,
+ image_size=None,
  include_image_size=False,
- include_image_timestamp=False,
+ include_image_timestamp=False,
  include_exif_data=False,
  skip_image_resizing=False,
  augment=False):
@@ -575,30 +592,30 @@ def process_image(im_file,

  Args:
  im_file (str): path to image file
- detector (detector object): loaded model, this can no longer be a string by the time
+ detector (detector object): loaded model, this can no longer be a string by the time
  you get this far down the pipeline
  confidence_threshold (float): only detections above this threshold are returned
  image (Image, optional): previously-loaded image, if available, used when a worker
  thread is handling image loads
  quiet (bool, optional): suppress per-image printouts
- image_size (tuple, optional): image size to use for inference, only mess with this
+ image_size (int, optional): image size to use for inference, only mess with this
  if (a) you're using a model other than MegaDetector or (b) you know what you're
- doing
+ doing
  include_image_size (bool, optional): should we include image size in the output for each image?
  include_image_timestamp (bool, optional): should we include image timestamps in the output for each image?
- include_exif_data (bool, optional): should we include EXIF data in the output for each image?
+ include_exif_data (bool, optional): should we include EXIF data in the output for each image?
  skip_image_resizing (bool, optional): whether to skip internal image resizing and rely on external resizing
  augment (bool, optional): enable image augmentation

  Returns:
  dict: dict representing detections on one image,
- see the 'images' key in
+ see the 'images' key in
  https://github.com/agentmorris/MegaDetector/tree/main/megadetector/api/batch_processing#batch-processing-api-output-format
  """
-
+
  if not quiet:
  print('Processing image {}'.format(im_file))
-
+
  if image is None:
  try:
  image = vis_utils.load_image(im_file)
@@ -612,11 +629,11 @@ def process_image(im_file,
  return result

  try:
-
+
  result = detector.generate_detections_one_image(
- image,
- im_file,
- detection_threshold=confidence_threshold,
+ image,
+ im_file,
+ detection_threshold=confidence_threshold,
  image_size=image_size,
  skip_image_resizing=skip_image_resizing,
  augment=augment)
@@ -632,7 +649,7 @@ def process_image(im_file,
  if isinstance(image,dict):
  image = image['img_original_pil']

- if include_image_size:
+ if include_image_size:
  result['width'] = image.width
  result['height'] = image.height

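
For reference, a sketch of single-image use per the process_image() docstring above; by this point the detector must already be a loaded model object, not a string (model name and path are placeholders):

```python
# Hedged sketch: processing a single image with a pre-loaded detector.
from megadetector.detection.run_detector import load_detector
from megadetector.detection.run_detector_batch import process_image

detector = load_detector('MDV5A')
result = process_image('/data/images/IMG_0001.JPG',
                       detector,
                       confidence_threshold=0.005,
                       include_image_size=True)
print(result['file'], result.get('detections'))
```
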
@@ -651,13 +668,13 @@ def _load_custom_class_mapping(class_mapping_filename):
  """
  This is an experimental hack to allow the use of non-MD YOLOv5 models through
  the same infrastructure; it disables the code that enforces MDv5-like class lists.
-
+
  Should be a .json file that maps int-strings to strings, or a YOLOv5 dataset.yaml file.
  """
-
+
  if class_mapping_filename is None:
  return
-
+
  run_detector.USE_MODEL_NATIVE_CLASSES = True
  if class_mapping_filename.endswith('.json'):
  with open(class_mapping_filename,'r') as f:
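
For reference, the .json form described in this docstring maps int-strings to class names; a sketch of producing such a file (the class names here are hypothetical, for a non-MD YOLOv5 model):

```python
# Hedged sketch: a custom class-mapping .json of the form described above.
import json

class_mapping = {'0': 'deer', '1': 'boar', '2': 'fox'}  # hypothetical classes
with open('custom_classes.json', 'w') as f:
    json.dump(class_mapping, f, indent=1)

# Then: load_and_run_detector_batch(..., class_mapping_filename='custom_classes.json')
```
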
@@ -668,28 +685,28 @@ def _load_custom_class_mapping(class_mapping_filename):
  class_mapping = {str(k):v for k,v in class_mapping.items()}
  else:
  raise ValueError('Unrecognized class mapping file {}'.format(class_mapping_filename))
-
+
  print('Loaded custom class mapping:')
  print(class_mapping)
  run_detector.DEFAULT_DETECTOR_LABEL_MAP = class_mapping
  return class_mapping
-
-
+
+
  #%% Main function

- def load_and_run_detector_batch(model_file,
- image_file_names,
+ def load_and_run_detector_batch(model_file,
+ image_file_names,
  checkpoint_path=None,
  confidence_threshold=run_detector.DEFAULT_OUTPUT_CONFIDENCE_THRESHOLD,
- checkpoint_frequency=-1,
- results=None,
+ checkpoint_frequency=-1,
+ results=None,
  n_cores=1,
- use_image_queue=False,
- quiet=False,
- image_size=None,
- class_mapping_filename=None,
- include_image_size=False,
- include_image_timestamp=False,
+ use_image_queue=False,
+ quiet=False,
+ image_size=None,
+ class_mapping_filename=None,
+ include_image_size=False,
+ include_image_timestamp=False,
  include_exif_data=False,
  augment=False,
  force_model_download=False,
@@ -698,27 +715,26 @@ def load_and_run_detector_batch(model_file,
  preprocess_on_image_queue=default_preprocess_on_image_queue):
  """
  Load a model file and run it on a list of images.
-
+
  Args:
-
  model_file (str): path to model file, or supported model string (e.g. "MDV5A")
- image_file_names (list or str): list of strings (image filenames), a single image filename,
- a folder to recursively search for images in, or a .json or .txt file containing a list
+ image_file_names (list or str): list of strings (image filenames), a single image filename,
+ a folder to recursively search for images in, or a .json or .txt file containing a list
  of images.
- checkpoint_path (str, optional), path to use for checkpoints (if None, checkpointing
+ checkpoint_path (str, optional): path to use for checkpoints (if None, checkpointing
  is disabled)
  confidence_threshold (float, optional): only detections above this threshold are returned
- checkpoint_frequency (int, optional): int, write results to JSON checkpoint file every N
+ checkpoint_frequency (int, optional): int, write results to JSON checkpoint file every N
  images, -1 disabled checkpointing
- results (list, optional): list of dicts, existing results loaded from checkpoint; generally
+ results (list, optional): list of dicts, existing results loaded from checkpoint; generally
  not useful if you're using this function outside of the CLI
  n_cores (int, optional): number of parallel worker to use, ignored if we're running on a GPU
  use_image_queue (bool, optional): use a dedicated worker for image loading
  quiet (bool, optional): disable per-image console output
- image_size (tuple, optional): image size to use for inference, only mess with this
+ image_size (int, optional): image size to use for inference, only mess with this
  if (a) you're using a model other than MegaDetector or (b) you know what you're
  doing
- class_mapping_filename (str, optional), use a non-default class mapping supplied in a .json
+ class_mapping_filename (str, optional): use a non-default class mapping supplied in a .json
  file or YOLOv5 dataset.yaml file
  include_image_size (bool, optional): should we include image size in the output for each image?
  include_image_timestamp (bool, optional): should we include image timestamps in the output for each image?
727
743
  force_model_download (bool, optional): force downloading the model file if
728
744
  a named model (e.g. "MDV5A") is supplied, even if the local file already
729
745
  exists
730
- detector_options (dict, optional): key/value pairs that are interpreted differently
746
+ detector_options (dict, optional): key/value pairs that are interpreted differently
731
747
  by different detectors
732
748
  loader_workers (int, optional): number of loaders to use, only relevant when use_image_queue is True
733
-
749
+ preprocess_on_image_queue (bool, optional): if the image queue is enabled, should it handle
750
+ image loading and preprocessing (True), or just image loading (False)?
751
+
734
752
  Returns:
735
753
  results: list of dicts; each dict represents detections on one image
736
754
  """
737
-
755
+
738
756
  # Validate input arguments
739
757
  if n_cores is None or n_cores <= 0:
740
758
  n_cores = 1
741
-
759
+
760
+ if detector_options is None:
761
+ detector_options = {}
762
+
742
763
  if confidence_threshold is None:
743
764
  confidence_threshold=run_detector.DEFAULT_OUTPUT_CONFIDENCE_THRESHOLD
744
-
765
+
745
766
  # Disable checkpointing if checkpoint_path is None
746
767
  if checkpoint_frequency is None or checkpoint_path is None:
747
768
  checkpoint_frequency = -1
748
769
 
749
770
  if class_mapping_filename is not None:
750
771
  _load_custom_class_mapping(class_mapping_filename)
751
-
772
+
752
773
  # Handle the case where image_file_names is not yet actually a list
753
774
  if isinstance(image_file_names,str):
754
-
775
+
755
776
  # Find the images to score; images can be a directory, may need to recurse
756
777
  if os.path.isdir(image_file_names):
757
778
  image_dir = image_file_names
758
779
  image_file_names = path_utils.find_images(image_dir, True)
759
780
  print('{} image files found in folder {}'.format(len(image_file_names),image_dir))
760
-
781
+
761
782
  # A single file, or a list of image paths
762
783
  elif os.path.isfile(image_file_names):
763
784
  list_file = image_file_names
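
Per the docstring and the branching above, image_file_names can arrive in several forms; a sketch of the accepted inputs (paths hypothetical):

```python
# Hedged sketch: the accepted forms of image_file_names, per the Args
# list and the isdir/isfile handling above. Paths are placeholders.
from megadetector.detection.run_detector_batch import load_and_run_detector_batch

# 1. An explicit list of image paths
results = load_and_run_detector_batch('MDV5A', ['/data/a.jpg', '/data/b.jpg'])

# 2. A folder, searched recursively for images
results = load_and_run_detector_batch('MDV5A', '/data/camera-trap-images')

# 3. A .json or .txt file containing a list of image paths
results = load_and_run_detector_batch('MDV5A', '/data/image_list.json')
```
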
@@ -780,43 +801,45 @@ def load_and_run_detector_batch(model_file,
  'File {} supplied as [image_file_names] argument, but extension is neither .json nor .txt'\
  .format(
  list_file))
- else:
+ else:
  raise ValueError(
  '{} supplied as [image_file_names] argument, but it does not appear to be a file or folder'.format(
  image_file_names))
-
+
  if results is None:
  results = []

  already_processed = set([i['file'] for i in results])

- model_file = try_download_known_detector(model_file, force_download=force_model_download)
-
+ model_file = try_download_known_detector(model_file,
+ force_download=force_model_download,
+ verbose=verbose)
+
  print('GPU available: {}'.format(is_gpu_available(model_file)))
-
- if n_cores > 1 and is_gpu_available(model_file):
-
+
+ if (n_cores > 1) and is_gpu_available(model_file):
+
  print('Warning: multiple cores requested, but a GPU is available; parallelization across ' + \
  'GPUs is not currently supported, defaulting to one GPU')
  n_cores = 1

- if n_cores > 1 and use_image_queue:
-
+ if (n_cores > 1) and use_image_queue:
+
  print('Warning: multiple cores requested, but the image queue is enabled; parallelization ' + \
  'with the image queue is not currently supported, defaulting to one worker')
  n_cores = 1
-
+
  if use_image_queue:
-
+
  assert checkpoint_frequency < 0, \
  'Using an image queue is not currently supported when checkpointing is enabled'
  assert len(results) == 0, \
  'Using an image queue with results loaded from a checkpoint is not currently supported'
  assert n_cores <= 1
- results = run_detector_with_image_queue(image_file_names,
- model_file,
- confidence_threshold,
- quiet,
+ results = run_detector_with_image_queue(image_file_names,
+ model_file,
+ confidence_threshold,
+ quiet,
  image_size=image_size,
  include_image_size=include_image_size,
  include_image_timestamp=include_image_timestamp,
@@ -825,12 +848,14 @@ def load_and_run_detector_batch(model_file,
  detector_options=detector_options,
  loader_workers=loader_workers,
  preprocess_on_image_queue=preprocess_on_image_queue)
-
+
  elif n_cores <= 1:

  # Load the detector
  start_time = time.time()
- detector = load_detector(model_file,detector_options=detector_options,verbose=verbose)
+ detector = load_detector(model_file,
+ detector_options=detector_options,
+ verbose=verbose)
  elapsed = time.time() - start_time
  print('Loaded model in {}'.format(humanfriendly.format_timespan(elapsed)))

@@ -848,11 +873,11 @@ def load_and_run_detector_batch(model_file,

  count += 1

- result = process_image(im_file,
- detector,
- confidence_threshold,
- quiet=quiet,
- image_size=image_size,
+ result = process_image(im_file,
+ detector,
+ confidence_threshold,
+ quiet=quiet,
+ image_size=image_size,
  include_image_size=include_image_size,
  include_image_timestamp=include_image_timestamp,
  include_exif_data=include_exif_data,
@@ -861,97 +886,100 @@ def load_and_run_detector_batch(model_file,

  # Write a checkpoint if necessary
  if (checkpoint_frequency != -1) and ((count % checkpoint_frequency) == 0):
-
+
  print('Writing a new checkpoint after having processed {} images since '
  'last restart'.format(count))
-
+
  _write_checkpoint(checkpoint_path, results)
-
+
  else:
-
+
  # Multiprocessing is enabled at this point
-
+
  # When using multiprocessing, tell the workers to load the model on each
  # process, by passing the model_file string as the "model" argument to
  # process_images.
  detector = model_file

- print('Creating pool with {} cores'.format(n_cores))
+ print('Creating worker pool with {} cores'.format(n_cores))

  if len(already_processed) > 0:
  n_images_all = len(image_file_names)
  image_file_names = [fn for fn in image_file_names if fn not in already_processed]
  print('Loaded {} of {} images from checkpoint'.format(
  len(already_processed),n_images_all))
-
- # Divide images into chunks; we'll send one chunk to each worker process
+
+ # Divide images into chunks; we'll send one chunk to each worker process
  image_batches = list(_chunks_by_number_of_chunks(image_file_names, n_cores))
-
- pool = workerpool(n_cores)
-
- if checkpoint_path is not None:
-
- # Multiprocessing and checkpointing are both enabled at this point
-
- checkpoint_queue = Manager().Queue()
-
- # Pass the "results" array (which may already contain images loaded from an existing
- # checkpoint) to the checkpoint queue handler function, which will append results to
- # the list as they become available.
- checkpoint_thread = Thread(target=_checkpoint_queue_handler,
- args=(checkpoint_path, checkpoint_frequency,
- checkpoint_queue, results), daemon=True)
- checkpoint_thread.start()
-
- pool.map(partial(process_images,
- detector=detector,
- confidence_threshold=confidence_threshold,
- use_image_queue=False,
- quiet=quiet,
- image_size=image_size,
- checkpoint_queue=checkpoint_queue,
- include_image_size=include_image_size,
- include_image_timestamp=include_image_timestamp,
- include_exif_data=include_exif_data,
- augment=augment,
- detector_options=detector_options),
- image_batches)
-
- checkpoint_queue.put(None)

- else:
-
- # Multprocessing is enabled, but checkpointing is not
-
- new_results = pool.map(partial(process_images,
- detector=detector,
- confidence_threshold=confidence_threshold,
- use_image_queue=False,
- quiet=quiet,
- checkpoint_queue=None,
- image_size=image_size,
- include_image_size=include_image_size,
- include_image_timestamp=include_image_timestamp,
- include_exif_data=include_exif_data,
- augment=augment,
- detector_options=detector_options),
- image_batches)
-
- new_results = list(itertools.chain.from_iterable(new_results))
-
- # Append the results we just computed to "results", which is *usually* empty, but will
- # be non-empty if we resumed from a checkpoint
- results += new_results
-
- # ...if checkpointing is/isn't enabled
-
+ pool = None
  try:
- pool.close()
- except Exception as e:
- print('Warning: error closing multiprocessing pool:\n{}'.format(str(e)))
-
+ pool = workerpool(n_cores)
+
+ if checkpoint_path is not None:
+
+ # Multiprocessing and checkpointing are both enabled at this point
+
+ checkpoint_queue = Manager().Queue()
+
+ # Pass the "results" array (which may already contain images loaded from an existing
+ # checkpoint) to the checkpoint queue handler function, which will append results to
+ # the list as they become available.
+ checkpoint_thread = Thread(target=_checkpoint_queue_handler,
+ args=(checkpoint_path, checkpoint_frequency,
+ checkpoint_queue, results), daemon=True)
+ checkpoint_thread.start()
+
+ pool.map(partial(process_images,
+ detector=detector,
+ confidence_threshold=confidence_threshold,
+ use_image_queue=False,
+ quiet=quiet,
+ image_size=image_size,
+ checkpoint_queue=checkpoint_queue,
+ include_image_size=include_image_size,
+ include_image_timestamp=include_image_timestamp,
+ include_exif_data=include_exif_data,
+ augment=augment,
+ detector_options=detector_options),
+ image_batches)
+
+ checkpoint_queue.put(None)
+
+ else:
+
+ # Multprocessing is enabled, but checkpointing is not
+
+ new_results = pool.map(partial(process_images,
+ detector=detector,
+ confidence_threshold=confidence_threshold,
+ use_image_queue=False,
+ quiet=quiet,
+ checkpoint_queue=None,
+ image_size=image_size,
+ include_image_size=include_image_size,
+ include_image_timestamp=include_image_timestamp,
+ include_exif_data=include_exif_data,
+ augment=augment,
+ detector_options=detector_options),
+ image_batches)
+
+ new_results = list(itertools.chain.from_iterable(new_results))
+
+ # Append the results we just computed to "results", which is *usually* empty, but will
+ # be non-empty if we resumed from a checkpoint
+ results += new_results
+
+ # ...if checkpointing is/isn't enabled
+
+ finally:
+ if pool is not None:
+ pool.close()
+ pool.join()
+ print("Pool closed and joined for multi-core inference")
+
  # ...if we're running (1) with image queue, (2) on one core, or (3) on multiple cores
-
+
  # 'results' may have been modified in place, but we also return it for
  # backwards-compatibility.
  return results
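
The new try/finally arrangement above guarantees the worker pool is closed and joined even if inference raises; the shape of that pattern in isolation:

```python
# Sketch of the pool-cleanup pattern introduced above: create the pool
# inside try, close/join it unconditionally in finally.
from multiprocessing.pool import Pool

def run():
    pool = None
    try:
        pool = Pool(4)
        return pool.map(sum, [[1, 2], [3, 4]])
    finally:
        if pool is not None:
            pool.close()
            pool.join()

if __name__ == '__main__':
    print(run())  # [3, 7]
```
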
@@ -964,21 +992,21 @@ def _checkpoint_queue_handler(checkpoint_path, checkpoint_frequency, checkpoint_
  Thread function to accumulate results and write checkpoints when checkpointing and
  multiprocessing are both enabled.
  """
-
+
  result_count = 0
  while True:
- result = checkpoint_queue.get()
- if result is None:
- break
-
+ result = checkpoint_queue.get()
+ if result is None:
+ break
+
  result_count +=1
  results.append(result)

  if (checkpoint_frequency != -1) and (result_count % checkpoint_frequency == 0):
-
+
  print('Writing a new checkpoint after having processed {} images since '
  'last restart'.format(result_count))
-
+
  _write_checkpoint(checkpoint_path, results)


@@ -986,20 +1014,19 @@ def _write_checkpoint(checkpoint_path, results):
  """
  Writes the 'images' field in the dict 'results' to a json checkpoint file.
  """
-
- assert checkpoint_path is not None
-
+
+ assert checkpoint_path is not None
+
  # Back up any previous checkpoints, to protect against crashes while we're writing
  # the checkpoint file.
  checkpoint_tmp_path = None
  if os.path.isfile(checkpoint_path):
  checkpoint_tmp_path = checkpoint_path + '_tmp'
  shutil.copyfile(checkpoint_path,checkpoint_tmp_path)
-
+
  # Write the new checkpoint
- with open(checkpoint_path, 'w') as f:
- json.dump({'images': results}, f, indent=1, default=str)
-
+ ct_utils.write_json(checkpoint_path, {'images': results}, force_str=True)
+
  # Remove the backup checkpoint if it exists
  if checkpoint_tmp_path is not None:
  os.remove(checkpoint_tmp_path)
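
ct_utils.write_json() here replaces the inline json.dump() call; judging from the removed code, force_str=True presumably corresponds to json.dump's default=str (stringify values that aren't natively serializable). A hedged sketch of an equivalent helper under that assumption:

```python
# Hedged sketch: an equivalent of the ct_utils.write_json call above,
# assuming force_str=True maps to json.dump(..., default=str).
import json

def write_json(path, content, indent=1, force_str=False):
    with open(path, 'w') as f:
        json.dump(content, f, indent=indent,
                  default=str if force_str else None)

write_json('/tmp/checkpoint.json', {'images': []}, force_str=True)
```
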
@@ -1008,33 +1035,33 @@ def _write_checkpoint(checkpoint_path, results):
 def get_image_datetime(image):
     """
     Reads EXIF datetime from a PIL Image object.
-
+
     Args:
         image (Image): the PIL Image object from which we should read datetime information
-
+
     Returns:
         str: the EXIF datetime from [image] (a PIL Image object), if available, as a string;
         returns None if EXIF datetime is not available.
     """
-
+
     exif_tags = read_exif.read_pil_exif(image,exif_options)
-
+
     try:
         datetime_str = exif_tags['DateTimeOriginal']
         _ = time.strptime(datetime_str, '%Y:%m:%d %H:%M:%S')
         return datetime_str

     except Exception:
-        return None
+        return None

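get_image_datetime goes through the package's read_exif.read_pil_exif wrapper; for reference, the same DateTimeOriginal lookup can be done with Pillow alone. A sketch, assuming the tag lives in the standard Exif sub-IFD (0x8769) as it does for typical camera JPEGs:

```python
import time
from PIL import Image

def get_exif_datetime(image_path):
    """Return the EXIF DateTimeOriginal string, or None if absent/malformed."""
    with Image.open(image_path) as im:
        exif = im.getexif()
    # DateTimeOriginal (tag 0x9003) lives in the Exif sub-IFD (tag 0x8769)
    datetime_str = exif.get_ifd(0x8769).get(0x9003)
    try:
        # Same validation as the function above: EXIF uses 'YYYY:MM:DD HH:MM:SS'
        time.strptime(datetime_str, '%Y:%m:%d %H:%M:%S')
        return datetime_str
    except Exception:
        return None
```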
 
-def write_results_to_file(results,
-                          output_file,
-                          relative_path_base=None,
-                          detector_file=None,
-                          info=None,
+def write_results_to_file(results,
+                          output_file,
+                          relative_path_base=None,
+                          detector_file=None,
+                          info=None,
                           include_max_conf=False,
-                          custom_metadata=None,
+                          custom_metadata=None,
                           force_forward_slashes=True):
     """
     Writes list of detection results to JSON output file. Format matches:
@@ -1056,11 +1083,11 @@ def write_results_to_file(results,
             a dictionary, but no type/format checks are performed
         force_forward_slashes (bool, optional): convert all slashes in filenames within [results] to
             forward slashes
-
+
     Returns:
         dict: the MD-formatted dictionary that was written to [output_file]
     """
-
+
     if relative_path_base is not None:
         results_relative = []
         for r in results:
@@ -1076,68 +1103,67 @@ def write_results_to_file(results,
             r_converted['file'] = r_converted['file'].replace('\\','/')
             results_converted.append(r_converted)
         results = results_converted
-
+
     # The typical case: we need to build the 'info' struct
     if info is None:
-
-        info = {
+
+        info = {
             'detection_completion_time': datetime.now().strftime('%Y-%m-%d %H:%M:%S'),
-            'format_version': '1.4'
+            'format_version': '1.4'
         }
-
+
         if detector_file is not None:
             detector_filename = os.path.basename(detector_file)
-            detector_version = get_detector_version_from_filename(detector_filename)
+            detector_version = get_detector_version_from_filename(detector_filename,verbose=True)
             detector_metadata = get_detector_metadata_from_version_string(detector_version)
-            info['detector'] = detector_filename
+            info['detector'] = detector_filename
             info['detector_metadata'] = detector_metadata
         else:
             info['detector'] = 'unknown'
             info['detector_metadata'] = get_detector_metadata_from_version_string('unknown')
-
+
     # If the caller supplied the entire "info" struct
     else:
-
-        if detector_file is not None:
+
+        if detector_file is not None:
             print('Warning (write_results_to_file): info struct and detector file ' + \
                   'supplied, ignoring detector file')

     if custom_metadata is not None:
         info['custom_metadata'] = custom_metadata
-
+
     # The 'max_detection_conf' field used to be included by default, and it caused all kinds
     # of headaches, so it's no longer included unless the user explicitly requests it.
     if not include_max_conf:
         for im in results:
             if 'max_detection_conf' in im:
                 del im['max_detection_conf']
-
+
     # Sort results by filename; not required by the format, but convenient for consistency
     results = sort_list_of_dicts_by_key(results,'file')
-
+
     # Sort detections in descending order by confidence; not required by the format, but
     # convenient for consistency
     for r in results:
         if ('detections' in r) and (r['detections'] is not None):
             r['detections'] = sort_list_of_dicts_by_key(r['detections'], 'conf', reverse=True)
-
+
     final_output = {
         'images': results,
         'detection_categories': run_detector.DEFAULT_DETECTOR_LABEL_MAP,
         'info': info
     }
-
+
     # Create the folder where the output file belongs; this will fail if
     # this is a relative path with no folder component
     try:
         os.makedirs(os.path.dirname(output_file),exist_ok=True)
     except Exception:
         pass
-
-    with open(output_file, 'w') as f:
-        json.dump(final_output, f, indent=1, default=str)
+
+    ct_utils.write_json(output_file, final_output, force_str=True)
     print('Output file saved at {}'.format(output_file))
-
+
     return final_output

 # ...def write_results_to_file(...)
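For orientation, a minimal file produced by write_results_to_file looks like the following (format version 1.4). The category map mirrors run_detector.DEFAULT_DETECTOR_LABEL_MAP, boxes are normalized [x_min, y_min, width, height], and all values here are illustrative:

```python
example_output = {
    'images': [
        {
            'file': 'camera01/IMG_0001.JPG',
            'detections': [
                {'category': '1', 'conf': 0.96, 'bbox': [0.31, 0.42, 0.18, 0.22]}
            ]
        }
    ],
    'detection_categories': {'1': 'animal', '2': 'person', '3': 'vehicle'},
    'info': {
        'detection_completion_time': '2024-01-01 12:00:00',
        'format_version': '1.4',
        'detector': 'md_v5a.0.0.pt'
    }
}
```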
@@ -1146,15 +1172,15 @@ def write_results_to_file(results,
 #%% Interactive driver

 if False:
-
+
     pass

     #%%
-
+
     model_file = 'MDV5A'
     image_dir = r'g:\camera_traps\camera_trap_images'
     output_file = r'g:\temp\md-test.json'
-
+
     recursive = True
     output_relative_filenames = True
     include_max_conf = False
@@ -1162,7 +1188,7 @@ if False:
     image_size = None
     use_image_queue = False
     confidence_threshold = 0.0001
-    checkpoint_frequency = 5
+    checkpoint_frequency = 5
     checkpoint_path = None
     resume_from_checkpoint = 'auto'
     allow_checkpoint_overwrite = False
@@ -1172,11 +1198,11 @@ if False:
     include_image_timestamp = True
     include_exif_data = True
     overwrite_handling = None
-
+
     # Generate a command line
     cmd = 'python run_detector_batch.py "{}" "{}" "{}"'.format(
         model_file,image_dir,output_file)
-
+
     if recursive:
         cmd += ' --recursive'
     if output_relative_filenames:
@@ -1211,18 +1237,18 @@ if False:
         cmd += ' --include_exif_data'
     if overwrite_handling is not None:
         cmd += ' --overwrite_handling {}'.format(overwrite_handling)
-
+
     print(cmd)
     import clipboard; clipboard.copy(cmd)
-
-
+
+
     #%% Run inference interactively
-
-    image_file_names = path_utils.find_images(image_dir, recursive=False)
+
+    image_file_names = path_utils.find_images(image_dir, recursive=False)
     results = None
-
+
     start_time = time.time()
-
+
     results = load_and_run_detector_batch(model_file=model_file,
                                           image_file_names=image_file_names,
                                           checkpoint_path=checkpoint_path,
@@ -1233,21 +1259,22 @@ if False:
                                           use_image_queue=use_image_queue,
                                           quiet=quiet,
                                           image_size=image_size)
-
+
     elapsed = time.time() - start_time
-
+
     print('Finished inference in {}'.format(humanfriendly.format_timespan(elapsed)))

-
+
 #%% Command-line driver

-def main():
-
+def main(): # noqa
+
     parser = argparse.ArgumentParser(
         description='Module to run a TF/PT animal detection model on lots of images')
     parser.add_argument(
         'detector_file',
-        help='Path to detector model file (.pb or .pt). Can also be the strings "MDV4", "MDV5A", or "MDV5B" to request automatic download.')
+        help='Path to detector model file (.pb or .pt). Can also be the strings "MDV4", ' + \
+             '"MDV5A", or "MDV5B" to request automatic download.')
     parser.add_argument(
         'image_file',
         help=\
@@ -1279,7 +1306,7 @@ def main():
         '--image_size',
         type=int,
         default=None,
-        help=('Force image resizing to a specific integer size on the long axis (not recommended to change this)'))
+        help=('Force image resizing to a specific integer size on the long axis (not recommended to change this)'))
     parser.add_argument(
         '--augment',
         action='store_true',
@@ -1316,7 +1343,7 @@ def main():
         type=str,
         default=None,
         help='File name to which checkpoints will be written if checkpoint_frequency is > 0, ' + \
-             'defaults to md_checkpoint_[date].json in the same folder as the output file')
+             'defaults to md_checkpoint_[date].json in the same folder as the output file')
     parser.add_argument(
         '--resume_from_checkpoint',
         type=str,
@@ -1367,7 +1394,7 @@ def main():
         type=str,
         default='overwrite',
         help='What should we do if the output file exists? overwrite/skip/error (default overwrite)'
-        )
+        )
     parser.add_argument(
         '--force_model_download',
         action='store_true',
@@ -1387,28 +1414,29 @@ def main():
         metavar='KEY=VALUE',
         default='',
         help='Detector-specific options, as a space-separated list of key-value pairs')
-
+
     if len(sys.argv[1:]) == 0:
         parser.print_help()
         parser.exit()

     args = parser.parse_args()
-
+
     global verbose
     global use_threads_for_queue
-
+
     if args.verbose:
         verbose = True
     if args.use_threads_for_queue:
         use_threads_for_queue = True
-
+
     detector_options = parse_kvp_list(args.detector_options)
-
-    # If the specified detector file is really the name of a known model, find
+
+    # If the specified detector file is really the name of a known model, find
     # (and possibly download) that model
-    args.detector_file = try_download_known_detector(args.detector_file,
-                                                     force_download=args.force_model_download)
-
+    args.detector_file = try_download_known_detector(args.detector_file,
+                                                     force_download=args.force_model_download,
+                                                     verbose=verbose)
+
     assert os.path.exists(args.detector_file), \
         'detector file {} does not exist'.format(args.detector_file)
     assert 0.0 <= args.threshold <= 1.0, 'Confidence threshold needs to be between 0 and 1'
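--detector_options arrives as a space-separated list of KEY=VALUE pairs and is parsed by parse_kvp_list. A plausible sketch of that parsing, assuming the helper takes the raw string; the real implementation lives in the package's utility module and may differ:

```python
def parse_kvp_list(kvp_string):
    # Parse 'k1=v1 k2=v2' into {'k1': 'v1', 'k2': 'v2'}
    options = {}
    for token in kvp_string.split():
        assert '=' in token, 'Illegal key-value pair: {}'.format(token)
        key, value = token.split('=', 1)
        options[key] = value
    return options

print(parse_kvp_list('foo=bar verbose=true'))  # {'foo': 'bar', 'verbose': 'true'}
```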
@@ -1439,12 +1467,12 @@ def main():

     if len(output_dir) > 0:
         os.makedirs(output_dir,exist_ok=True)
-
+
     assert not os.path.isdir(args.output_file), 'Specified output file is a directory'
-
+
     if args.class_mapping_filename is not None:
         _load_custom_class_mapping(args.class_mapping_filename)
-
+
     # Load the checkpoint if available
     #
     # File paths in the checkpoint are always absolute paths; conversion to relative paths
@@ -1463,7 +1491,7 @@ def main():
                 len(checkpoint_files),output_dir))
             checkpoint_files = sorted(checkpoint_files)
             checkpoint_file_relative = checkpoint_files[-1]
-            checkpoint_file = os.path.join(output_dir,checkpoint_file_relative)
+            checkpoint_file = os.path.join(output_dir,checkpoint_file_relative)
         else:
             checkpoint_file = args.resume_from_checkpoint
             assert os.path.exists(checkpoint_file), \
@@ -1483,7 +1511,7 @@ def main():
     if os.path.isdir(args.image_file):
         image_file_names = path_utils.find_images(args.image_file, args.recursive)
         if len(image_file_names) > 0:
-            print('{} image files found in the input directory'.format(len(image_file_names)))
+            print('{} image files found in the input directory'.format(len(image_file_names)))
         else:
             if (args.recursive):
                 print('No image files found in directory {}, exiting'.format(args.image_file))
@@ -1492,14 +1520,14 @@ def main():
                       '--recursive?'.format(
                           args.image_file))
             return
-
+
     # A json list of image paths
-    elif os.path.isfile(args.image_file) and args.image_file.endswith('.json'):
+    elif os.path.isfile(args.image_file) and args.image_file.endswith('.json'):
         with open(args.image_file) as f:
             image_file_names = json.load(f)
         print('Loaded {} image filenames from .json list file {}'.format(
             len(image_file_names),args.image_file))
-
+
     # A text list of image paths
     elif os.path.isfile(args.image_file) and args.image_file.endswith('.txt'):
         with open(args.image_file) as f:
@@ -1507,51 +1535,51 @@ def main():
             image_file_names = [fn.strip() for fn in image_file_names if len(fn.strip()) > 0]
         print('Loaded {} image filenames from .txt list file {}'.format(
             len(image_file_names),args.image_file))
-
+
     # A single image file
     elif os.path.isfile(args.image_file) and path_utils.is_image_file(args.image_file):
         image_file_names = [args.image_file]
         print('Processing image {}'.format(args.image_file))
-
-    else:
+
+    else:
         raise ValueError('image_file specified is not a directory, a json list, or an image file '
                          '(or does not have a recognizable extension).')

-    # At this point, regardless of how they were specified, [image_file_names] is a list of
+    # At this point, regardless of how they were specified, [image_file_names] is a list of
     # absolute image paths.
     assert len(image_file_names) > 0, 'Specified image_file does not point to valid image files'
-
+
     # Convert to forward slashes to facilitate comparison with previous results
     image_file_names = [fn.replace('\\','/') for fn in image_file_names]
-
+
     # We can head off many problems related to incorrect command line formulation if we confirm
-    # that one image exists before proceeding. The use of the first image for this test is
+    # that one image exists before proceeding. The use of the first image for this test is
     # arbitrary.
     assert os.path.exists(image_file_names[0]), \
         'The first image to be processed does not exist at {}'.format(image_file_names[0])

     # Possibly load results from a previous pass
     previous_results = None
-
+
     if args.previous_results_file is not None:
-
+
         assert os.path.isfile(args.previous_results_file), \
             'Could not find previous results file {}'.format(args.previous_results_file)
         with open(args.previous_results_file,'r') as f:
             previous_results = json.load(f)
-
+
         assert previous_results['detection_categories'] == run_detector.DEFAULT_DETECTOR_LABEL_MAP, \
             "Can't merge previous results when those results use a different set of detection categories"
-
+
         print('Loaded previous results for {} images from {}'.format(
             len(previous_results['images']), args.previous_results_file))
-
-        # Convert previous result filenames to absolute paths if necessary
+
+        # Convert previous result filenames to absolute paths if necessary
         #
-        # We asserted above to make sure that we are using relative paths and processing a
+        # We asserted above to make sure that we are using relative paths and processing a
         # folder, but just to be super-clear...
         assert os.path.isdir(args.image_file)
-
+
         previous_image_files_set = set()
         for im in previous_results['images']:
             assert not os.path.isabs(im['file']), \
@@ -1559,54 +1587,53 @@ def main():
             fn_abs = os.path.join(args.image_file,im['file']).replace('\\','/')
             # Absolute paths are expected at the final output stage below
             im['file'] = fn_abs
-            previous_image_files_set.add(fn_abs)
-
+            previous_image_files_set.add(fn_abs)
+
         image_file_names_to_keep = []
         for fn_abs in image_file_names:
             if fn_abs not in previous_image_files_set:
                 image_file_names_to_keep.append(fn_abs)
-
+
         print('Based on previous results file, processing {} of {} images'.format(
             len(image_file_names_to_keep), len(image_file_names)))
-
+
         image_file_names = image_file_names_to_keep
-
+
     # ...if we're handling previous results
-
+
     # Test that we can write to the output_file's dir if checkpointing requested
     if args.checkpoint_frequency != -1:
-
+
         if args.checkpoint_path is not None:
             checkpoint_path = args.checkpoint_path
         else:
             checkpoint_path = os.path.join(output_dir,
                                            'md_checkpoint_{}.json'.format(
                                                datetime.now().strftime("%Y%m%d%H%M%S")))
-
+
         # Don't overwrite existing checkpoint files, this is a sure-fire way to eventually
         # erase someone's checkpoint.
         if (checkpoint_path is not None) and (not args.allow_checkpoint_overwrite) \
             and (args.resume_from_checkpoint is None):
-
+
             assert not os.path.isfile(checkpoint_path), \
                 f'Checkpoint path {checkpoint_path} already exists, delete or move it before ' + \
                 're-using the same checkpoint path, or specify --allow_checkpoint_overwrite'

-
+
         # Confirm that we can write to the checkpoint path; this avoids issues where
         # we crash after several thousand images.
         #
-        # But actually, commenting this out for now... the scenario where we are resuming from a
+        # But actually, commenting this out for now... the scenario where we are resuming from a
         # checkpoint, then immediately overwrite that checkpoint with empty data is higher-risk
         # than the annoyance of crashing a few minutes after starting a job.
         if False:
-            with open(checkpoint_path, 'w') as f:
-                json.dump({'images': []}, f)
-
+            ct_utils.write_json(checkpoint_path, {'images': []}, indent=None)
+
         print('The checkpoint file will be written to {}'.format(checkpoint_path))
-
+
     else:
-
+
         if args.checkpoint_path is not None:
             print('Warning: checkpointing disabled because checkpoint_frequency is -1, ' + \
                   'but a checkpoint path was specified')
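Putting the checkpoint options together: the interactive driver earlier in the file builds command lines the same way, so a long job with periodic checkpointing and auto-resume might be launched with something like the command below. Paths and frequency are examples, and the flags are the ones handled by the parser and the logic above:

```python
# Illustrative command line only; adjust paths and frequency for a real run.
cmd = ('python run_detector_batch.py MDV5A "/data/images" "/data/out.json" '
       '--recursive --checkpoint_frequency 1000 --resume_from_checkpoint auto')
print(cmd)
```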
@@ -1641,23 +1668,23 @@ def main():
         len(results),humanfriendly.format_timespan(elapsed),images_per_second))

     relative_path_base = None
-
-    # We asserted above to make sure that if output_relative_filenames is set,
+
+    # We asserted above to make sure that if output_relative_filenames is set,
     # args.image_file is a folder, but we'll double-check for clarity.
     if args.output_relative_filenames:
         assert os.path.isdir(args.image_file)
         relative_path_base = args.image_file
-
+
     # Merge results from a previous file if necessary
     if previous_results is not None:
         previous_filenames_set = set([im['file'] for im in previous_results['images']])
         new_filenames_set = set([im['file'] for im in results])
         assert len(previous_filenames_set.intersection(new_filenames_set)) == 0, \
             'Previous results handling error: redundant image filenames'
-        results.extend(previous_results['images'])
-
-    write_results_to_file(results,
-                          args.output_file,
+        results.extend(previous_results['images'])
+
+    write_results_to_file(results,
+                          args.output_file,
                           relative_path_base=relative_path_base,
                           detector_file=args.detector_file,
                           include_max_conf=args.include_max_conf)
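The merge step above relies on a simple invariant: the previous-results file and the new run must cover disjoint filename sets (enforced by the assert), so extending the list can never produce duplicate image entries. A tiny worked example of that invariant, with made-up filenames:

```python
previous = [{'file': 'a.jpg'}, {'file': 'b.jpg'}]   # from --previous_results_file
new = [{'file': 'c.jpg'}]                           # just computed
assert not {im['file'] for im in previous} & {im['file'] for im in new}
merged = new + previous
print([im['file'] for im in merged])  # ['c.jpg', 'a.jpg', 'b.jpg']
```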