megadetector 5.0.28__py3-none-any.whl → 10.0.0__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- megadetector/api/batch_processing/integration/digiKam/xmp_integration.py +2 -2
- megadetector/api/batch_processing/integration/eMammal/test_scripts/push_annotations_to_emammal.py +1 -1
- megadetector/api/batch_processing/integration/eMammal/test_scripts/select_images_for_testing.py +1 -1
- megadetector/classification/aggregate_classifier_probs.py +3 -3
- megadetector/classification/analyze_failed_images.py +5 -5
- megadetector/classification/cache_batchapi_outputs.py +5 -5
- megadetector/classification/create_classification_dataset.py +11 -12
- megadetector/classification/crop_detections.py +10 -10
- megadetector/classification/csv_to_json.py +8 -8
- megadetector/classification/detect_and_crop.py +13 -15
- megadetector/classification/efficientnet/model.py +8 -8
- megadetector/classification/efficientnet/utils.py +6 -5
- megadetector/classification/evaluate_model.py +7 -7
- megadetector/classification/identify_mislabeled_candidates.py +6 -6
- megadetector/classification/json_to_azcopy_list.py +1 -1
- megadetector/classification/json_validator.py +29 -32
- megadetector/classification/map_classification_categories.py +9 -9
- megadetector/classification/merge_classification_detection_output.py +12 -9
- megadetector/classification/prepare_classification_script.py +19 -19
- megadetector/classification/prepare_classification_script_mc.py +26 -26
- megadetector/classification/run_classifier.py +4 -4
- megadetector/classification/save_mislabeled.py +6 -6
- megadetector/classification/train_classifier.py +1 -1
- megadetector/classification/train_classifier_tf.py +9 -9
- megadetector/classification/train_utils.py +10 -10
- megadetector/data_management/annotations/annotation_constants.py +1 -2
- megadetector/data_management/camtrap_dp_to_coco.py +79 -46
- megadetector/data_management/cct_json_utils.py +103 -103
- megadetector/data_management/cct_to_md.py +49 -49
- megadetector/data_management/cct_to_wi.py +33 -33
- megadetector/data_management/coco_to_labelme.py +75 -75
- megadetector/data_management/coco_to_yolo.py +210 -193
- megadetector/data_management/databases/add_width_and_height_to_db.py +86 -12
- megadetector/data_management/databases/combine_coco_camera_traps_files.py +40 -40
- megadetector/data_management/databases/integrity_check_json_db.py +228 -200
- megadetector/data_management/databases/subset_json_db.py +33 -33
- megadetector/data_management/generate_crops_from_cct.py +88 -39
- megadetector/data_management/get_image_sizes.py +54 -49
- megadetector/data_management/labelme_to_coco.py +133 -125
- megadetector/data_management/labelme_to_yolo.py +159 -73
- megadetector/data_management/lila/create_lila_blank_set.py +81 -83
- megadetector/data_management/lila/create_lila_test_set.py +32 -31
- megadetector/data_management/lila/create_links_to_md_results_files.py +18 -18
- megadetector/data_management/lila/download_lila_subset.py +21 -24
- megadetector/data_management/lila/generate_lila_per_image_labels.py +365 -107
- megadetector/data_management/lila/get_lila_annotation_counts.py +35 -33
- megadetector/data_management/lila/get_lila_image_counts.py +22 -22
- megadetector/data_management/lila/lila_common.py +73 -70
- megadetector/data_management/lila/test_lila_metadata_urls.py +28 -19
- megadetector/data_management/mewc_to_md.py +344 -340
- megadetector/data_management/ocr_tools.py +262 -255
- megadetector/data_management/read_exif.py +249 -227
- megadetector/data_management/remap_coco_categories.py +90 -28
- megadetector/data_management/remove_exif.py +81 -21
- megadetector/data_management/rename_images.py +187 -187
- megadetector/data_management/resize_coco_dataset.py +588 -120
- megadetector/data_management/speciesnet_to_md.py +41 -41
- megadetector/data_management/wi_download_csv_to_coco.py +55 -55
- megadetector/data_management/yolo_output_to_md_output.py +248 -122
- megadetector/data_management/yolo_to_coco.py +333 -191
- megadetector/detection/change_detection.py +832 -0
- megadetector/detection/process_video.py +340 -337
- megadetector/detection/pytorch_detector.py +358 -278
- megadetector/detection/run_detector.py +399 -186
- megadetector/detection/run_detector_batch.py +404 -377
- megadetector/detection/run_inference_with_yolov5_val.py +340 -327
- megadetector/detection/run_tiled_inference.py +257 -249
- megadetector/detection/tf_detector.py +24 -24
- megadetector/detection/video_utils.py +332 -295
- megadetector/postprocessing/add_max_conf.py +19 -11
- megadetector/postprocessing/categorize_detections_by_size.py +45 -45
- megadetector/postprocessing/classification_postprocessing.py +468 -433
- megadetector/postprocessing/combine_batch_outputs.py +23 -23
- megadetector/postprocessing/compare_batch_results.py +590 -525
- megadetector/postprocessing/convert_output_format.py +106 -102
- megadetector/postprocessing/create_crop_folder.py +347 -147
- megadetector/postprocessing/detector_calibration.py +173 -168
- megadetector/postprocessing/generate_csv_report.py +508 -499
- megadetector/postprocessing/load_api_results.py +48 -27
- megadetector/postprocessing/md_to_coco.py +133 -102
- megadetector/postprocessing/md_to_labelme.py +107 -90
- megadetector/postprocessing/md_to_wi.py +40 -40
- megadetector/postprocessing/merge_detections.py +92 -114
- megadetector/postprocessing/postprocess_batch_results.py +319 -301
- megadetector/postprocessing/remap_detection_categories.py +91 -38
- megadetector/postprocessing/render_detection_confusion_matrix.py +214 -205
- megadetector/postprocessing/repeat_detection_elimination/find_repeat_detections.py +57 -57
- megadetector/postprocessing/repeat_detection_elimination/remove_repeat_detections.py +27 -28
- megadetector/postprocessing/repeat_detection_elimination/repeat_detections_core.py +704 -679
- megadetector/postprocessing/separate_detections_into_folders.py +226 -211
- megadetector/postprocessing/subset_json_detector_output.py +265 -262
- megadetector/postprocessing/top_folders_to_bottom.py +45 -45
- megadetector/postprocessing/validate_batch_results.py +70 -70
- megadetector/taxonomy_mapping/map_lila_taxonomy_to_wi_taxonomy.py +52 -52
- megadetector/taxonomy_mapping/map_new_lila_datasets.py +18 -19
- megadetector/taxonomy_mapping/prepare_lila_taxonomy_release.py +54 -33
- megadetector/taxonomy_mapping/preview_lila_taxonomy.py +67 -67
- megadetector/taxonomy_mapping/retrieve_sample_image.py +16 -16
- megadetector/taxonomy_mapping/simple_image_download.py +8 -8
- megadetector/taxonomy_mapping/species_lookup.py +156 -74
- megadetector/taxonomy_mapping/taxonomy_csv_checker.py +14 -14
- megadetector/taxonomy_mapping/taxonomy_graph.py +10 -10
- megadetector/taxonomy_mapping/validate_lila_category_mappings.py +13 -13
- megadetector/utils/ct_utils.py +1049 -211
- megadetector/utils/directory_listing.py +21 -77
- megadetector/utils/gpu_test.py +22 -22
- megadetector/utils/md_tests.py +632 -529
- megadetector/utils/path_utils.py +1520 -431
- megadetector/utils/process_utils.py +41 -41
- megadetector/utils/split_locations_into_train_val.py +62 -62
- megadetector/utils/string_utils.py +148 -27
- megadetector/utils/url_utils.py +489 -176
- megadetector/utils/wi_utils.py +2658 -2526
- megadetector/utils/write_html_image_list.py +137 -137
- megadetector/visualization/plot_utils.py +34 -30
- megadetector/visualization/render_images_with_thumbnails.py +39 -74
- megadetector/visualization/visualization_utils.py +487 -435
- megadetector/visualization/visualize_db.py +232 -198
- megadetector/visualization/visualize_detector_output.py +82 -76
- {megadetector-5.0.28.dist-info → megadetector-10.0.0.dist-info}/METADATA +5 -2
- megadetector-10.0.0.dist-info/RECORD +139 -0
- {megadetector-5.0.28.dist-info → megadetector-10.0.0.dist-info}/WHEEL +1 -1
- megadetector/api/batch_processing/api_core/__init__.py +0 -0
- megadetector/api/batch_processing/api_core/batch_service/__init__.py +0 -0
- megadetector/api/batch_processing/api_core/batch_service/score.py +0 -439
- megadetector/api/batch_processing/api_core/server.py +0 -294
- megadetector/api/batch_processing/api_core/server_api_config.py +0 -97
- megadetector/api/batch_processing/api_core/server_app_config.py +0 -55
- megadetector/api/batch_processing/api_core/server_batch_job_manager.py +0 -220
- megadetector/api/batch_processing/api_core/server_job_status_table.py +0 -149
- megadetector/api/batch_processing/api_core/server_orchestration.py +0 -360
- megadetector/api/batch_processing/api_core/server_utils.py +0 -88
- megadetector/api/batch_processing/api_core_support/__init__.py +0 -0
- megadetector/api/batch_processing/api_core_support/aggregate_results_manually.py +0 -46
- megadetector/api/batch_processing/api_support/__init__.py +0 -0
- megadetector/api/batch_processing/api_support/summarize_daily_activity.py +0 -152
- megadetector/api/batch_processing/data_preparation/__init__.py +0 -0
- megadetector/api/synchronous/__init__.py +0 -0
- megadetector/api/synchronous/api_core/animal_detection_api/__init__.py +0 -0
- megadetector/api/synchronous/api_core/animal_detection_api/api_backend.py +0 -151
- megadetector/api/synchronous/api_core/animal_detection_api/api_frontend.py +0 -263
- megadetector/api/synchronous/api_core/animal_detection_api/config.py +0 -35
- megadetector/api/synchronous/api_core/tests/__init__.py +0 -0
- megadetector/api/synchronous/api_core/tests/load_test.py +0 -110
- megadetector/data_management/importers/add_nacti_sizes.py +0 -52
- megadetector/data_management/importers/add_timestamps_to_icct.py +0 -79
- megadetector/data_management/importers/animl_results_to_md_results.py +0 -158
- megadetector/data_management/importers/auckland_doc_test_to_json.py +0 -373
- megadetector/data_management/importers/auckland_doc_to_json.py +0 -201
- megadetector/data_management/importers/awc_to_json.py +0 -191
- megadetector/data_management/importers/bellevue_to_json.py +0 -272
- megadetector/data_management/importers/cacophony-thermal-importer.py +0 -793
- megadetector/data_management/importers/carrizo_shrubfree_2018.py +0 -269
- megadetector/data_management/importers/carrizo_trail_cam_2017.py +0 -289
- megadetector/data_management/importers/cct_field_adjustments.py +0 -58
- megadetector/data_management/importers/channel_islands_to_cct.py +0 -913
- megadetector/data_management/importers/eMammal/copy_and_unzip_emammal.py +0 -180
- megadetector/data_management/importers/eMammal/eMammal_helpers.py +0 -249
- megadetector/data_management/importers/eMammal/make_eMammal_json.py +0 -223
- megadetector/data_management/importers/ena24_to_json.py +0 -276
- megadetector/data_management/importers/filenames_to_json.py +0 -386
- megadetector/data_management/importers/helena_to_cct.py +0 -283
- megadetector/data_management/importers/idaho-camera-traps.py +0 -1407
- megadetector/data_management/importers/idfg_iwildcam_lila_prep.py +0 -294
- megadetector/data_management/importers/import_desert_lion_conservation_camera_traps.py +0 -387
- megadetector/data_management/importers/jb_csv_to_json.py +0 -150
- megadetector/data_management/importers/mcgill_to_json.py +0 -250
- megadetector/data_management/importers/missouri_to_json.py +0 -490
- megadetector/data_management/importers/nacti_fieldname_adjustments.py +0 -79
- megadetector/data_management/importers/noaa_seals_2019.py +0 -181
- megadetector/data_management/importers/osu-small-animals-to-json.py +0 -364
- megadetector/data_management/importers/pc_to_json.py +0 -365
- megadetector/data_management/importers/plot_wni_giraffes.py +0 -123
- megadetector/data_management/importers/prepare_zsl_imerit.py +0 -131
- megadetector/data_management/importers/raic_csv_to_md_results.py +0 -416
- megadetector/data_management/importers/rspb_to_json.py +0 -356
- megadetector/data_management/importers/save_the_elephants_survey_A.py +0 -320
- megadetector/data_management/importers/save_the_elephants_survey_B.py +0 -329
- megadetector/data_management/importers/snapshot_safari_importer.py +0 -758
- megadetector/data_management/importers/snapshot_serengeti_lila.py +0 -1067
- megadetector/data_management/importers/snapshotserengeti/make_full_SS_json.py +0 -150
- megadetector/data_management/importers/snapshotserengeti/make_per_season_SS_json.py +0 -153
- megadetector/data_management/importers/sulross_get_exif.py +0 -65
- megadetector/data_management/importers/timelapse_csv_set_to_json.py +0 -490
- megadetector/data_management/importers/ubc_to_json.py +0 -399
- megadetector/data_management/importers/umn_to_json.py +0 -507
- megadetector/data_management/importers/wellington_to_json.py +0 -263
- megadetector/data_management/importers/wi_to_json.py +0 -442
- megadetector/data_management/importers/zamba_results_to_md_results.py +0 -180
- megadetector/data_management/lila/add_locations_to_island_camera_traps.py +0 -101
- megadetector/data_management/lila/add_locations_to_nacti.py +0 -151
- megadetector/utils/azure_utils.py +0 -178
- megadetector/utils/sas_blob_utils.py +0 -509
- megadetector-5.0.28.dist-info/RECORD +0 -209
- /megadetector/{api/batch_processing/__init__.py → __init__.py} +0 -0
- {megadetector-5.0.28.dist-info → megadetector-10.0.0.dist-info}/licenses/LICENSE +0 -0
- {megadetector-5.0.28.dist-info → megadetector-10.0.0.dist-info}/top_level.txt +0 -0
megadetector/detection/run_tiled_inference.py

(In the hunks below, most paired removed/added lines are identical on screen; they appear to differ only in trailing whitespace, which the 10.0.0 release strips.)

@@ -6,15 +6,15 @@ run_tiled_inference.py
 
 Runs inference on a folder, first splitting each image up into tiles of size
 MxN (typically the native inference size of your detector), writing those
-tiles out to a temporary folder, then de-duplicating the resulting detections before
+tiles out to a temporary folder, then de-duplicating the resulting detections before
 merging them back into a set of detections that make sense on the original images.
 
-This approach will likely fail to detect very large animals, so if you expect both large
-and small animals (in terms of pixel size), this script is best used in
+This approach will likely fail to detect very large animals, so if you expect both large
+and small animals (in terms of pixel size), this script is best used in
 conjunction with a traditional inference pass that looks at whole images.
 
 Currently requires temporary storage at least as large as the input data, generally
-a lot more than that (depending on the overlap between adjacent tiles). This is
+a lot more than that (depending on the overlap between adjacent tiles). This is
 inefficient, but easy to debug.
 
 Programmatic invocation supports using YOLOv5's inference scripts (and test-time
@@ -28,6 +28,8 @@ import os
 import json
 import tempfile
 import uuid
+import sys
+import argparse
 
 from tqdm import tqdm
 
@@ -63,59 +65,59 @@ def get_patch_boundaries(image_size,patch_size,patch_stride=None):
     """
     Computes a list of patch starting coordinates (x,y) given an image size (w,h)
    and a stride (x,y)
-
+
    Patch size is guaranteed, but the stride may deviate to make sure all pixels are covered.
    I.e., we move by regular strides until the current patch walks off the right/bottom,
    at which point it backs up to one patch from the end. So if your image is 15
-   pixels wide and you have a stride of 10 pixels, you will get starting positions
+   pixels wide and you have a stride of 10 pixels, you will get starting positions
    of 0 (from 0 to 9) and 5 (from 5 to 14).
-
+
    Args:
        image_size (tuple): size of the image you want to divide into patches, as a length-2 tuple (w,h)
        patch_size (tuple): patch size into which you want to divide an image, as a length-2 tuple (w,h)
-       patch_stride (tuple or float, optional): stride between patches, as a length-2 tuple (x,y), or a
-           float; if this is a float, it's interpreted as the stride relative to the patch size
+       patch_stride (tuple or float, optional): stride between patches, as a length-2 tuple (x,y), or a
+           float; if this is a float, it's interpreted as the stride relative to the patch size
            (0.1 == 10% stride). Defaults to half the patch size.
 
    Returns:
-       list: list of length-2 tuples, each representing the x/y start position of a patch
+       list: list of length-2 tuples, each representing the x/y start position of a patch
    """
-
+
    if patch_stride is None:
        patch_stride = (round(patch_size[0]*(1.0-default_patch_overlap)),
                        round(patch_size[1]*(1.0-default_patch_overlap)))
    elif isinstance(patch_stride,float):
        patch_stride = (round(patch_size[0]*(patch_stride)),
                        round(patch_size[1]*(patch_stride)))
-
+
    image_width = image_size[0]
    image_height = image_size[1]
-
+
    assert patch_size[0] <= image_size[0], 'Patch width {} is larger than image width {}'.format(
        patch_size[0],image_size[0])
    assert patch_size[1] <= image_size[1], 'Patch height {} is larger than image height {}'.format(
        patch_size[1],image_size[1])
-
+
    def add_patch_row(patch_start_positions,y_start):
        """
        Add one row to our list of patch start positions, i.e.
        loop over all columns.
        """
-
+
        x_start = 0; x_end = x_start + patch_size[0] - 1
-
+
        while(True):
-
+
            patch_start_positions.append([x_start,y_start])
-
+
            # If this patch put us right at the end of the last column, we're done
            if x_end == image_width - 1:
                break
-
+
            # Move one patch to the right
            x_start += patch_stride[0]
            x_end = x_start + patch_size[0] - 1
-
+
            # If this patch flows over the edge, add one more patch to cover
            # the pixels on the end, then we're done.
            if x_end > (image_width - 1):
@@ -124,27 +126,27 @@ def get_patch_boundaries(image_size,patch_size,patch_stride=None):
                x_end = x_start + patch_size[0] - 1
                patch_start_positions.append([x_start,y_start])
                break
-
+
        # ...for each column
-
+
        return patch_start_positions
-
+
    patch_start_positions = []
-
+
    y_start = 0; y_end = y_start + patch_size[1] - 1
-
+
    while(True):
-
+
        patch_start_positions = add_patch_row(patch_start_positions,y_start)
-
+
        # If this patch put us right at the bottom of the last row, we're done
        if y_end == image_height - 1:
            break
-
+
        # Move one patch down
        y_start += patch_stride[1]
        y_end = y_start + patch_size[1] - 1
-
+
        # If this patch flows over the bottom, add one more patch to cover
        # the pixels at the bottom, then we're done
        if y_end > (image_height - 1):
@@ -153,24 +155,24 @@ def get_patch_boundaries(image_size,patch_size,patch_stride=None):
            y_end = y_start + patch_size[1] - 1
            patch_start_positions = add_patch_row(patch_start_positions,y_start)
            break
-
+
    # ...for each row
-
+
    for p in patch_start_positions:
        assert p[0] >= 0 and p[1] >= 0 and p[0] <= image_width and p[1] <= image_height, \
            'Patch generation error (illegal patch {})'.format(p)
-
+
    # The last patch should always end at the bottom-right of the image
    assert patch_start_positions[-1][0]+patch_size[0] == image_width, \
        'Patch generation error (last patch does not end on the right)'
    assert patch_start_positions[-1][1]+patch_size[1] == image_height, \
        'Patch generation error (last patch does not end at the bottom)'
-
+
    # All patches should be unique
    patch_start_positions_tuples = [tuple(x) for x in patch_start_positions]
    assert len(patch_start_positions_tuples) == len(set(patch_start_positions_tuples)), \
        'Patch generation error (duplicate start position)'
-
+
    return patch_start_positions
 
 # ...get_patch_boundaries()
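The changes to get_patch_boundaries above are whitespace-only, but the stride rule its docstring describes is worth seeing in isolation. A minimal, hypothetical 1-D sketch (not code from the package): advance by regular strides, and if the final patch would overhang the image, back it up so it ends exactly at the last pixel.

# Hypothetical 1-D illustration of the documented stride behavior
def patch_starts_1d(length, patch, stride):
    starts = [0]
    while starts[-1] + patch < length:
        next_start = starts[-1] + stride
        if next_start + patch > length:
            # The patch would walk off the end; back up to one patch from the end
            next_start = length - patch
        starts.append(next_start)
    return starts

print(patch_starts_1d(15, 10, 10))  # [0, 5], matching the docstring's example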
@@ -180,12 +182,12 @@ def patch_info_to_patch_name(image_name,patch_x_min,patch_y_min):
    """
    Gives a unique string name to an x/y coordinate, e.g. turns ("a.jpg",10,20) into
    "a.jpg_0010_0020".
-
+
    Args:
        image_name (str): image identifier
        patch_x_min (int): x coordinate
        patch_y_min (int): y coordinate
-
+
    Returns:
        str: name for this patch, e.g. "a.jpg_0010_0020"
    """
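The naming convention documented here is plain zero-padded string formatting; a hypothetical one-liner reproducing the documented example (the package's actual format string may differ):

image_name, x, y = 'a.jpg', 10, 20
print('{}_{:04d}_{:04d}'.format(image_name, x, y))  # a.jpg_0010_0020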
@@ -203,13 +205,13 @@ def extract_patch_from_image(im,
                             overwrite=True):
    """
    Extracts a patch from the provided image, and writes that patch out to a new file.
-
+
    Args:
        im (str or Image): image from which we should extract a patch, can be a filename or
            a PIL Image object.
-       patch_xy (tuple): length-2 tuple of ints (x,y) representing the upper-left corner
+       patch_xy (tuple): length-2 tuple of ints (x,y) representing the upper-left corner
            of the patch to extract
-       patch_size (tuple): length-2 tuple of ints (w,h) representing the size of the
+       patch_size (tuple): length-2 tuple of ints (w,h) representing the size of the
            patch to extract
        patch_image_fn (str, optional): image filename to write the patch to; if this is None
            the filename will be generated from [image_name] and the patch coordinates
@@ -218,16 +220,16 @@ def extract_patch_from_image(im,
        image_name (str, optional): the identifier of the source image; only used to generate
            a patch filename, so only required if [patch_image_fn] is None
        overwrite (bool, optional): whether to overwrite an existing patch image
-
+
    Returns:
        dict: a dictionary with fields xmin,xmax,ymin,ymax,patch_fn
    """
-
+
    if isinstance(im,str):
        pil_im = vis_utils.open_image(im)
    else:
        pil_im = im
-
+
    patch_x_min = patch_xy[0]
    patch_y_min = patch_xy[1]
    patch_x_max = patch_x_min + patch_size[0] - 1
@@ -249,19 +251,19 @@ def extract_patch_from_image(im,
            "If you don't supply a patch filename to extract_patch_from_image, you need to supply a folder name"
        patch_name = patch_info_to_patch_name(image_name,patch_x_min,patch_y_min)
        patch_image_fn = os.path.join(patch_folder,patch_name + '.jpg')
-
+
    if os.path.isfile(patch_image_fn) and (not overwrite):
        pass
-   else:
+   else:
        patch_im.save(patch_image_fn,quality=patch_jpeg_quality)
-
+
    patch_info = {}
    patch_info['xmin'] = patch_x_min
    patch_info['xmax'] = patch_x_max
    patch_info['ymin'] = patch_y_min
    patch_info['ymax'] = patch_y_max
    patch_info['patch_fn'] = patch_image_fn
-
+
    return patch_info
 
 # ...def extract_patch_from_image(...)
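The body of extract_patch_from_image between these hunks is not shown in the diff. Based on the inclusive xmin/xmax coordinates visible above, the crop presumably looks like the following sketch; this is an assumption, not a quote from the package (note that PIL's Image.crop() takes an exclusive right/bottom edge):

from PIL import Image

def crop_patch(pil_im, patch_x_min, patch_y_min, patch_size):
    # Inclusive max coordinates, as computed in the hunks above
    patch_x_max = patch_x_min + patch_size[0] - 1
    patch_y_max = patch_y_min + patch_size[1] - 1
    # Image.crop() excludes the right/bottom edge, hence the +1
    return pil_im.crop((patch_x_min, patch_y_min, patch_x_max + 1, patch_y_max + 1))

# e.g.: crop_patch(Image.open('some_image.jpg'), 0, 0, (1280, 1280))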
@@ -270,33 +272,33 @@ def extract_patch_from_image(im,
 def in_place_nms(md_results, iou_thres=0.45, verbose=True):
    """
    Run torch.ops.nms in-place on MD-formatted detection results.
-
+
    Args:
-       md_results (dict): detection results for a list of images, in MD results format (i.e.,
+       md_results (dict): detection results for a list of images, in MD results format (i.e.,
            containing a list of image dicts with the key 'images', each of which has a list
            of detections with the key 'detections')
        iou_thres (float, optional): IoU threshold above which we will treat two detections as
            redundant
        verbose (bool, optional): enable additional debug console output
    """
-
+
    n_detections_before = 0
    n_detections_after = 0
-
+
    # i_image = 18; im = md_results['images'][i_image]
    for i_image,im in tqdm(enumerate(md_results['images']),total=len(md_results['images'])):
-
+
        if (im['detections'] is None) or (len(im['detections']) == 0):
            continue
-
+
        boxes = []
        scores = []
-
+
        n_detections_before += len(im['detections'])
-
+
        # det = im['detections'][0]
        for det in im['detections']:
-
+
            # Using x1/x2 notation rather than x0/x1 notation to be consistent
            # with the Torch documentation.
            x1 = det['bbox'][0]
@@ -308,86 +310,86 @@ def in_place_nms(md_results, iou_thres=0.45, verbose=True):
            scores.append(det['conf'])
 
        # ...for each detection
-
+
        t_boxes = torch.tensor(boxes)
        t_scores = torch.tensor(scores)
-
+
        box_indices = ops.nms(t_boxes,t_scores,iou_thres).tolist()
-
+
        post_nms_detections = [im['detections'][x] for x in box_indices]
-
+
        assert len(post_nms_detections) <= len(im['detections'])
-
+
        im['detections'] = post_nms_detections
-
+
        n_detections_after += len(im['detections'])
-
+
    # ...for each image
-
+
    if verbose:
        print('NMS removed {} of {} detections'.format(
            n_detections_before-n_detections_after,
            n_detections_before))
-
+
 # ...in_place_nms()
 
 
 def _extract_tiles_for_image(fn_relative,image_folder,tiling_folder,patch_size,patch_stride,overwrite):
    """
    Private function to extract tiles for a single image.
-
+
    Returns a dict with fields 'patches' (see extract_patch_from_image) and 'image_fn'.
-
+
    If there is an error, 'patches' will be None and the 'error' field will contain
    failure details. In that case, some tiles may still be generated.
    """
-
+
    fn_abs = os.path.join(image_folder,fn_relative)
    error = None
-   patches = []
-
+   patches = []
+
    image_name = path_utils.clean_filename(fn_relative,char_limit=None,force_lower=True)
-
+
    try:
-
+
        # Open the image
        im = vis_utils.open_image(fn_abs)
        image_size = [im.width,im.height]
-
+
        # Generate patch boundaries (a list of [x,y] starting points)
-       patch_boundaries = get_patch_boundaries(image_size,patch_size,patch_stride)
-
+       patch_boundaries = get_patch_boundaries(image_size,patch_size,patch_stride)
+
        # Extract patches
        #
-       # patch_xy = patch_boundaries[0]
+       # patch_xy = patch_boundaries[0]
        for patch_xy in patch_boundaries:
-
+
            patch_info = extract_patch_from_image(im,patch_xy,patch_size,
                                                  patch_folder=tiling_folder,
                                                  image_name=image_name,
                                                  overwrite=overwrite)
            patch_info['source_fn'] = fn_relative
            patches.append(patch_info)
-
+
    except Exception as e:
-
+
        s = 'Patch generation error for {}: \n{}'.format(fn_relative,str(e))
        print(s)
        # patches = None
        error = s
-
+
    image_patch_info = {}
    image_patch_info['patches'] = patches
    image_patch_info['image_fn'] = fn_relative
    image_patch_info['error'] = error
-
+
    return image_patch_info
-
-
+
+
 #%% Main function
-
-def run_tiled_inference(model_file,
-                        image_folder,
+
+def run_tiled_inference(model_file,
+                        image_folder,
                         tiling_folder,
                         output_file,
                         tile_size_x=1280,
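in_place_nms (in the hunk above) delegates the actual suppression to torchvision. For reference, a standalone sketch of that step, using the same ops.nms call with (x1,y1,x2,y2) boxes and per-box scores; the sample values here are illustrative only:

import torch
from torchvision import ops

boxes = torch.tensor([[0.10, 0.10, 0.50, 0.50],
                      [0.12, 0.11, 0.52, 0.49],   # near-duplicate of box 0
                      [0.60, 0.60, 0.90, 0.90]])
scores = torch.tensor([0.90, 0.80, 0.70])

# nms() returns the indices of the boxes to keep, ordered by decreasing score
keep = ops.nms(boxes, scores, 0.45).tolist()
print(keep)  # [0, 2]: the lower-scoring near-duplicate is suppressed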
@@ -395,7 +397,7 @@ def run_tiled_inference(model_file,
                        tile_overlap=0.5,
                        checkpoint_path=None,
                        checkpoint_frequency=-1,
-                       remove_tiles=False,
+                       remove_tiles=False,
                        yolo_inference_options=None,
                        n_patch_extraction_workers=default_n_patch_extraction_workers,
                        overwrite_tiles=True,
@@ -406,26 +408,26 @@ def run_tiled_inference(model_file,
                        preprocess_on_image_queue=True,
                        inference_size=None):
    """
-   Runs inference using [model_file] on the images in [image_folder], first splitting each image up
+   Runs inference using [model_file] on the images in [image_folder], first splitting each image up
    into tiles of size [tile_size_x] x [tile_size_y], writing those tiles to [tiling_folder],
-   then de-duplicating the results before merging them back into a set of detections that make
-   sense on the original images and writing those results to [output_file].
-
+   then de-duplicating the results before merging them back into a set of detections that make
+   sense on the original images and writing those results to [output_file].
+
    [tiling_folder] can be any folder, but this function reserves the right to do whatever it wants
-   within that folder, including deleting everything, so it's best if it's a new folder.
+   within that folder, including deleting everything, so it's best if it's a new folder.
    Conceptually this folder is temporary, it's just helpful in this case to not actually
-   use the system temp folder, because the tile cache may be very large, so the caller may
-   want it to be on a specific drive. If this is None, a new folder will be created in
+   use the system temp folder, because the tile cache may be very large, so the caller may
+   want it to be on a specific drive. If this is None, a new folder will be created in
    system temp space.
-
+
    tile_overlap is the fraction of overlap between tiles.
-
+
    Optionally removes the temporary tiles.
-
-   if yolo_inference_options is supplied, it should be an instance of YoloInferenceOptions; in
-   this case the model will be run with run_inference_with_yolov5_val. This is typically used to
+
+   if yolo_inference_options is supplied, it should be an instance of YoloInferenceOptions; in
+   this case the model will be run with run_inference_with_yolov5_val. This is typically used to
    run the model with test-time augmentation.
-
+
    Args:
        model_file (str): model filename (ending in .pt), or a well-known model name (e.g. "MDV5A")
        image_folder (str): the folder of images to process (always recursive)
@@ -445,7 +447,8 @@ def run_tiled_inference(model_file,
            run_inference_with_yolov5_val.py, rather than with run_detector_batch.py, using these options
        n_patch_extraction_workers (int, optional): number of workers to use for patch extraction;
            set to <= 1 to disable parallelization
-
+       overwrite_tiles (bool, optional): whether to overwrite image files for individual tiles if they exist
+       image_list (list, optional): .json file containing a list of specific images to process. If
            this is supplied, and the paths are absolute, [image_folder] will be ignored. If this is supplied,
            and the paths are relative, they should be relative to [image_folder]
        augment (bool, optional): apply test-time augmentation, only relevant if yolo_inference_options
@@ -453,47 +456,47 @@ def run_tiled_inference(model_file,
        detector_options (dict, optional): parameters to pass to run_detector, only relevant if
            yolo_inference_options is None
        use_image_queue (bool, optional): whether to use a loader worker queue, only relevant if
-           yolo_inference_options is None
+           yolo_inference_options is None
        preprocess_on_image_queue (bool, optional): whether the image queue should also be responsible
            for preprocessing
        inference_size (int, optional): override the default inference image size, only relevant if
            yolo_inference_options is None
-
+
    Returns:
        dict: MD-formatted results dictionary, identical to what's written to [output_file]
    """
 
    ##%% Validate arguments
-
+
    assert tile_overlap < 1 and tile_overlap >= 0, \
        'Illegal tile overlap value {}'.format(tile_overlap)
-
+
    if tile_size_x == -1:
        tile_size_x = default_tile_size[0]
    if tile_size_y == -1:
        tile_size_y = default_tile_size[1]
-
+
    patch_size = [tile_size_x,tile_size_y]
    patch_stride = (round(patch_size[0]*(1.0-tile_overlap)),
                    round(patch_size[1]*(1.0-tile_overlap)))
-
+
    if tiling_folder is None:
        tiling_folder = \
            os.path.join(tempfile.gettempdir(), 'md-tiling', str(uuid.uuid1()))
        print('Creating temporary tiling folder: {}'.format(tiling_folder))
-
+
    os.makedirs(tiling_folder,exist_ok=True)
-
+
    ##%% List files
-
+
    if image_list is None:
-
+
        print('Enumerating images in {}'.format(image_folder))
-       image_files_relative = path_utils.find_images(image_folder, recursive=True, return_relative_paths=True)
+       image_files_relative = path_utils.find_images(image_folder, recursive=True, return_relative_paths=True)
        assert len(image_files_relative) > 0, 'No images found in folder {}'.format(image_folder)
-
+
    else:
-
+
        print('Loading image list from {}'.format(image_list))
        with open(image_list,'r') as f:
            image_files_relative = json.load(f)
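A worked example of the patch_stride computation in the hunk above: with the default 1280 x 1280 tiles and tile_overlap=0.5, adjacent tiles advance by half a tile.

tile_size_x, tile_size_y, tile_overlap = 1280, 1280, 0.5
patch_size = [tile_size_x, tile_size_y]
patch_stride = (round(patch_size[0] * (1.0 - tile_overlap)),
                round(patch_size[1] * (1.0 - tile_overlap)))
print(patch_stride)  # (640, 640): each tile overlaps its neighbor by 640 pixels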
@@ -514,107 +517,114 @@ def run_tiled_inference(model_file,
    if (n_absolute_paths != 0) and (n_absolute_paths != len(image_files_relative)):
        raise ValueError('Illegal file list: converted {} of {} paths to relative'.format(
            n_absolute_paths,len(image_files_relative)))
-
+
    ##%% Generate tiles
-
+
    all_image_patch_info = None
-
+
    print('Extracting patches from {} images'.format(len(image_files_relative)))
-
+
    n_workers = n_patch_extraction_workers
-
+
    if n_workers <= 1:
-
+
        all_image_patch_info = []
-
-       # fn_relative = image_files_relative[0]
-       for fn_relative in tqdm(image_files_relative):
+
+       # fn_relative = image_files_relative[0]
+       for fn_relative in tqdm(image_files_relative):
            image_patch_info = \
                _extract_tiles_for_image(fn_relative,image_folder,tiling_folder,patch_size,patch_stride,
                                         overwrite=overwrite_tiles)
            all_image_patch_info.append(image_patch_info)
-
+
    else:
-
+
        from multiprocessing.pool import ThreadPool
        from multiprocessing.pool import Pool
        from functools import partial
 
-       [22 removed lines (the previous pool-based extraction code) were not captured in this diff view]
+       pool = None
+       try:
+           if n_workers > len(image_files_relative):
+
+               print('Pool of {} requested, but only {} images available, reducing pool to {}'.\
+                     format(n_workers,len(image_files_relative),len(image_files_relative)))
+               n_workers = len(image_files_relative)
+
+           if parallelization_uses_threads:
+               pool = ThreadPool(n_workers); poolstring = 'threads'
+           else:
+               pool = Pool(n_workers); poolstring = 'processes'
+
+           print('Starting patch extraction pool with {} {}'.format(n_workers,poolstring))
+
+           all_image_patch_info = list(tqdm(pool.imap(
+               partial(_extract_tiles_for_image,
+                       image_folder=image_folder,
+                       tiling_folder=tiling_folder,
+                       patch_size=patch_size,
+                       patch_stride=patch_stride,
+                       overwrite=overwrite_tiles),
+               image_files_relative),total=len(image_files_relative)))
+       finally:
+           if pool is not None:
+               pool.close()
+               pool.join()
+               print("Pool closed and joined for patch extraction")
+
    # ...for each image
-
+
    # Write tile information to file; this is just a debugging convenience
    folder_name = path_utils.clean_filename(image_folder,force_lower=True)
    if folder_name.startswith('_'):
        folder_name = folder_name[1:]
-
+
    tile_cache_file = os.path.join(tiling_folder,folder_name + '_patch_info.json')
    with open(tile_cache_file,'w') as f:
        json.dump(all_image_patch_info,f,indent=1)
-
+
    # Keep track of patches that failed
    images_with_patch_errors = {}
    for patch_info in all_image_patch_info:
        if patch_info['error'] is not None:
            images_with_patch_errors[patch_info['image_fn']] = patch_info
-
-
+
+
    ##%% Run inference on the folder of tiles
-
+
    # When running with run_inference_with_yolov5_val, we'll pass the folder
    if yolo_inference_options is not None:
-
+
        patch_level_output_file = os.path.join(tiling_folder,folder_name + '_patch_level_results.json')
-
+
        if yolo_inference_options.model_filename is None:
            yolo_inference_options.model_filename = model_file
        else:
            assert yolo_inference_options.model_filename == model_file, \
                'Model file mismatch between yolo inference file ({}) and model file parameter ({})'.format(
                    yolo_inference_options.model_filename,model_file)
-
+
        yolo_inference_options.input_folder = tiling_folder
        yolo_inference_options.output_file = patch_level_output_file
-
+
        run_inference_with_yolo_val(yolo_inference_options)
        with open(patch_level_output_file,'r') as f:
            patch_level_results = json.load(f)
-
+
    # For standard inference, we'll pass a list of files
    else:
-
+
        patch_file_names = []
        for im in all_image_patch_info:
-           # If there was a patch generation error, don't run inference
+           # If there was a patch generation error, don't run inference
            if patch_info['error'] is not None:
                assert im['image_fn'] in images_with_patch_errors
                continue
            for patch in im['patches']:
                patch_file_names.append(patch['patch_fn'])
-
-       inference_results = load_and_run_detector_batch(model_file,
-                                                       patch_file_names,
+
+       inference_results = load_and_run_detector_batch(model_file,
+                                                       patch_file_names,
                                                        checkpoint_path=checkpoint_path,
                                                        checkpoint_frequency=checkpoint_frequency,
                                                        quiet=True,
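The main functional change in the hunk above is wrapping patch extraction in a worker pool that is always closed and joined, even if extraction raises. A minimal, hypothetical sketch of that pattern (not the package code):

from functools import partial
from multiprocessing.pool import ThreadPool
from tqdm import tqdm

def map_with_pool(worker_fn, items, n_workers, **fixed_kwargs):
    pool = None
    try:
        n_workers = min(n_workers, len(items))  # no point in idle workers
        pool = ThreadPool(n_workers)
        # partial() binds the fixed keyword arguments; each item becomes the
        # worker's first positional argument, as with _extract_tiles_for_image
        return list(tqdm(pool.imap(partial(worker_fn, **fixed_kwargs), items),
                         total=len(items)))
    finally:
        if pool is not None:
            pool.close()
            pool.join()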
@@ -623,18 +633,18 @@ def run_tiled_inference(model_file,
                                                        use_image_queue=use_image_queue,
                                                        preprocess_on_image_queue=preprocess_on_image_queue,
                                                        image_size=inference_size)
-
+
        patch_level_output_file = os.path.join(tiling_folder,folder_name + '_patch_level_results.json')
-
-       patch_level_results = write_results_to_file(inference_results,
-                                                   patch_level_output_file,
-                                                   relative_path_base=tiling_folder,
+
+       patch_level_results = write_results_to_file(inference_results,
+                                                   patch_level_output_file,
+                                                   relative_path_base=tiling_folder,
                                                    detector_file=model_file)
-
+
    # ...if we are/aren't using run_inference_with_yolov5_val
-
-   ##%% Map patch-level detections back to the original images
-
+
+   ##%% Map patch-level detections back to the original images
+
    # Map relative paths for patches to detections
    patch_fn_relative_to_results = {}
    for im in tqdm(patch_level_results['images']):
@@ -644,36 +654,36 @@ def run_tiled_inference(model_file,
    image_level_results['info'] = patch_level_results['info']
    image_level_results['detection_categories'] = patch_level_results['detection_categories']
    image_level_results['images'] = []
-
+
    image_fn_relative_to_patch_info = { x['image_fn']:x for x in all_image_patch_info }
-
+
    # i_image = 0; image_fn_relative = image_files_relative[i_image]
    for i_image,image_fn_relative in tqdm(enumerate(image_files_relative),
                                          total=len(image_files_relative)):
-
+
        image_fn_abs = os.path.join(image_folder,image_fn_relative)
        assert os.path.isfile(image_fn_abs)
-
+
        output_im = {}
        output_im['file'] = image_fn_relative
-
+
        # If we had a patch generation error
        if image_fn_relative in images_with_patch_errors:
-
+
            patch_info = image_fn_relative_to_patch_info[image_fn_relative]
            assert patch_info['error'] is not None
-
+
            output_im['detections'] = None
            output_im['failure'] = 'Patch generation error'
            output_im['failure_details'] = patch_info['error']
            image_level_results['images'].append(output_im)
            continue
-
+
        try:
-           pil_im = vis_utils.open_image(image_fn_abs)
+           pil_im = vis_utils.open_image(image_fn_abs)
            image_w = pil_im.size[0]
            image_h = pil_im.size[1]
-
+
        # This would be a very unusual situation; we're reading back an image here that we already
        # (successfully) read once during patch generation.
        except Exception as e:
@@ -683,36 +693,36 @@ def run_tiled_inference(model_file,
            output_im['failure'] = 'Patch processing error'
            output_im['failure_details'] = str(e)
            image_level_results['images'].append(output_im)
-           continue
-
+           continue
+
        output_im['detections'] = []
-
+
        image_patch_info = image_fn_relative_to_patch_info[image_fn_relative]
        assert image_patch_info['patches'][0]['source_fn'] == image_fn_relative
-
+
        # Patches for this image
        patch_fn_abs_to_patch_info_this_image = {}
-
+
        for patch_info in image_patch_info['patches']:
            patch_fn_abs_to_patch_info_this_image[patch_info['patch_fn']] = patch_info
-
+
        # For each patch
        #
        # i_patch = 0; patch_fn_abs = list(patch_fn_abs_to_patch_info_this_image.keys())[i_patch]
        for i_patch,patch_fn_abs in enumerate(patch_fn_abs_to_patch_info_this_image.keys()):
-
+
            patch_fn_relative = os.path.relpath(patch_fn_abs,tiling_folder)
            patch_results = patch_fn_relative_to_results[patch_fn_relative]
            patch_info = patch_fn_abs_to_patch_info_this_image[patch_fn_abs]
-
+
            # patch_results['file'] is a relative path, and a subset of patch_info['patch_fn']
            assert patch_results['file'] in patch_info['patch_fn']
-
+
            patch_w = (patch_info['xmax'] - patch_info['xmin']) + 1
            patch_h = (patch_info['ymax'] - patch_info['ymin']) + 1
            assert patch_w == patch_size[0]
            assert patch_h == patch_size[1]
-
+
            # If there was an inference failure on one patch, report the image
            # as an inference failure
            if 'detections' not in patch_results:
@@ -720,16 +730,16 @@ def run_tiled_inference(model_file,
                output_im['detections'] = None
                output_im['failure'] = patch_results['failure']
                break
-
+
            # det = patch_results['detections'][0]
            for det in patch_results['detections']:
-
+
                bbox_patch_relative = det['bbox']
                xmin_patch_relative = bbox_patch_relative[0]
                ymin_patch_relative = bbox_patch_relative[1]
                w_patch_relative = bbox_patch_relative[2]
                h_patch_relative = bbox_patch_relative[3]
-
+
                # Convert from patch-relative normalized values to image-relative absolute values
                w_pixels = w_patch_relative * patch_w
                h_pixels = h_patch_relative * patch_h
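The conversion in this hunk and the next maps a patch-relative normalized box back onto the source image: scale to patch pixels, offset by the patch origin, then re-normalize by the image size. Consolidated into one hypothetical helper for clarity:

def patch_box_to_image_box(bbox, patch_xmin, patch_ymin,
                           patch_w, patch_h, image_w, image_h):
    x_rel, y_rel, w_rel, h_rel = bbox           # patch-relative, normalized
    xmin_pixels = patch_xmin + x_rel * patch_w  # offset by the patch origin
    ymin_pixels = patch_ymin + y_rel * patch_h
    return [xmin_pixels / image_w, ymin_pixels / image_h,
            (w_rel * patch_w) / image_w, (h_rel * patch_h) / image_h]

# A box at [0.5, 0.5, 0.25, 0.25] in a 1280x1280 patch whose upper-left corner
# sits at (640, 0) in a 2560x1920 image:
print(patch_box_to_image_box([0.5, 0.5, 0.25, 0.25], 640, 0, 1280, 1280, 2560, 1920))
# [0.5, 0.3333..., 0.125, 0.1666...]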
@@ -737,82 +747,82 @@ def run_tiled_inference(model_file,
                ymin_patch_pixels = ymin_patch_relative * patch_h
                xmin_image_pixels = patch_info['xmin'] + xmin_patch_pixels
                ymin_image_pixels = patch_info['ymin'] + ymin_patch_pixels
-
+
                # ...and now to image-relative normalized values
                w_image_normalized = w_pixels / image_w
                h_image_normalized = h_pixels / image_h
                xmin_image_normalized = xmin_image_pixels / image_w
                ymin_image_normalized = ymin_image_pixels / image_h
-
+
                bbox_image_normalized = [xmin_image_normalized,
                                         ymin_image_normalized,
                                         w_image_normalized,
                                         h_image_normalized]
-
-               bbox_image_normalized = round_float_array(bbox_image_normalized,
+
+               bbox_image_normalized = round_float_array(bbox_image_normalized,
                                                          precision=COORD_DIGITS)
                det['conf'] = round_float(det['conf'], precision=CONF_DIGITS)
-
+
                output_det = {}
                output_det['bbox'] = bbox_image_normalized
                output_det['conf'] = det['conf']
                output_det['category'] = det['category']
-
+
                output_im['detections'].append(output_det)
-
+
            # ...for each detection
-
+
        # ...for each patch
 
        image_level_results['images'].append(output_im)
-
-   # ...for each image
+
+   # ...for each image
 
    image_level_results_file_pre_nms = \
        os.path.join(tiling_folder,folder_name + '_image_level_results_pre_nms.json')
    with open(image_level_results_file_pre_nms,'w') as f:
        json.dump(image_level_results,f,indent=1)
-
+
 
    ##%% Run NMS
-
+
    in_place_nms(image_level_results,iou_thres=nms_iou_threshold)
 
-
+
    ##%% Write output file
-
+
    print('Saving image-level results (after NMS) to {}'.format(output_file))
-
+
    with open(output_file,'w') as f:
        json.dump(image_level_results,f,indent=1)
 
-
+
    ##%% Possibly remove tiles
-
+
    if remove_tiles:
-
+
        patch_file_names = []
        for im in all_image_patch_info:
            for patch in im['patches']:
                patch_file_names.append(patch['patch_fn'])
-
+
        for patch_fn_abs in patch_file_names:
            os.remove(patch_fn_abs)
-
-
+
+
    ##%% Return
-
+
    return image_level_results
 
 
 #%% Interactive driver
 
 if False:
-
+
    pass
 
    #%% Run tiled inference (in Python)
-
+
    model_file = os.path.expanduser('~/models/camera_traps/megadetector/md_v5.0.0/md_v5a.0.0.pt')
    image_folder = os.path.expanduser('~/data/KRU-test')
    tiling_folder = os.path.expanduser('~/tmp/tiling-test')
@@ -824,47 +834,47 @@ if False:
    checkpoint_path = None
    checkpoint_frequency = -1
    remove_tiles = False
-
+
    use_yolo_inference = False
-
+
    if not use_yolo_inference:
-
+
        yolo_inference_options = None
-
+
    else:
-
+
        yolo_inference_options = YoloInferenceOptions()
        yolo_inference_options.yolo_working_folder = os.path.expanduser('~/git/yolov5')
-
+
    run_tiled_inference(model_file, image_folder, tiling_folder, output_file,
-                       tile_size_x=tile_size_x, tile_size_y=tile_size_y,
+                       tile_size_x=tile_size_x, tile_size_y=tile_size_y,
                        tile_overlap=tile_overlap,
-                       checkpoint_path=checkpoint_path,
-                       checkpoint_frequency=checkpoint_frequency,
-                       remove_tiles=remove_tiles,
+                       checkpoint_path=checkpoint_path,
+                       checkpoint_frequency=checkpoint_frequency,
+                       remove_tiles=remove_tiles,
                        yolo_inference_options=yolo_inference_options)
-
-
+
+
    #%% Run tiled inference (generate a command)
-
+
    import os
-
+
    model_file = os.path.expanduser('~/models/camera_traps/megadetector/md_v5.0.0/md_v5a.0.0.pt')
    image_folder = os.path.expanduser('~/data/KRU-test')
    tiling_folder = os.path.expanduser('~/tmp/tiling-test')
    output_file = os.path.expanduser('~/tmp/KRU-test-tiled.json')
    tile_size = [5152,3968]
    tile_overlap = 0.8
-
+
    cmd = f'python run_tiled_inference.py {model_file} {image_folder} {tiling_folder} {output_file} ' + \
          f'--tile_overlap {tile_overlap} --no_remove_tiles --tile_size_x {tile_size[0]} --tile_size_y {tile_size[1]}'
-
+
    print(cmd)
    import clipboard; clipboard.copy(cmd)
-
-
+
+
    #%% Preview tiled inference
-
+
    from megadetector.postprocessing.postprocess_batch_results import \
        PostProcessingOptions, process_batch_results
 
@@ -893,14 +903,12 @@ if False:
    html_output_file = ppresults.output_html_file
 
    path_utils.open_file(html_output_file)
-
-
+
+
 #%% Command-line driver
 
-
+def main(): # noqa
 
-def main():
-
    parser = argparse.ArgumentParser(
        description='Chop a folder of images up into tiles, run MD on the tiles, and stitch the results together')
    parser.add_argument(
@@ -918,7 +926,7 @@ def main():
    parser.add_argument(
        '--no_remove_tiles',
        action='store_true',
-       help='Tiles are removed by default; this option suppresses tile deletion')
+       help='Tiles are removed by default; this option suppresses tile deletion')
    parser.add_argument(
        '--tile_size_x',
        type=int,
@@ -949,8 +957,8 @@ def main():
        type=str,
        default=None,
        help=('A list of detector options (key-value pairs) to '))
-
-   # detector_options = parse_kvp_list(args.detector_options)
+
+   # detector_options = parse_kvp_list(args.detector_options)
 
    if len(sys.argv[1:]) == 0:
        parser.print_help()
@@ -961,7 +969,7 @@ def main():
    model_file = try_download_known_detector(args.model_file)
    assert os.path.exists(model_file), \
        'detector file {} does not exist'.format(args.model_file)
-
+
    if os.path.exists(args.output_file):
        if args.overwrite_handling == 'skip':
            print('Warning: output file {} exists, skipping'.format(args.output_file))
@@ -972,15 +980,15 @@ def main():
            raise ValueError('Output file {} exists'.format(args.output_file))
        else:
            raise ValueError('Unknown output handling method {}'.format(args.overwrite_handling))
-
+
 
    remove_tiles = (not args.no_remove_tiles)
 
    run_tiled_inference(model_file, args.image_folder, args.tiling_folder, args.output_file,
-                       tile_size_x=args.tile_size_x, tile_size_y=args.tile_size_y,
+                       tile_size_x=args.tile_size_x, tile_size_y=args.tile_size_y,
                        tile_overlap=args.tile_overlap,
                        remove_tiles=remove_tiles,
                        image_list=args.image_list)
-
+
 if __name__ == '__main__':
    main()