megadetector 5.0.28__py3-none-any.whl → 10.0.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release: this version of megadetector has been flagged by the registry as possibly problematic.

Files changed (197)
  1. megadetector/api/batch_processing/integration/digiKam/xmp_integration.py +2 -2
  2. megadetector/api/batch_processing/integration/eMammal/test_scripts/push_annotations_to_emammal.py +1 -1
  3. megadetector/api/batch_processing/integration/eMammal/test_scripts/select_images_for_testing.py +1 -1
  4. megadetector/classification/aggregate_classifier_probs.py +3 -3
  5. megadetector/classification/analyze_failed_images.py +5 -5
  6. megadetector/classification/cache_batchapi_outputs.py +5 -5
  7. megadetector/classification/create_classification_dataset.py +11 -12
  8. megadetector/classification/crop_detections.py +10 -10
  9. megadetector/classification/csv_to_json.py +8 -8
  10. megadetector/classification/detect_and_crop.py +13 -15
  11. megadetector/classification/efficientnet/model.py +8 -8
  12. megadetector/classification/efficientnet/utils.py +6 -5
  13. megadetector/classification/evaluate_model.py +7 -7
  14. megadetector/classification/identify_mislabeled_candidates.py +6 -6
  15. megadetector/classification/json_to_azcopy_list.py +1 -1
  16. megadetector/classification/json_validator.py +29 -32
  17. megadetector/classification/map_classification_categories.py +9 -9
  18. megadetector/classification/merge_classification_detection_output.py +12 -9
  19. megadetector/classification/prepare_classification_script.py +19 -19
  20. megadetector/classification/prepare_classification_script_mc.py +26 -26
  21. megadetector/classification/run_classifier.py +4 -4
  22. megadetector/classification/save_mislabeled.py +6 -6
  23. megadetector/classification/train_classifier.py +1 -1
  24. megadetector/classification/train_classifier_tf.py +9 -9
  25. megadetector/classification/train_utils.py +10 -10
  26. megadetector/data_management/annotations/annotation_constants.py +1 -2
  27. megadetector/data_management/camtrap_dp_to_coco.py +79 -46
  28. megadetector/data_management/cct_json_utils.py +103 -103
  29. megadetector/data_management/cct_to_md.py +49 -49
  30. megadetector/data_management/cct_to_wi.py +33 -33
  31. megadetector/data_management/coco_to_labelme.py +75 -75
  32. megadetector/data_management/coco_to_yolo.py +210 -193
  33. megadetector/data_management/databases/add_width_and_height_to_db.py +86 -12
  34. megadetector/data_management/databases/combine_coco_camera_traps_files.py +40 -40
  35. megadetector/data_management/databases/integrity_check_json_db.py +228 -200
  36. megadetector/data_management/databases/subset_json_db.py +33 -33
  37. megadetector/data_management/generate_crops_from_cct.py +88 -39
  38. megadetector/data_management/get_image_sizes.py +54 -49
  39. megadetector/data_management/labelme_to_coco.py +133 -125
  40. megadetector/data_management/labelme_to_yolo.py +159 -73
  41. megadetector/data_management/lila/create_lila_blank_set.py +81 -83
  42. megadetector/data_management/lila/create_lila_test_set.py +32 -31
  43. megadetector/data_management/lila/create_links_to_md_results_files.py +18 -18
  44. megadetector/data_management/lila/download_lila_subset.py +21 -24
  45. megadetector/data_management/lila/generate_lila_per_image_labels.py +365 -107
  46. megadetector/data_management/lila/get_lila_annotation_counts.py +35 -33
  47. megadetector/data_management/lila/get_lila_image_counts.py +22 -22
  48. megadetector/data_management/lila/lila_common.py +73 -70
  49. megadetector/data_management/lila/test_lila_metadata_urls.py +28 -19
  50. megadetector/data_management/mewc_to_md.py +344 -340
  51. megadetector/data_management/ocr_tools.py +262 -255
  52. megadetector/data_management/read_exif.py +249 -227
  53. megadetector/data_management/remap_coco_categories.py +90 -28
  54. megadetector/data_management/remove_exif.py +81 -21
  55. megadetector/data_management/rename_images.py +187 -187
  56. megadetector/data_management/resize_coco_dataset.py +588 -120
  57. megadetector/data_management/speciesnet_to_md.py +41 -41
  58. megadetector/data_management/wi_download_csv_to_coco.py +55 -55
  59. megadetector/data_management/yolo_output_to_md_output.py +248 -122
  60. megadetector/data_management/yolo_to_coco.py +333 -191
  61. megadetector/detection/change_detection.py +832 -0
  62. megadetector/detection/process_video.py +340 -337
  63. megadetector/detection/pytorch_detector.py +358 -278
  64. megadetector/detection/run_detector.py +399 -186
  65. megadetector/detection/run_detector_batch.py +404 -377
  66. megadetector/detection/run_inference_with_yolov5_val.py +340 -327
  67. megadetector/detection/run_tiled_inference.py +257 -249
  68. megadetector/detection/tf_detector.py +24 -24
  69. megadetector/detection/video_utils.py +332 -295
  70. megadetector/postprocessing/add_max_conf.py +19 -11
  71. megadetector/postprocessing/categorize_detections_by_size.py +45 -45
  72. megadetector/postprocessing/classification_postprocessing.py +468 -433
  73. megadetector/postprocessing/combine_batch_outputs.py +23 -23
  74. megadetector/postprocessing/compare_batch_results.py +590 -525
  75. megadetector/postprocessing/convert_output_format.py +106 -102
  76. megadetector/postprocessing/create_crop_folder.py +347 -147
  77. megadetector/postprocessing/detector_calibration.py +173 -168
  78. megadetector/postprocessing/generate_csv_report.py +508 -499
  79. megadetector/postprocessing/load_api_results.py +48 -27
  80. megadetector/postprocessing/md_to_coco.py +133 -102
  81. megadetector/postprocessing/md_to_labelme.py +107 -90
  82. megadetector/postprocessing/md_to_wi.py +40 -40
  83. megadetector/postprocessing/merge_detections.py +92 -114
  84. megadetector/postprocessing/postprocess_batch_results.py +319 -301
  85. megadetector/postprocessing/remap_detection_categories.py +91 -38
  86. megadetector/postprocessing/render_detection_confusion_matrix.py +214 -205
  87. megadetector/postprocessing/repeat_detection_elimination/find_repeat_detections.py +57 -57
  88. megadetector/postprocessing/repeat_detection_elimination/remove_repeat_detections.py +27 -28
  89. megadetector/postprocessing/repeat_detection_elimination/repeat_detections_core.py +704 -679
  90. megadetector/postprocessing/separate_detections_into_folders.py +226 -211
  91. megadetector/postprocessing/subset_json_detector_output.py +265 -262
  92. megadetector/postprocessing/top_folders_to_bottom.py +45 -45
  93. megadetector/postprocessing/validate_batch_results.py +70 -70
  94. megadetector/taxonomy_mapping/map_lila_taxonomy_to_wi_taxonomy.py +52 -52
  95. megadetector/taxonomy_mapping/map_new_lila_datasets.py +18 -19
  96. megadetector/taxonomy_mapping/prepare_lila_taxonomy_release.py +54 -33
  97. megadetector/taxonomy_mapping/preview_lila_taxonomy.py +67 -67
  98. megadetector/taxonomy_mapping/retrieve_sample_image.py +16 -16
  99. megadetector/taxonomy_mapping/simple_image_download.py +8 -8
  100. megadetector/taxonomy_mapping/species_lookup.py +156 -74
  101. megadetector/taxonomy_mapping/taxonomy_csv_checker.py +14 -14
  102. megadetector/taxonomy_mapping/taxonomy_graph.py +10 -10
  103. megadetector/taxonomy_mapping/validate_lila_category_mappings.py +13 -13
  104. megadetector/utils/ct_utils.py +1049 -211
  105. megadetector/utils/directory_listing.py +21 -77
  106. megadetector/utils/gpu_test.py +22 -22
  107. megadetector/utils/md_tests.py +632 -529
  108. megadetector/utils/path_utils.py +1520 -431
  109. megadetector/utils/process_utils.py +41 -41
  110. megadetector/utils/split_locations_into_train_val.py +62 -62
  111. megadetector/utils/string_utils.py +148 -27
  112. megadetector/utils/url_utils.py +489 -176
  113. megadetector/utils/wi_utils.py +2658 -2526
  114. megadetector/utils/write_html_image_list.py +137 -137
  115. megadetector/visualization/plot_utils.py +34 -30
  116. megadetector/visualization/render_images_with_thumbnails.py +39 -74
  117. megadetector/visualization/visualization_utils.py +487 -435
  118. megadetector/visualization/visualize_db.py +232 -198
  119. megadetector/visualization/visualize_detector_output.py +82 -76
  120. {megadetector-5.0.28.dist-info → megadetector-10.0.0.dist-info}/METADATA +5 -2
  121. megadetector-10.0.0.dist-info/RECORD +139 -0
  122. {megadetector-5.0.28.dist-info → megadetector-10.0.0.dist-info}/WHEEL +1 -1
  123. megadetector/api/batch_processing/api_core/__init__.py +0 -0
  124. megadetector/api/batch_processing/api_core/batch_service/__init__.py +0 -0
  125. megadetector/api/batch_processing/api_core/batch_service/score.py +0 -439
  126. megadetector/api/batch_processing/api_core/server.py +0 -294
  127. megadetector/api/batch_processing/api_core/server_api_config.py +0 -97
  128. megadetector/api/batch_processing/api_core/server_app_config.py +0 -55
  129. megadetector/api/batch_processing/api_core/server_batch_job_manager.py +0 -220
  130. megadetector/api/batch_processing/api_core/server_job_status_table.py +0 -149
  131. megadetector/api/batch_processing/api_core/server_orchestration.py +0 -360
  132. megadetector/api/batch_processing/api_core/server_utils.py +0 -88
  133. megadetector/api/batch_processing/api_core_support/__init__.py +0 -0
  134. megadetector/api/batch_processing/api_core_support/aggregate_results_manually.py +0 -46
  135. megadetector/api/batch_processing/api_support/__init__.py +0 -0
  136. megadetector/api/batch_processing/api_support/summarize_daily_activity.py +0 -152
  137. megadetector/api/batch_processing/data_preparation/__init__.py +0 -0
  138. megadetector/api/synchronous/__init__.py +0 -0
  139. megadetector/api/synchronous/api_core/animal_detection_api/__init__.py +0 -0
  140. megadetector/api/synchronous/api_core/animal_detection_api/api_backend.py +0 -151
  141. megadetector/api/synchronous/api_core/animal_detection_api/api_frontend.py +0 -263
  142. megadetector/api/synchronous/api_core/animal_detection_api/config.py +0 -35
  143. megadetector/api/synchronous/api_core/tests/__init__.py +0 -0
  144. megadetector/api/synchronous/api_core/tests/load_test.py +0 -110
  145. megadetector/data_management/importers/add_nacti_sizes.py +0 -52
  146. megadetector/data_management/importers/add_timestamps_to_icct.py +0 -79
  147. megadetector/data_management/importers/animl_results_to_md_results.py +0 -158
  148. megadetector/data_management/importers/auckland_doc_test_to_json.py +0 -373
  149. megadetector/data_management/importers/auckland_doc_to_json.py +0 -201
  150. megadetector/data_management/importers/awc_to_json.py +0 -191
  151. megadetector/data_management/importers/bellevue_to_json.py +0 -272
  152. megadetector/data_management/importers/cacophony-thermal-importer.py +0 -793
  153. megadetector/data_management/importers/carrizo_shrubfree_2018.py +0 -269
  154. megadetector/data_management/importers/carrizo_trail_cam_2017.py +0 -289
  155. megadetector/data_management/importers/cct_field_adjustments.py +0 -58
  156. megadetector/data_management/importers/channel_islands_to_cct.py +0 -913
  157. megadetector/data_management/importers/eMammal/copy_and_unzip_emammal.py +0 -180
  158. megadetector/data_management/importers/eMammal/eMammal_helpers.py +0 -249
  159. megadetector/data_management/importers/eMammal/make_eMammal_json.py +0 -223
  160. megadetector/data_management/importers/ena24_to_json.py +0 -276
  161. megadetector/data_management/importers/filenames_to_json.py +0 -386
  162. megadetector/data_management/importers/helena_to_cct.py +0 -283
  163. megadetector/data_management/importers/idaho-camera-traps.py +0 -1407
  164. megadetector/data_management/importers/idfg_iwildcam_lila_prep.py +0 -294
  165. megadetector/data_management/importers/import_desert_lion_conservation_camera_traps.py +0 -387
  166. megadetector/data_management/importers/jb_csv_to_json.py +0 -150
  167. megadetector/data_management/importers/mcgill_to_json.py +0 -250
  168. megadetector/data_management/importers/missouri_to_json.py +0 -490
  169. megadetector/data_management/importers/nacti_fieldname_adjustments.py +0 -79
  170. megadetector/data_management/importers/noaa_seals_2019.py +0 -181
  171. megadetector/data_management/importers/osu-small-animals-to-json.py +0 -364
  172. megadetector/data_management/importers/pc_to_json.py +0 -365
  173. megadetector/data_management/importers/plot_wni_giraffes.py +0 -123
  174. megadetector/data_management/importers/prepare_zsl_imerit.py +0 -131
  175. megadetector/data_management/importers/raic_csv_to_md_results.py +0 -416
  176. megadetector/data_management/importers/rspb_to_json.py +0 -356
  177. megadetector/data_management/importers/save_the_elephants_survey_A.py +0 -320
  178. megadetector/data_management/importers/save_the_elephants_survey_B.py +0 -329
  179. megadetector/data_management/importers/snapshot_safari_importer.py +0 -758
  180. megadetector/data_management/importers/snapshot_serengeti_lila.py +0 -1067
  181. megadetector/data_management/importers/snapshotserengeti/make_full_SS_json.py +0 -150
  182. megadetector/data_management/importers/snapshotserengeti/make_per_season_SS_json.py +0 -153
  183. megadetector/data_management/importers/sulross_get_exif.py +0 -65
  184. megadetector/data_management/importers/timelapse_csv_set_to_json.py +0 -490
  185. megadetector/data_management/importers/ubc_to_json.py +0 -399
  186. megadetector/data_management/importers/umn_to_json.py +0 -507
  187. megadetector/data_management/importers/wellington_to_json.py +0 -263
  188. megadetector/data_management/importers/wi_to_json.py +0 -442
  189. megadetector/data_management/importers/zamba_results_to_md_results.py +0 -180
  190. megadetector/data_management/lila/add_locations_to_island_camera_traps.py +0 -101
  191. megadetector/data_management/lila/add_locations_to_nacti.py +0 -151
  192. megadetector/utils/azure_utils.py +0 -178
  193. megadetector/utils/sas_blob_utils.py +0 -509
  194. megadetector-5.0.28.dist-info/RECORD +0 -209
  195. /megadetector/{api/batch_processing/__init__.py → __init__.py} +0 -0
  196. {megadetector-5.0.28.dist-info → megadetector-10.0.0.dist-info}/licenses/LICENSE +0 -0
  197. {megadetector-5.0.28.dist-info → megadetector-10.0.0.dist-info}/top_level.txt +0 -0
megadetector/data_management/databases/subset_json_db.py

@@ -2,14 +2,14 @@
 
 subset_json_db.py
 
-Select a subset of images (and associated annotations) from a .json file in COCO
+Select a subset of images (and associated annotations) from a .json file in COCO
 Camera Traps format based on a string query.
 
 To subset .json files in the MegaDetector output format, see
 subset_json_detector_output.py.
 
 """
-
+
 #%% Constants and imports
 
 import os
@@ -18,6 +18,7 @@ import json
 import argparse
 
 from tqdm import tqdm
+from megadetector.utils import ct_utils
 from copy import copy
 
 
@@ -25,22 +26,22 @@ from copy import copy
 
 def subset_json_db(input_json, query, output_json=None, ignore_case=False, verbose=False):
     """
-    Given a json file (or dictionary already loaded from a json file), produce a new
-    database containing only the images whose filenames contain the string 'query',
+    Given a json file (or dictionary already loaded from a json file), produce a new
+    database containing only the images whose filenames contain the string 'query',
     optionally writing that DB output to a new json file.
-
+
     Args:
         input_json (str): COCO Camera Traps .json file to load, or an already-loaded dict
-        query (str or list): string to query for, only include images in the output whose filenames
+        query (str or list): string to query for, only include images in the output whose filenames
             contain this string. If this is a list, test for exact matches.
         output_json (str, optional): file to write the resulting .json file to
         ignore_case (bool, optional): whether to perform a case-insensitive search for [query]
         verbose (bool, optional): enable additional debug output
-
+
     Returns:
         dict: CCT dictionary containing a subset of the images and annotations in the input dict
     """
-
+
     # Load the input file if necessary
     if isinstance(input_json,str):
         print('Loading input .json...')
@@ -51,26 +52,26 @@ def subset_json_db(input_json, query, output_json=None, ignore_case=False, verbo
 
     # Find images matching the query
     images = []
-
+
     if isinstance(query,str):
-
+
         if ignore_case:
             query = query.lower()
-
+
         for im in tqdm(input_data['images']):
             fn = im['file_name']
             if ignore_case:
                 fn = fn.lower()
             if query in fn:
                 images.append(im)
-
+
     else:
-
+
         query = set(query)
-
+
         if ignore_case:
             query = set([s.lower() for s in query])
-
+
         for im in input_data['images']:
             fn = im['file_name']
             if ignore_case:
@@ -79,27 +80,26 @@ def subset_json_db(input_json, query, output_json=None, ignore_case=False, verbo
                 images.append(im)
 
     image_ids = set([im['id'] for im in images])
-
+
     # Find annotations referring to those images
     annotations = []
-
+
     for ann in input_data['annotations']:
         if ann['image_id'] in image_ids:
             annotations.append(ann)
-
+
     output_data = copy(input_data)
     output_data['images'] = images
     output_data['annotations'] = annotations
-
+
     # Write the output file if requested
     if output_json is not None:
         if verbose:
             print('Writing output .json to {}'.format(output_json))
         output_dir = os.path.dirname(output_json)
         os.makedirs(output_dir,exist_ok=True)
-        with open(output_json,'w') as f:
-            json.dump(output_data,f,indent=1)
-
+        ct_utils.write_json(output_json, output_data)
+
     if verbose:
         print('Keeping {} of {} images, {} of {} annotations'.format(
             len(output_data['images']),len(input_data['images']),
@@ -111,33 +111,33 @@ def subset_json_db(input_json, query, output_json=None, ignore_case=False, verbo
 #%% Interactive driver
 
 if False:
-
+
     #%%
-
+
     input_json = r"e:\Statewide_wolf_container\idfg_20190409.json"
     output_json = r"e:\Statewide_wolf_container\idfg_20190409_clearcreek.json"
     query = 'clearcreek'
     ignore_case = True
     db = subset_json_db(input_json, query, output_json, ignore_case)
-
+
 
 #%% Command-line driver
 
-def main():
-
+def main(): # noqa
+
     parser = argparse.ArgumentParser()
     parser.add_argument('input_json', type=str, help='Input file (a COCO Camera Traps .json file)')
-    parser.add_argument('output_json', type=str, help='Output file')
-    parser.add_argument('query', type=str, help='Filename query')
+    parser.add_argument('output_json', type=str, help='Output file')
+    parser.add_argument('query', type=str, help='Filename query')
     parser.add_argument('--ignore_case', action='store_true')
-
+
     if len(sys.argv[1:]) == 0:
         parser.print_help()
         parser.exit()
 
-    args = parser.parse_args()
-
+    args = parser.parse_args()
+
     subset_json_db(args.input_json,args.query,args.output_json,args.ignore_case)
 
-if __name__ == '__main__':
+if __name__ == '__main__':
     main()
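The subset_json_db.py diff above is mostly whitespace cleanup (most of the paired removals and additions appear to differ only in trailing whitespace); the functional change is that the output file is now written via ct_utils.write_json rather than a direct json.dump call, with the public signature unchanged. A minimal usage sketch follows, assuming the module path shown in the file list; the file paths and query string are placeholders, not taken from the package:

from megadetector.data_management.databases.subset_json_db import subset_json_db

# Keep only images (and their annotations) whose filenames contain 'site_a',
# writing the subset to a new COCO Camera Traps .json file.
# 'all_images.json' and 'site_a.json' are placeholder paths.
subset = subset_json_db(input_json='all_images.json',
                        query='site_a',
                        output_json='site_a.json',
                        ignore_case=True)

print('Kept {} images and {} annotations'.format(
    len(subset['images']), len(subset['annotations'])))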
megadetector/data_management/generate_crops_from_cct.py

@@ -10,6 +10,7 @@ each bounding box.
 #%% Imports and constants
 
 import os
+import argparse
 import json
 
 from tqdm import tqdm
@@ -22,7 +23,7 @@ def generate_crops_from_cct(cct_file,image_dir,output_dir,padding=0,flat_output=
     """
     Given a .json file in COCO Camera Traps format, creates a cropped image for
     each bounding box.
-
+
     Args:
         cct_file (str): the COCO .json file from which we should load data
         image_dir (str): the folder where the images live; filenames in the .json
@@ -31,119 +32,167 @@ def generate_crops_from_cct(cct_file,image_dir,output_dir,padding=0,flat_output=
         padding (float, optional): number of pixels we should expand each box before
             cropping
         flat_output (bool, optional): if False, folder structure will be preserved
-            in the output, e.g. the image a/b/c/d.jpg will result in image files
+            in the output, e.g. the image a/b/c/d.jpg will result in image files
             in the output folder called, e.g., a/b/c/d_crop_000_id_12345.jpg. If
-            [flat_output] is True, the corresponding output image will be
-            a_b_c_d_crop_000_id_12345.jpg.
+            [flat_output] is True, the corresponding output image will be
+            a_b_c_d_crop_000_id_12345.jpg.
     """
-
+
     ## Read and validate input
-
+
     assert os.path.isfile(cct_file)
     assert os.path.isdir(image_dir)
     os.makedirs(output_dir,exist_ok=True)
 
     with open(cct_file,'r') as f:
         d = json.load(f)
-
-
+
+
     ## Find annotations for each image
-
+
     from collections import defaultdict
-
+
     # This actually maps image IDs to annotations, but only to annotations
     # containing boxes
     image_id_to_boxes = defaultdict(list)
-
+
     n_boxes = 0
-
+
     for ann in d['annotations']:
         if 'bbox' in ann:
             image_id_to_boxes[ann['image_id']].append(ann)
             n_boxes += 1
-
+
     print('Found {} boxes in {} annotations for {} images'.format(
         n_boxes,len(d['annotations']),len(d['images'])))
-
-
+
+
     ## Generate crops
-
+
     # im = d['images'][0]
     for im in tqdm(d['images']):
-
+
         input_image_fn = os.path.join(os.path.join(image_dir,im['file_name']))
         assert os.path.isfile(input_image_fn), 'Could not find image {}'.format(input_image_fn)
-
+
         if im['id'] not in image_id_to_boxes:
             continue
-
+
         annotations_this_image = image_id_to_boxes[im['id']]
-
+
         # Load the image
         img = Image.open(input_image_fn)
-
+
        # Generate crops
        # i_ann = 0; ann = annotations_this_image[i_ann]
        for i_ann,ann in enumerate(annotations_this_image):
-
+
            # x/y/w/h, origin at the upper-left
            bbox = ann['bbox']
-
+
            xmin = bbox[0]
            ymin = bbox[1]
            xmax = xmin + bbox[2]
            ymax = ymin + bbox[3]
-
+
            xmin -= padding / 2
            ymin -= padding / 2
            xmax += padding / 2
            ymax += padding / 2
-
+
            xmin = max(xmin,0)
            ymin = max(ymin,0)
            xmax = min(xmax,img.width-1)
            ymax = min(ymax,img.height-1)
-
+
            crop = img.crop(box=[xmin, ymin, xmax, ymax])
-
+
            output_fn = os.path.splitext(im['file_name'])[0].replace('\\','/')
            if flat_output:
                output_fn = output_fn.replace('/','_')
            output_fn = output_fn + '_crop' + str(i_ann).zfill(3) + '_id_' + ann['id']
            output_fn = output_fn + '.jpg'
-
+
            output_full_path = os.path.join(output_dir,output_fn)
-
+
            if not flat_output:
                os.makedirs(os.path.dirname(output_full_path),exist_ok=True)
-
+
            crop.save(output_full_path)
-
+
        # ...for each box
-
+
    # ...for each image
-
+
 # ...generate_crops_from_cct()
 
 
 #%% Interactive driver
 
 if False:
-
+
     pass
 
     #%%
-
+
     cct_file = os.path.expanduser('~/data/noaa/noaa_estuary_fish.json')
     image_dir = os.path.expanduser('~/data/noaa/JPEGImages')
     padding = 50
     flat_output = True
     output_dir = '/home/user/tmp/noaa-fish-crops'
-
+
     generate_crops_from_cct(cct_file,image_dir,output_dir,padding,flat_output=True)
     files = os.listdir(output_dir)
-
-
+
+
 #%% Command-line driver
 
-# TODO
+def main():
+    """
+    Command-line interface to generate crops from a COCO Camera Traps .json file.
+    """
+
+    parser = argparse.ArgumentParser(
+        description='Generate cropped images from a COCO Camera Traps .json file'
+    )
+    parser.add_argument(
+        'cct_file',
+        type=str,
+        help='COCO .json file to load data from'
+    )
+    parser.add_argument(
+        'image_dir',
+        type=str,
+        help='Folder where images are located'
+    )
+    parser.add_argument(
+        'output_dir',
+        type=str,
+        help='Folder to which we should write cropped images'
+    )
+    parser.add_argument(
+        '--padding',
+        type=int,
+        default=0,
+        help='Pixels to expand each box before cropping'
+    )
+    parser.add_argument(
+        '--flat_output',
+        action='store_true',
+        help='Flatten folder structure in output (preserves folder structure by default)'
+    )
+
+    args = parser.parse_args()
+
+    generate_crops_from_cct(
+        cct_file=args.cct_file,
+        image_dir=args.image_dir,
+        output_dir=args.output_dir,
+        padding=args.padding,
+        flat_output=args.flat_output
+    )
+
+    print(f'Generated crops in {args.output_dir}')
+
+if __name__ == '__main__':
+    main()
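The generate_crops_from_cct.py diff above replaces the "# TODO" command-line stub with a working argparse entry point; the changes inside the function itself appear to be limited to whitespace, plus the new argparse import. The equivalent call from Python is sketched below, assuming the module path shown in the file list; the paths and padding value are placeholders, not taken from the package:

from megadetector.data_management.generate_crops_from_cct import generate_crops_from_cct

# Crop every bounding box in a COCO Camera Traps .json file, expanding each box
# by 10 pixels and flattening the output folder structure.
# 'annotations.json', 'images/', and 'crops/' are placeholder paths.
generate_crops_from_cct(cct_file='annotations.json',
                        image_dir='images/',
                        output_dir='crops/',
                        padding=10,
                        flat_output=True)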
megadetector/data_management/get_image_sizes.py

@@ -2,7 +2,7 @@
 
 get_image_sizes.py
 
-Given a json-formatted list of image filenames, retrieves the width and height of
+Given a json-formatted list of image filenames, retrieves the width and height of
 every image, optionally writing the results to a new .json file.
 
 """
@@ -35,45 +35,45 @@ def _get_image_size(image_path,image_prefix=None):
     Support function to get the size of a single image. Returns a (path,w,h) tuple.
     w and h will be -1 if the image fails to load.
     """
-
+
     if image_prefix is not None:
         full_path = os.path.join(image_prefix,image_path)
     else:
         full_path = image_path
-
+
     # Is this image on disk?
     if not os.path.isfile(full_path):
         print('Could not find image {}'.format(full_path))
         return (image_path,-1,-1)
 
-    try:
+    try:
         pil_im = Image.open(full_path)
-        w = pil_im.width
+        w = pil_im.width
         h = pil_im.height
         return (image_path,w,h)
-    except Exception as e:
+    except Exception as e:
         print('Error reading image {}: {}'.format(full_path,str(e)))
         return (image_path,-1,-1)
-
-
+
+
 def get_image_sizes(filenames,image_prefix=None,output_file=None,
                     n_workers=default_n_threads,use_threads=True,
                     recursive=True):
     """
     Gets the width and height of all images in [filenames], which can be:
-
+
     * A .json-formatted file containing list of strings
     * A folder
     * A list of files
 
     ...returning a list of (path,w,h) tuples, and optionally writing the results to [output_file].
-
+
     Args:
-        filenames (str or list): the image filenames for which we should retrieve sizes,
-            can be the name of a .json-formatted file containing list of strings, a folder
+        filenames (str or list): the image filenames for which we should retrieve sizes,
+            can be the name of a .json-formatted file containing list of strings, a folder
            in which we should enumerate images, or a list of files.
        image_prefix (str, optional): optional prefix to add to images to get to full paths;
-            useful when [filenames] contains relative files, in which case [image_prefix] is the
+            useful when [filenames] contains relative files, in which case [image_prefix] is the
            base folder for the source images.
        output_file (str, optional): a .json file to write the imgae sizes
        n_workers (int, optional): number of parallel workers to use, set to <=1 to
@@ -82,57 +82,62 @@ def get_image_sizes(filenames,image_prefix=None,output_file=None,
             for parallelization; not relevant if [n_workers] <= 1
         recursive (bool, optional): only relevant if [filenames] is actually a folder,
             determines whether image enumeration within that folder will be recursive
-
+
     Returns:
         list: list of (path,w,h) tuples
-    """
-
+    """
+
     if output_file is not None:
         assert os.path.isdir(os.path.dirname(output_file)), \
             'Illegal output file {}, parent folder does not exist'.format(output_file)
-
+
     if isinstance(filenames,str) and os.path.isfile(filenames):
-        with open(filenames,'r') as f:
+        with open(filenames,'r') as f:
            filenames = json.load(f)
        filenames = [s.strip() for s in filenames]
    elif isinstance(filenames,str) and os.path.isdir(filenames):
        filenames = find_images(filenames,recursive=recursive,
                                return_relative_paths=False,convert_slashes=True)
    else:
-        assert isinstance(filenames,list)
-
+        assert isinstance(filenames,list)
+
    if n_workers <= 1:
-
+
        all_results = []
        for i_file,fn in tqdm(enumerate(filenames),total=len(filenames)):
            all_results.append(_get_image_size(fn,image_prefix=image_prefix))
-
+
    else:
-
+
        print('Creating a pool with {} workers'.format(n_workers))
        if use_threads:
-            pool = ThreadPool(n_workers)
+            pool = ThreadPool(n_workers)
        else:
            pool = Pool(n_workers)
        # all_results = list(tqdm(pool.imap(process_image, filenames), total=len(filenames)))
-        all_results = list(tqdm(pool.imap(
-            partial(_get_image_size,image_prefix=image_prefix), filenames), total=len(filenames)))
-
+        try:
+            all_results = list(tqdm(pool.imap(
+                partial(_get_image_size,image_prefix=image_prefix), filenames), total=len(filenames)))
+        finally:
+            pool.close()
+            pool.join()
+            print("Pool closed and joined for image size reads")
+
    if output_file is not None:
        with open(output_file,'w') as f:
            json.dump(all_results,f,indent=1)
-
+
    return all_results
 
-
+
 #%% Interactive driver
 
 if False:
 
-    pass
+    pass
 
     #%%
-
+
     # List images in a test folder
     base_dir = r'c:\temp\test_images'
     image_list_file = os.path.join(base_dir,'images.json')
@@ -140,50 +145,50 @@ if False:
     image_size_file = os.path.join(base_dir,'image_sizes.json')
     from megadetector.utils import path_utils
     image_names = path_utils.find_images(base_dir,recursive=True)
-
+
     with open(image_list_file,'w') as f:
         json.dump(image_names,f,indent=1)
-
+
     relative_image_names = []
     for s in image_names:
         relative_image_names.append(os.path.relpath(s,base_dir))
-
+
     with open(relative_image_list_file,'w') as f:
         json.dump(relative_image_names,f,indent=1)
-
-
+
+
     #%%
-
+
     get_image_sizes(relative_image_list_file,image_size_file,image_prefix=base_dir,n_threads=4)
-
-
+
+
 #%% Command-line driver
-
-def main():
-
+
+def main(): # noqa
+
     parser = argparse.ArgumentParser()
     parser.add_argument('filenames',type=str,
         help='Folder from which we should fetch image sizes, or .json file with a list of filenames')
     parser.add_argument('output_file',type=str,
         help='Output file (.json) to which we should write image size information')
     parser.add_argument('--image_prefix', type=str, default=None,
-        help='Prefix to append to image filenames, only relevant if [filenames] points to a list of ' + \
-            'relative paths')
+        help='Prefix to append to image filenames, only relevant if [filenames] points to a ' + \
+            'list of relative paths')
     parser.add_argument('--n_threads', type=int, default=default_n_threads,
         help='Number of concurrent workers, set to <=1 to disable parallelization (default {})'.format(
            default_n_threads))
-
+
    if len(sys.argv[1:])==0:
        parser.print_help()
        parser.exit()
-
+
    args = parser.parse_args()
-
+
    _ = get_image_sizes(filenames=args.filenames,
                        output_file=args.output_file,
                        image_prefix=args.image_prefix,
                        n_workers=args.n_threads)
-
+
 if __name__ == '__main__':
-
+
     main()
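The main functional change in the get_image_sizes.py diff is that the worker pool is now closed and joined in a finally block after the parallel size reads; the remaining hunks are whitespace and help-string cleanup. A usage sketch follows, assuming the module path shown in the file list; the folder and output paths are placeholders, not taken from the package:

from megadetector.data_management.get_image_sizes import get_image_sizes

# Retrieve (path, width, height) tuples for every image under a folder, using
# four worker threads, and write the results to a .json file.
# 'camera_trap_images/' and 'image_sizes.json' are placeholder paths.
sizes = get_image_sizes('camera_trap_images/',
                        output_file='image_sizes.json',
                        n_workers=4,
                        use_threads=True)

for path, w, h in sizes:
    if w < 0:
        print('Failed to read {}'.format(path))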