megadetector-5.0.27-py3-none-any.whl → megadetector-5.0.29-py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
- megadetector/api/batch_processing/api_core/batch_service/score.py +4 -5
- megadetector/api/batch_processing/api_core_support/aggregate_results_manually.py +1 -1
- megadetector/api/batch_processing/api_support/summarize_daily_activity.py +1 -1
- megadetector/api/batch_processing/integration/digiKam/xmp_integration.py +2 -2
- megadetector/api/batch_processing/integration/eMammal/test_scripts/push_annotations_to_emammal.py +1 -1
- megadetector/api/batch_processing/integration/eMammal/test_scripts/select_images_for_testing.py +1 -1
- megadetector/api/synchronous/api_core/tests/load_test.py +2 -3
- megadetector/classification/aggregate_classifier_probs.py +3 -3
- megadetector/classification/analyze_failed_images.py +5 -5
- megadetector/classification/cache_batchapi_outputs.py +5 -5
- megadetector/classification/create_classification_dataset.py +11 -12
- megadetector/classification/crop_detections.py +10 -10
- megadetector/classification/csv_to_json.py +8 -8
- megadetector/classification/detect_and_crop.py +13 -15
- megadetector/classification/evaluate_model.py +7 -7
- megadetector/classification/identify_mislabeled_candidates.py +6 -6
- megadetector/classification/json_to_azcopy_list.py +1 -1
- megadetector/classification/json_validator.py +29 -32
- megadetector/classification/map_classification_categories.py +9 -9
- megadetector/classification/merge_classification_detection_output.py +12 -9
- megadetector/classification/prepare_classification_script.py +19 -19
- megadetector/classification/prepare_classification_script_mc.py +23 -23
- megadetector/classification/run_classifier.py +4 -4
- megadetector/classification/save_mislabeled.py +6 -6
- megadetector/classification/train_classifier.py +1 -1
- megadetector/classification/train_classifier_tf.py +9 -9
- megadetector/classification/train_utils.py +10 -10
- megadetector/data_management/annotations/annotation_constants.py +1 -1
- megadetector/data_management/camtrap_dp_to_coco.py +45 -45
- megadetector/data_management/cct_json_utils.py +101 -101
- megadetector/data_management/cct_to_md.py +49 -49
- megadetector/data_management/cct_to_wi.py +33 -33
- megadetector/data_management/coco_to_labelme.py +75 -75
- megadetector/data_management/coco_to_yolo.py +189 -189
- megadetector/data_management/databases/add_width_and_height_to_db.py +3 -2
- megadetector/data_management/databases/combine_coco_camera_traps_files.py +38 -38
- megadetector/data_management/databases/integrity_check_json_db.py +202 -188
- megadetector/data_management/databases/subset_json_db.py +33 -33
- megadetector/data_management/generate_crops_from_cct.py +38 -38
- megadetector/data_management/get_image_sizes.py +54 -49
- megadetector/data_management/labelme_to_coco.py +130 -124
- megadetector/data_management/labelme_to_yolo.py +78 -72
- megadetector/data_management/lila/create_lila_blank_set.py +81 -83
- megadetector/data_management/lila/create_lila_test_set.py +32 -31
- megadetector/data_management/lila/create_links_to_md_results_files.py +18 -18
- megadetector/data_management/lila/download_lila_subset.py +21 -24
- megadetector/data_management/lila/generate_lila_per_image_labels.py +91 -91
- megadetector/data_management/lila/get_lila_annotation_counts.py +30 -30
- megadetector/data_management/lila/get_lila_image_counts.py +22 -22
- megadetector/data_management/lila/lila_common.py +70 -70
- megadetector/data_management/lila/test_lila_metadata_urls.py +13 -14
- megadetector/data_management/mewc_to_md.py +339 -340
- megadetector/data_management/ocr_tools.py +258 -252
- megadetector/data_management/read_exif.py +232 -223
- megadetector/data_management/remap_coco_categories.py +26 -26
- megadetector/data_management/remove_exif.py +31 -20
- megadetector/data_management/rename_images.py +187 -187
- megadetector/data_management/resize_coco_dataset.py +41 -41
- megadetector/data_management/speciesnet_to_md.py +41 -41
- megadetector/data_management/wi_download_csv_to_coco.py +55 -55
- megadetector/data_management/yolo_output_to_md_output.py +117 -120
- megadetector/data_management/yolo_to_coco.py +195 -188
- megadetector/detection/change_detection.py +831 -0
- megadetector/detection/process_video.py +341 -338
- megadetector/detection/pytorch_detector.py +308 -266
- megadetector/detection/run_detector.py +186 -166
- megadetector/detection/run_detector_batch.py +366 -364
- megadetector/detection/run_inference_with_yolov5_val.py +328 -325
- megadetector/detection/run_tiled_inference.py +312 -253
- megadetector/detection/tf_detector.py +24 -24
- megadetector/detection/video_utils.py +291 -283
- megadetector/postprocessing/add_max_conf.py +15 -11
- megadetector/postprocessing/categorize_detections_by_size.py +44 -44
- megadetector/postprocessing/classification_postprocessing.py +808 -311
- megadetector/postprocessing/combine_batch_outputs.py +20 -21
- megadetector/postprocessing/compare_batch_results.py +528 -517
- megadetector/postprocessing/convert_output_format.py +97 -97
- megadetector/postprocessing/create_crop_folder.py +220 -147
- megadetector/postprocessing/detector_calibration.py +173 -168
- megadetector/postprocessing/generate_csv_report.py +508 -0
- megadetector/postprocessing/load_api_results.py +25 -22
- megadetector/postprocessing/md_to_coco.py +129 -98
- megadetector/postprocessing/md_to_labelme.py +89 -83
- megadetector/postprocessing/md_to_wi.py +40 -40
- megadetector/postprocessing/merge_detections.py +87 -114
- megadetector/postprocessing/postprocess_batch_results.py +319 -302
- megadetector/postprocessing/remap_detection_categories.py +36 -36
- megadetector/postprocessing/render_detection_confusion_matrix.py +205 -199
- megadetector/postprocessing/repeat_detection_elimination/find_repeat_detections.py +57 -57
- megadetector/postprocessing/repeat_detection_elimination/remove_repeat_detections.py +27 -28
- megadetector/postprocessing/repeat_detection_elimination/repeat_detections_core.py +702 -677
- megadetector/postprocessing/separate_detections_into_folders.py +226 -211
- megadetector/postprocessing/subset_json_detector_output.py +265 -262
- megadetector/postprocessing/top_folders_to_bottom.py +45 -45
- megadetector/postprocessing/validate_batch_results.py +70 -70
- megadetector/taxonomy_mapping/map_lila_taxonomy_to_wi_taxonomy.py +52 -52
- megadetector/taxonomy_mapping/map_new_lila_datasets.py +15 -15
- megadetector/taxonomy_mapping/prepare_lila_taxonomy_release.py +14 -14
- megadetector/taxonomy_mapping/preview_lila_taxonomy.py +66 -69
- megadetector/taxonomy_mapping/retrieve_sample_image.py +16 -16
- megadetector/taxonomy_mapping/simple_image_download.py +8 -8
- megadetector/taxonomy_mapping/species_lookup.py +33 -33
- megadetector/taxonomy_mapping/taxonomy_csv_checker.py +14 -14
- megadetector/taxonomy_mapping/taxonomy_graph.py +11 -11
- megadetector/taxonomy_mapping/validate_lila_category_mappings.py +13 -13
- megadetector/utils/azure_utils.py +22 -22
- megadetector/utils/ct_utils.py +1019 -200
- megadetector/utils/directory_listing.py +21 -77
- megadetector/utils/gpu_test.py +22 -22
- megadetector/utils/md_tests.py +541 -518
- megadetector/utils/path_utils.py +1511 -406
- megadetector/utils/process_utils.py +41 -41
- megadetector/utils/sas_blob_utils.py +53 -49
- megadetector/utils/split_locations_into_train_val.py +73 -60
- megadetector/utils/string_utils.py +147 -26
- megadetector/utils/url_utils.py +463 -173
- megadetector/utils/wi_utils.py +2629 -2868
- megadetector/utils/write_html_image_list.py +137 -137
- megadetector/visualization/plot_utils.py +21 -21
- megadetector/visualization/render_images_with_thumbnails.py +37 -73
- megadetector/visualization/visualization_utils.py +424 -404
- megadetector/visualization/visualize_db.py +197 -190
- megadetector/visualization/visualize_detector_output.py +126 -98
- {megadetector-5.0.27.dist-info → megadetector-5.0.29.dist-info}/METADATA +6 -3
- megadetector-5.0.29.dist-info/RECORD +163 -0
- {megadetector-5.0.27.dist-info → megadetector-5.0.29.dist-info}/WHEEL +1 -1
- megadetector/data_management/importers/add_nacti_sizes.py +0 -52
- megadetector/data_management/importers/add_timestamps_to_icct.py +0 -79
- megadetector/data_management/importers/animl_results_to_md_results.py +0 -158
- megadetector/data_management/importers/auckland_doc_test_to_json.py +0 -373
- megadetector/data_management/importers/auckland_doc_to_json.py +0 -201
- megadetector/data_management/importers/awc_to_json.py +0 -191
- megadetector/data_management/importers/bellevue_to_json.py +0 -272
- megadetector/data_management/importers/cacophony-thermal-importer.py +0 -793
- megadetector/data_management/importers/carrizo_shrubfree_2018.py +0 -269
- megadetector/data_management/importers/carrizo_trail_cam_2017.py +0 -289
- megadetector/data_management/importers/cct_field_adjustments.py +0 -58
- megadetector/data_management/importers/channel_islands_to_cct.py +0 -913
- megadetector/data_management/importers/eMammal/copy_and_unzip_emammal.py +0 -180
- megadetector/data_management/importers/eMammal/eMammal_helpers.py +0 -249
- megadetector/data_management/importers/eMammal/make_eMammal_json.py +0 -223
- megadetector/data_management/importers/ena24_to_json.py +0 -276
- megadetector/data_management/importers/filenames_to_json.py +0 -386
- megadetector/data_management/importers/helena_to_cct.py +0 -283
- megadetector/data_management/importers/idaho-camera-traps.py +0 -1407
- megadetector/data_management/importers/idfg_iwildcam_lila_prep.py +0 -294
- megadetector/data_management/importers/import_desert_lion_conservation_camera_traps.py +0 -387
- megadetector/data_management/importers/jb_csv_to_json.py +0 -150
- megadetector/data_management/importers/mcgill_to_json.py +0 -250
- megadetector/data_management/importers/missouri_to_json.py +0 -490
- megadetector/data_management/importers/nacti_fieldname_adjustments.py +0 -79
- megadetector/data_management/importers/noaa_seals_2019.py +0 -181
- megadetector/data_management/importers/osu-small-animals-to-json.py +0 -364
- megadetector/data_management/importers/pc_to_json.py +0 -365
- megadetector/data_management/importers/plot_wni_giraffes.py +0 -123
- megadetector/data_management/importers/prepare_zsl_imerit.py +0 -131
- megadetector/data_management/importers/raic_csv_to_md_results.py +0 -416
- megadetector/data_management/importers/rspb_to_json.py +0 -356
- megadetector/data_management/importers/save_the_elephants_survey_A.py +0 -320
- megadetector/data_management/importers/save_the_elephants_survey_B.py +0 -329
- megadetector/data_management/importers/snapshot_safari_importer.py +0 -758
- megadetector/data_management/importers/snapshot_serengeti_lila.py +0 -1067
- megadetector/data_management/importers/snapshotserengeti/make_full_SS_json.py +0 -150
- megadetector/data_management/importers/snapshotserengeti/make_per_season_SS_json.py +0 -153
- megadetector/data_management/importers/sulross_get_exif.py +0 -65
- megadetector/data_management/importers/timelapse_csv_set_to_json.py +0 -490
- megadetector/data_management/importers/ubc_to_json.py +0 -399
- megadetector/data_management/importers/umn_to_json.py +0 -507
- megadetector/data_management/importers/wellington_to_json.py +0 -263
- megadetector/data_management/importers/wi_to_json.py +0 -442
- megadetector/data_management/importers/zamba_results_to_md_results.py +0 -180
- megadetector/data_management/lila/add_locations_to_island_camera_traps.py +0 -101
- megadetector/data_management/lila/add_locations_to_nacti.py +0 -151
- megadetector-5.0.27.dist-info/RECORD +0 -208
- {megadetector-5.0.27.dist-info → megadetector-5.0.29.dist-info}/licenses/LICENSE +0 -0
- {megadetector-5.0.27.dist-info → megadetector-5.0.29.dist-info}/top_level.txt +0 -0
megadetector/taxonomy_mapping/species_lookup.py

@@ -114,7 +114,7 @@ def initialize_taxonomy_lookup(force_init=False) -> None:
     if (not force_init) and (inat_taxonomy is not None):
         print('Skipping taxonomy re-init')
         return
-
+
     if (not force_init) and (os.path.isfile(serialized_structures_file)):

         print(f'De-serializing taxonomy data from {serialized_structures_file}')
@@ -135,7 +135,7 @@ def initialize_taxonomy_lookup(force_init=False) -> None:
             gbif_vernacular_to_taxon_id,\
             gbif_taxon_id_to_scientific,\
             gbif_scientific_to_taxon_id = structures_to_serialize
-
+
         return


@@ -146,7 +146,7 @@ def initialize_taxonomy_lookup(force_init=False) -> None:
     for taxonomy_name, zip_url in taxonomy_urls.items():

         need_to_download = False
-
+
         if force_init:
             need_to_download = True

@@ -267,7 +267,7 @@ def initialize_taxonomy_lookup(force_init=False) -> None:
     # Build iNat dictionaries

     print('Building lookup dictionaries for iNat taxonomy')
-
+
     for i_row, row in tqdm(inat_taxonomy.iterrows(), total=len(inat_taxonomy)):

         taxon_id = row['taxonID']
@@ -286,7 +286,7 @@ def initialize_taxonomy_lookup(force_init=False) -> None:
     # Build GBIF dictionaries

     print('Building lookup dictionaries for GBIF taxonomy')
-
+
     for i_row, row in tqdm(gbif_taxonomy.iterrows(), total=len(gbif_taxonomy)):

         taxon_id = row['taxonID']
@@ -596,21 +596,21 @@ class TaxonomicMatch:


 hyphenated_terms = ['crowned', 'backed', 'throated', 'tailed', 'headed', 'cheeked',
-                    'ruffed', 'browed', 'eating', 'striped', 'shanked',
+                    'ruffed', 'browed', 'eating', 'striped', 'shanked',
                     'fronted', 'bellied', 'spotted', 'eared', 'collared', 'breasted',
                     'necked']

 def get_preferred_taxonomic_match(query: str, taxonomy_preference = 'inat', retry=True) -> TaxonomicMatch:
     """
-    Wrapper for _get_preferred_taxonomic_match, but expressing a variety of heuristics
+    Wrapper for _get_preferred_taxonomic_match, but expressing a variety of heuristics
     and preferences that are specific to our scenario.
-
+
     Args:
         query (str): The common or scientific name we want to look up
         taxonomy_preference (str, optional): 'inat' or 'gbif'
-        retry (bool, optional): if the initial lookup fails, should we try heuristic
+        retry (bool, optional): if the initial lookup fails, should we try heuristic
             substitutions, e.g. replacing "_" with " ", or "spp" with "species"?
-
+
     Returns:
         TaxonomicMatch: the best taxonomic match, or None
     """
@@ -618,31 +618,31 @@ def get_preferred_taxonomic_match(query: str, taxonomy_preference = 'inat', retry=True) -> TaxonomicMatch:
     m,query = _get_preferred_taxonomic_match(query=query,taxonomy_preference=taxonomy_preference)
     if (len(m.scientific_name) > 0) or (not retry):
         return m
-
+
     for s in hyphenated_terms:
         query = query.replace(' ' + s,'-' + s)
     m,query = _get_preferred_taxonomic_match(query=query,taxonomy_preference=taxonomy_preference)
     return m
-
-
+
+
 def validate_and_convert(data):
     """
     Recursively validates that all elements in the nested structure are only
     tuples, lists, ints, or np.int64, and converts np.int64 to int.
-
+
     Args:
         data: The nested structure to validate and convert
-
+
     Returns:
         The validated and converted structure
-
+
     Raises:
         TypeError: If an invalid type is encountered
     """
-
-    if isinstance(data, np.int64):
+
+    if isinstance(data, np.int64):
         return int(data)
-    elif isinstance(data, int) or isinstance(data, str):
+    elif isinstance(data, int) or isinstance(data, str):
         return data
     elif isinstance(data, (list, tuple)):
         # Process lists and tuples recursively
@@ -654,17 +654,17 @@ def validate_and_convert(data):

 # ...def validate_and_convert(...)

-
+
 def _get_preferred_taxonomic_match(query: str, taxonomy_preference = 'inat') -> TaxonomicMatch:
-
+
     query = query.lower().strip().replace('_', ' ')
     query = query.replace('unidentified','')
     query = query.replace('unknown','')
     if query.endswith(' sp'):
         query = query.replace(' sp','')
     if query.endswith(' group'):
-        query = query.replace(' group','')
-
+        query = query.replace(' group','')
+
     query = query.strip()

     # query = 'person'
@@ -686,17 +686,17 @@ def _get_preferred_taxonomic_match(query: str, taxonomy_preference = 'inat') -> TaxonomicMatch:

     n_inat_matches = len(inat_matches)
     n_gbif_matches = len(gbif_matches)
-
+
     selected_matches = None
-
+
     assert taxonomy_preference in ['gbif','inat'],\
         'Unrecognized taxonomy preference: {}'.format(taxonomy_preference)
-
+
     if n_inat_matches > 0 and taxonomy_preference == 'inat':
         selected_matches = 'inat'
     elif n_gbif_matches > 0:
         selected_matches = 'gbif'
-
+
     if selected_matches == 'inat':

         i_match = 0
@@ -802,7 +802,7 @@ def _get_preferred_taxonomic_match(query: str, taxonomy_preference = 'inat') -> TaxonomicMatch:
     # Convert np.int64's to ints
     if match is not None:
         match = validate_and_convert(match)
-
+
     taxonomy_string = str(match)

     return TaxonomicMatch(scientific_name, common_name, taxonomic_level, source,
@@ -828,15 +828,15 @@ if False:
     # print(matches)

     print_taxonomy_matches(matches,verbose=True)
-
+
     print('\n\n')
-
+
     # Print the taxonomy in the taxonomy spreadsheet format
     assert matches[1]['source'] == 'inat'
     t = str(matches[1]['taxonomy'])
     print(t)
     import clipboard; clipboard.copy(t)
-
+

     #%% Directly access the taxonomy tables

@@ -848,12 +848,12 @@ if False:

 #%% Command-line driver

-def main():
+def main(): # noqa

     # Read command line inputs (absolute path)
     parser = argparse.ArgumentParser()
     parser.add_argument('input_file')
-
+
     if len(sys.argv[1:]) == 0:
         parser.print_help()
         parser.exit()
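The species_lookup.py hunks above are whitespace and docstring cleanup plus a # noqa marker on main(); the public interface of get_preferred_taxonomic_match is unchanged between 5.0.27 and 5.0.29. A minimal usage sketch, assuming the module path implied by the file list above and that initialize_taxonomy_lookup can download or de-serialize the taxonomy archives locally:

# Hedged sketch: module path inferred from the file list; attribute names
# (scientific_name, taxonomic_level, source) are taken from the hunks above
from megadetector.taxonomy_mapping.species_lookup import (
    initialize_taxonomy_lookup, get_preferred_taxonomic_match)

# Build (or de-serialize) the iNat/GBIF lookup dictionaries
initialize_taxonomy_lookup(force_init=False)

# Look up a common or scientific name, preferring the iNat taxonomy and
# retrying with heuristic substitutions (e.g. hyphenating 'tailed', 'headed',
# etc.) if the first lookup fails
match = get_preferred_taxonomic_match('mountain lion',
                                      taxonomy_preference='inat',
                                      retry=True)
if match is not None and len(match.scientific_name) > 0:
    print(match.scientific_name, match.taxonomic_level, match.source)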
megadetector/taxonomy_mapping/taxonomy_csv_checker.py

@@ -36,7 +36,7 @@ def check_taxonomy_csv(csv_path: str) -> None:
     """
     See module docstring.
     """
-
+
     taxonomy_df = pd.read_csv(csv_path)

     graph = nx.DiGraph()
@@ -46,12 +46,12 @@ def check_taxonomy_csv(csv_path: str) -> None:
     num_scientific_name_errors = 0

     for i_row, row in taxonomy_df.iterrows():
-
+
         ds = row['dataset_name']
         ds_label = row['query']
         scientific_name = row['scientific_name']
         level = row['taxonomy_level']
-
+
         # This used to represent the source of the mapping: iNat, gbif, or manual. We've
         # stopped tracking this, so this is now vestigial.
         id_source = 0 # row['source']
@@ -95,8 +95,8 @@ def check_taxonomy_csv(csv_path: str) -> None:
             num_scientific_name_errors += 1

         taxon_child = node
-
-    # ...for each row in the taxonomy file
+
+    # ...for each row in the taxonomy file

     assert nx.is_directed_acyclic_graph(graph)

@@ -124,36 +124,36 @@ def check_taxonomy_csv(csv_path: str) -> None:
         print(f'At least one node has unresolved ambiguous parents: {e}')

     print('Processed {} rows from {}'.format(len(taxonomy_df),csv_path))
-
+
     print('num taxon level errors:', num_taxon_level_errors)
     print('num scientific name errors:', num_scientific_name_errors)


 #%% Command-line driver
-
+
 if __name__ == '__main__':
-
+
     parser = argparse.ArgumentParser()
     parser.add_argument(
         'taxonomy_csv_path',
         help='path to taxonomy CSV file')
-
+
     if len(sys.argv[1:]) == 0:
         parser.print_help()
         parser.exit()
-
+
     args = parser.parse_args()

     check_taxonomy_csv(args.taxonomy_csv_path)


 #%% Interactive driver
-
+
 if False:
-
+
     #%%
-
+
     import os
     csv_path = os.path.expanduser('~/lila/lila-taxonomy-mapping_release.csv')
     check_taxonomy_csv(csv_path)
-
+
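The taxonomy_csv_checker.py changes are blank-line and trailing-whitespace cleanup only; check_taxonomy_csv still takes a single CSV path, as the command-line and interactive drivers above show. A usage sketch mirroring the interactive driver (the CSV path is a placeholder, and the module path is inferred from the file list):

# Hedged sketch based on the interactive driver in the hunk above
import os
from megadetector.taxonomy_mapping.taxonomy_csv_checker import check_taxonomy_csv

# Validates the taxonomy mapping: builds a networkx DiGraph from the CSV rows,
# asserts it is acyclic, and prints taxon-level / scientific-name error counts
csv_path = os.path.expanduser('~/lila/lila-taxonomy-mapping_release.csv')
check_taxonomy_csv(csv_path)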
megadetector/taxonomy_mapping/taxonomy_graph.py

@@ -1,4 +1,4 @@
-"""
+r"""

 taxonomy_graph.py

@@ -69,7 +69,7 @@ class TaxonNode:
     By default, we support multiple parents for each TaxonNode. See discussion
     in module docstring above.
     """
-
+
     # class variables
     single_parent_only: ClassVar[bool] = False

@@ -82,7 +82,7 @@ class TaxonNode:

     def __init__(self, level: str, name: str,
                  graph: Optional[nx.DiGraph] = None):
-
+
         self.level = level
         self.name = name
         self.graph = graph
@@ -131,7 +131,7 @@ class TaxonNode:
         Args:
             parent: TaxonNode, must be higher in the taxonomical hierarchy
         """
-
+
         assert self.graph is not None
         parents = self.parents
         if TaxonNode.single_parent_only and len(parents) > 0:
@@ -150,7 +150,7 @@ class TaxonNode:
         Args:
             child: TaxonNode, must be lower in the taxonomical hierarchy
         """
-
+
         assert self.graph is not None
         self.graph.add_edge(self, child)

@@ -160,7 +160,7 @@ class TaxonNode:
            ds: str, name of dataset
            ds_label: str, name of label used by that dataset
        """
-
+
        self.dataset_labels.add((ds, ds_label))

     def get_dataset_labels(self,
@@ -176,7 +176,7 @@ class TaxonNode:

        Returns: set of (ds, ds_label) tuples
        """
-
+
        result = self.dataset_labels
        if include_datasets is not None:
            result = set(tup for tup in result if tup[0] in include_datasets)
@@ -199,7 +199,7 @@ class TaxonNode:

        Returns: TaxonNode, the LCA if it exists, or None if no LCA exists
        """
-
+
        paths = []
        for node in nodes:
            # get path to root
@@ -242,7 +242,7 @@ def build_taxonomy_graph(taxonomy_df: pd.DataFrame
            TaxonNode node in the tree that contains the label,
            keys are all lowercase
     """
-
+
     graph = nx.DiGraph()
     taxon_to_node = {} # maps (taxon_level, taxon_name) to a TaxonNode
     label_to_node = {} # maps (dataset_name, dataset_label) to a TaxonNode
@@ -303,12 +303,12 @@ def dag_to_tree(graph: nx.DiGraph,
     component separately.

     Args:
-        graph: nx.DiGraph, DAG representation of taxonomy
+        graph: nx.DiGraph, DAG representation of taxonomy hierarchy
         taxon_to_node: dict, maps (taxon_level, taxon_name) to a TaxonNode

     Returns: nx.DiGraph, a tree-structured graph
     """
-
+
     tree = nx.DiGraph()
     for node in graph.nodes:
         tree.add_node(node)
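Aside from whitespace cleanup, the only substantive edits to taxonomy_graph.py are the raw-string docstring prefix ("""  → r""") and the reworded dag_to_tree docstring. A hedged sketch of the two module-level helpers visible above; the three-tuple return of build_taxonomy_graph is an assumption based on the names in its body (graph, taxon_to_node, label_to_node):

# Hedged sketch: function names and parameter types come from the hunks above;
# the return order of build_taxonomy_graph is assumed
import pandas as pd
from megadetector.taxonomy_mapping.taxonomy_graph import build_taxonomy_graph, dag_to_tree

taxonomy_df = pd.read_csv('lila-taxonomy-mapping_release.csv')  # placeholder path

# DAG of TaxonNode objects, plus lookup dicts keyed by (taxon_level, taxon_name)
# and (dataset_name, dataset_label); keys are all lowercase
graph, taxon_to_node, label_to_node = build_taxonomy_graph(taxonomy_df)

# Collapse the (possibly multi-parent) DAG into a tree-structured nx.DiGraph
tree = dag_to_tree(graph, taxon_to_node)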
megadetector/taxonomy_mapping/validate_lila_category_mappings.py

@@ -17,9 +17,9 @@ from megadetector.data_management.lila.lila_common import read_lila_taxonomy_mapping
 #%% Prevent execution during infrastructural imports

 if False:
-
+
     #%% Constants
-
+
     lila_local_base = os.path.expanduser('~/lila')

     metadata_dir = os.path.join(lila_local_base,'metadata')
@@ -30,7 +30,7 @@ if False:
     lila_dataset_to_categories_file = os.path.join(category_list_dir,'lila_dataset_to_categories.json')

     assert os.path.isfile(lila_dataset_to_categories_file)
-
+

     #%% Load category and taxonomy files

@@ -48,36 +48,36 @@ if False:

     # i_row = 1; row = taxonomy_df.iloc[i_row]; row
     for i_row,row in taxonomy_df.iterrows():
-
+
         ds_query = row['dataset_name'] + ':' + row['query']
         ds_query = ds_query.lower()
-
+
         if not isinstance(row['scientific_name'],str):
             unmapped_queries.add(ds_query)
             ds_query_to_scientific_name[ds_query] = 'unmapped'
             continue
-
+
         ds_query_to_scientific_name[ds_query] = row['scientific_name']
-
-
+
+
     #%% For each dataset, make sure we can map every category to the taxonomy

     # dataset_name = list(lila_dataset_to_categories.keys())[0]
     for _dataset_name in lila_dataset_to_categories.keys():
-
+
         if '_bbox' in _dataset_name:
             dataset_name = _dataset_name.replace('_bbox','')
         else:
             dataset_name = _dataset_name
-
+
         categories = lila_dataset_to_categories[dataset_name]
-
+
         # c = categories[0]
         for c in categories:
             ds_query = dataset_name + ':' + c['name']
             ds_query = ds_query.lower()
-
+
             if ds_query not in ds_query_to_scientific_name:
-                print('Could not find mapping for {}'.format(ds_query))
+                print('Could not find mapping for {}'.format(ds_query))
             else:
                 scientific_name = ds_query_to_scientific_name[ds_query]
megadetector/utils/azure_utils.py

@@ -12,8 +12,8 @@ Requires azure-storage-blob>=12.4.0

 import json

-from typing import Any, Iterable, List, Optional, Tuple, Union
-from azure.storage.blob import BlobPrefix, ContainerClient
+from typing import Any, Iterable, Optional, Union
+from azure.storage.blob import BlobPrefix, ContainerClient # type: ignore

 from megadetector.utils import path_utils
 from megadetector.utils import sas_blob_utils
@@ -26,20 +26,20 @@ def walk_container(container_client: ContainerClient,
                    prefix: str = '',
                    store_folders: bool = True,
                    store_blobs: bool = True,
-                   debug_max_items: int = -1) -> Tuple[List[str], List[str]]:
+                   debug_max_items: int = -1) -> tuple[list[str], list[str]]:
     """
     Recursively walk folders a Azure Blob Storage container.

     Based on:
     https://github.com/Azure/azure-sdk-for-python/blob/master/sdk/storage/azure-storage-blob/samples/blob_samples_walk_blob_hierarchy.py
     """
-
+
     depth = 1

     def walk_blob_hierarchy(prefix: str,
-                            folders: Optional[List[str]] = None,
-                            blobs: Optional[List[str]] = None
-                            ) -> Tuple[List[str], List[str]]:
+                            folders: Optional[list[str]] = None,
+                            blobs: Optional[list[str]] = None
+                            ) -> tuple[list[str], list[str]]:
         if folders is None:
             folders = []
         if blobs is None:
@@ -76,11 +76,11 @@ def walk_container(container_client: ContainerClient,
     return folders, blobs


-def list_top_level_blob_folders(container_client: ContainerClient) -> List[str]:
+def list_top_level_blob_folders(container_client: ContainerClient) -> list[str]:
     """
     List all top-level folders in a container.
     """
-
+
     top_level_folders, _ = walk_container(
         container_client, max_depth=1, store_blobs=False)
     return top_level_folders
@@ -88,13 +88,13 @@ def list_top_level_blob_folders(container_client: ContainerClient) -> List[str]:

 def concatenate_json_lists(input_files: Iterable[str],
                            output_file: Optional[str] = None
-                           ) -> List[Any]:
+                           ) -> list[Any]:
     """
     Given a list of JSON files that contain lists (typically string
     filenames), concatenates the lists into a single list and optionally
     writes out this list to a new output JSON file.
     """
-
+
     output_list = []
     for fn in input_files:
         with open(fn, 'r') as f:
@@ -116,12 +116,12 @@ def upload_file_to_blob(account_name: str,
     Uploads a local file to Azure Blob Storage and returns the uploaded
     blob URI with SAS token.
     """
-
+
     container_uri = sas_blob_utils.build_azure_storage_uri(
         account=account_name, container=container_name, sas_token=sas_token)
     with open(local_path, 'rb') as data:
         return sas_blob_utils.upload_blob(
-            container_uri=container_uri, blob_name=blob_name, data=data,
+            container_uri=container_uri, blob_name=blob_name, data=data,
             overwrite=overwrite)


@@ -131,11 +131,11 @@ def enumerate_blobs_to_file(
         container_name: str,
         sas_token: Optional[str] = None,
         blob_prefix: Optional[str] = None,
-        blob_suffix: Optional[Union[str, Tuple[str]]] = None,
+        blob_suffix: Optional[Union[str, tuple[str]]] = None,
         rsearch: Optional[str] = None,
         limit: Optional[int] = None,
         verbose: Optional[bool] = True
-        ) -> List[str]:
+        ) -> list[str]:
     """
     Enumerates blobs in a container, and writes the blob names to an output
     file.
@@ -143,7 +143,7 @@ def enumerate_blobs_to_file(
     Args:
         output_file: str, path to save list of files in container
             If ends in '.json', writes a JSON string. Otherwise, writes a
-            newline-delimited list. Can be None, in which case this is just a
+            newline-delimited list. Can be None, in which case this is just a
             convenient wrapper for blob enumeration.
         account_name: str, Azure Storage account name
         container_name: str, Azure Blob Storage container name
@@ -155,24 +155,24 @@ def enumerate_blobs_to_file(
             be lowercased first before comparing with the suffix(es).
         rsearch: optional str, returned results will only contain blob names
             that match this regex. Can also be a list of regexes, in which case
-            blobs matching *any* of the regex's will be returned.
+            blobs matching *any* of the regex's will be returned.
         limit: int, maximum # of blob names to list
             if None, then returns all blob names

     Returns: list of str, sorted blob names, of length limit or shorter.
     """
-
+
     if sas_token is not None and len(sas_token) > 9 and sas_token[0] == '?':
         sas_token = sas_token[1:]
-
+
     container_uri = sas_blob_utils.build_azure_storage_uri(
         account=account_name, container=container_name, sas_token=sas_token)
-
+
     matched_blobs = sas_blob_utils.list_blobs_in_container(
         container_uri=container_uri, blob_prefix=blob_prefix,
         blob_suffix=blob_suffix, rsearch=rsearch, limit=limit, verbose=verbose)
-
+
     if output_file is not None:
         path_utils.write_list_to_file(output_file, matched_blobs)
-
+
     return matched_blobs
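The azure_utils.py changes migrate annotations from typing.List/Tuple to the builtin list/tuple generics, add a # type: ignore to the azure-storage-blob import, and clean up whitespace; runtime behavior is unchanged. A hedged usage sketch of enumerate_blobs_to_file as documented in the hunks above (account, container, and filter values are placeholders):

# Hedged sketch: parameter names, defaults, and behavior notes are taken from the
# signature and docstring shown above; the storage account details are placeholders
from megadetector.utils.azure_utils import enumerate_blobs_to_file

matched_blobs = enumerate_blobs_to_file(
    output_file='blobs.json',   # '.json' -> JSON list; other extensions -> newline-delimited text
    account_name='myaccount',
    container_name='mycontainer',
    sas_token=None,             # optional; a leading '?' is stripped automatically
    blob_prefix='images/',
    blob_suffix='.jpg',         # str or tuple of str; blob names are lowercased before comparison
    limit=1000)                 # None to enumerate everything

print('Matched {} blobs'.format(len(matched_blobs)))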