PyPI - megadetector - Versions diffs - 5.0.28__py3-none-any.whl → 10.0.0__py3-none-any.whl - Mend

megadetector 5.0.28__py3-none-any.whl → 10.0.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of megadetector might be problematic. Click here for more details.

Files changed (197) hide show

megadetector/api/batch_processing/integration/digiKam/xmp_integration.py +2 -2
megadetector/api/batch_processing/integration/eMammal/test_scripts/push_annotations_to_emammal.py +1 -1
megadetector/api/batch_processing/integration/eMammal/test_scripts/select_images_for_testing.py +1 -1
megadetector/classification/aggregate_classifier_probs.py +3 -3
megadetector/classification/analyze_failed_images.py +5 -5
megadetector/classification/cache_batchapi_outputs.py +5 -5
megadetector/classification/create_classification_dataset.py +11 -12
megadetector/classification/crop_detections.py +10 -10
megadetector/classification/csv_to_json.py +8 -8
megadetector/classification/detect_and_crop.py +13 -15
megadetector/classification/efficientnet/model.py +8 -8
megadetector/classification/efficientnet/utils.py +6 -5
megadetector/classification/evaluate_model.py +7 -7
megadetector/classification/identify_mislabeled_candidates.py +6 -6
megadetector/classification/json_to_azcopy_list.py +1 -1
megadetector/classification/json_validator.py +29 -32
megadetector/classification/map_classification_categories.py +9 -9
megadetector/classification/merge_classification_detection_output.py +12 -9
megadetector/classification/prepare_classification_script.py +19 -19
megadetector/classification/prepare_classification_script_mc.py +26 -26
megadetector/classification/run_classifier.py +4 -4
megadetector/classification/save_mislabeled.py +6 -6
megadetector/classification/train_classifier.py +1 -1
megadetector/classification/train_classifier_tf.py +9 -9
megadetector/classification/train_utils.py +10 -10
megadetector/data_management/annotations/annotation_constants.py +1 -2
megadetector/data_management/camtrap_dp_to_coco.py +79 -46
megadetector/data_management/cct_json_utils.py +103 -103
megadetector/data_management/cct_to_md.py +49 -49
megadetector/data_management/cct_to_wi.py +33 -33
megadetector/data_management/coco_to_labelme.py +75 -75
megadetector/data_management/coco_to_yolo.py +210 -193
megadetector/data_management/databases/add_width_and_height_to_db.py +86 -12
megadetector/data_management/databases/combine_coco_camera_traps_files.py +40 -40
megadetector/data_management/databases/integrity_check_json_db.py +228 -200
megadetector/data_management/databases/subset_json_db.py +33 -33
megadetector/data_management/generate_crops_from_cct.py +88 -39
megadetector/data_management/get_image_sizes.py +54 -49
megadetector/data_management/labelme_to_coco.py +133 -125
megadetector/data_management/labelme_to_yolo.py +159 -73
megadetector/data_management/lila/create_lila_blank_set.py +81 -83
megadetector/data_management/lila/create_lila_test_set.py +32 -31
megadetector/data_management/lila/create_links_to_md_results_files.py +18 -18
megadetector/data_management/lila/download_lila_subset.py +21 -24
megadetector/data_management/lila/generate_lila_per_image_labels.py +365 -107
megadetector/data_management/lila/get_lila_annotation_counts.py +35 -33
megadetector/data_management/lila/get_lila_image_counts.py +22 -22
megadetector/data_management/lila/lila_common.py +73 -70
megadetector/data_management/lila/test_lila_metadata_urls.py +28 -19
megadetector/data_management/mewc_to_md.py +344 -340
megadetector/data_management/ocr_tools.py +262 -255
megadetector/data_management/read_exif.py +249 -227
megadetector/data_management/remap_coco_categories.py +90 -28
megadetector/data_management/remove_exif.py +81 -21
megadetector/data_management/rename_images.py +187 -187
megadetector/data_management/resize_coco_dataset.py +588 -120
megadetector/data_management/speciesnet_to_md.py +41 -41
megadetector/data_management/wi_download_csv_to_coco.py +55 -55
megadetector/data_management/yolo_output_to_md_output.py +248 -122
megadetector/data_management/yolo_to_coco.py +333 -191
megadetector/detection/change_detection.py +832 -0
megadetector/detection/process_video.py +340 -337
megadetector/detection/pytorch_detector.py +358 -278
megadetector/detection/run_detector.py +399 -186
megadetector/detection/run_detector_batch.py +404 -377
megadetector/detection/run_inference_with_yolov5_val.py +340 -327
megadetector/detection/run_tiled_inference.py +257 -249
megadetector/detection/tf_detector.py +24 -24
megadetector/detection/video_utils.py +332 -295
megadetector/postprocessing/add_max_conf.py +19 -11
megadetector/postprocessing/categorize_detections_by_size.py +45 -45
megadetector/postprocessing/classification_postprocessing.py +468 -433
megadetector/postprocessing/combine_batch_outputs.py +23 -23
megadetector/postprocessing/compare_batch_results.py +590 -525
megadetector/postprocessing/convert_output_format.py +106 -102
megadetector/postprocessing/create_crop_folder.py +347 -147
megadetector/postprocessing/detector_calibration.py +173 -168
megadetector/postprocessing/generate_csv_report.py +508 -499
megadetector/postprocessing/load_api_results.py +48 -27
megadetector/postprocessing/md_to_coco.py +133 -102
megadetector/postprocessing/md_to_labelme.py +107 -90
megadetector/postprocessing/md_to_wi.py +40 -40
megadetector/postprocessing/merge_detections.py +92 -114
megadetector/postprocessing/postprocess_batch_results.py +319 -301
megadetector/postprocessing/remap_detection_categories.py +91 -38
megadetector/postprocessing/render_detection_confusion_matrix.py +214 -205
megadetector/postprocessing/repeat_detection_elimination/find_repeat_detections.py +57 -57
megadetector/postprocessing/repeat_detection_elimination/remove_repeat_detections.py +27 -28
megadetector/postprocessing/repeat_detection_elimination/repeat_detections_core.py +704 -679
megadetector/postprocessing/separate_detections_into_folders.py +226 -211
megadetector/postprocessing/subset_json_detector_output.py +265 -262
megadetector/postprocessing/top_folders_to_bottom.py +45 -45
megadetector/postprocessing/validate_batch_results.py +70 -70
megadetector/taxonomy_mapping/map_lila_taxonomy_to_wi_taxonomy.py +52 -52
megadetector/taxonomy_mapping/map_new_lila_datasets.py +18 -19
megadetector/taxonomy_mapping/prepare_lila_taxonomy_release.py +54 -33
megadetector/taxonomy_mapping/preview_lila_taxonomy.py +67 -67
megadetector/taxonomy_mapping/retrieve_sample_image.py +16 -16
megadetector/taxonomy_mapping/simple_image_download.py +8 -8
megadetector/taxonomy_mapping/species_lookup.py +156 -74
megadetector/taxonomy_mapping/taxonomy_csv_checker.py +14 -14
megadetector/taxonomy_mapping/taxonomy_graph.py +10 -10
megadetector/taxonomy_mapping/validate_lila_category_mappings.py +13 -13
megadetector/utils/ct_utils.py +1049 -211
megadetector/utils/directory_listing.py +21 -77
megadetector/utils/gpu_test.py +22 -22
megadetector/utils/md_tests.py +632 -529
megadetector/utils/path_utils.py +1520 -431
megadetector/utils/process_utils.py +41 -41
megadetector/utils/split_locations_into_train_val.py +62 -62
megadetector/utils/string_utils.py +148 -27
megadetector/utils/url_utils.py +489 -176
megadetector/utils/wi_utils.py +2658 -2526
megadetector/utils/write_html_image_list.py +137 -137
megadetector/visualization/plot_utils.py +34 -30
megadetector/visualization/render_images_with_thumbnails.py +39 -74
megadetector/visualization/visualization_utils.py +487 -435
megadetector/visualization/visualize_db.py +232 -198
megadetector/visualization/visualize_detector_output.py +82 -76
{megadetector-5.0.28.dist-info → megadetector-10.0.0.dist-info}/METADATA +5 -2
megadetector-10.0.0.dist-info/RECORD +139 -0
{megadetector-5.0.28.dist-info → megadetector-10.0.0.dist-info}/WHEEL +1 -1
megadetector/api/batch_processing/api_core/__init__.py +0 -0
megadetector/api/batch_processing/api_core/batch_service/__init__.py +0 -0
megadetector/api/batch_processing/api_core/batch_service/score.py +0 -439
megadetector/api/batch_processing/api_core/server.py +0 -294
megadetector/api/batch_processing/api_core/server_api_config.py +0 -97
megadetector/api/batch_processing/api_core/server_app_config.py +0 -55
megadetector/api/batch_processing/api_core/server_batch_job_manager.py +0 -220
megadetector/api/batch_processing/api_core/server_job_status_table.py +0 -149
megadetector/api/batch_processing/api_core/server_orchestration.py +0 -360
megadetector/api/batch_processing/api_core/server_utils.py +0 -88
megadetector/api/batch_processing/api_core_support/__init__.py +0 -0
megadetector/api/batch_processing/api_core_support/aggregate_results_manually.py +0 -46
megadetector/api/batch_processing/api_support/__init__.py +0 -0
megadetector/api/batch_processing/api_support/summarize_daily_activity.py +0 -152
megadetector/api/batch_processing/data_preparation/__init__.py +0 -0
megadetector/api/synchronous/__init__.py +0 -0
megadetector/api/synchronous/api_core/animal_detection_api/__init__.py +0 -0
megadetector/api/synchronous/api_core/animal_detection_api/api_backend.py +0 -151
megadetector/api/synchronous/api_core/animal_detection_api/api_frontend.py +0 -263
megadetector/api/synchronous/api_core/animal_detection_api/config.py +0 -35
megadetector/api/synchronous/api_core/tests/__init__.py +0 -0
megadetector/api/synchronous/api_core/tests/load_test.py +0 -110
megadetector/data_management/importers/add_nacti_sizes.py +0 -52
megadetector/data_management/importers/add_timestamps_to_icct.py +0 -79
megadetector/data_management/importers/animl_results_to_md_results.py +0 -158
megadetector/data_management/importers/auckland_doc_test_to_json.py +0 -373
megadetector/data_management/importers/auckland_doc_to_json.py +0 -201
megadetector/data_management/importers/awc_to_json.py +0 -191
megadetector/data_management/importers/bellevue_to_json.py +0 -272
megadetector/data_management/importers/cacophony-thermal-importer.py +0 -793
megadetector/data_management/importers/carrizo_shrubfree_2018.py +0 -269
megadetector/data_management/importers/carrizo_trail_cam_2017.py +0 -289
megadetector/data_management/importers/cct_field_adjustments.py +0 -58
megadetector/data_management/importers/channel_islands_to_cct.py +0 -913
megadetector/data_management/importers/eMammal/copy_and_unzip_emammal.py +0 -180
megadetector/data_management/importers/eMammal/eMammal_helpers.py +0 -249
megadetector/data_management/importers/eMammal/make_eMammal_json.py +0 -223
megadetector/data_management/importers/ena24_to_json.py +0 -276
megadetector/data_management/importers/filenames_to_json.py +0 -386
megadetector/data_management/importers/helena_to_cct.py +0 -283
megadetector/data_management/importers/idaho-camera-traps.py +0 -1407
megadetector/data_management/importers/idfg_iwildcam_lila_prep.py +0 -294
megadetector/data_management/importers/import_desert_lion_conservation_camera_traps.py +0 -387
megadetector/data_management/importers/jb_csv_to_json.py +0 -150
megadetector/data_management/importers/mcgill_to_json.py +0 -250
megadetector/data_management/importers/missouri_to_json.py +0 -490
megadetector/data_management/importers/nacti_fieldname_adjustments.py +0 -79
megadetector/data_management/importers/noaa_seals_2019.py +0 -181
megadetector/data_management/importers/osu-small-animals-to-json.py +0 -364
megadetector/data_management/importers/pc_to_json.py +0 -365
megadetector/data_management/importers/plot_wni_giraffes.py +0 -123
megadetector/data_management/importers/prepare_zsl_imerit.py +0 -131
megadetector/data_management/importers/raic_csv_to_md_results.py +0 -416
megadetector/data_management/importers/rspb_to_json.py +0 -356
megadetector/data_management/importers/save_the_elephants_survey_A.py +0 -320
megadetector/data_management/importers/save_the_elephants_survey_B.py +0 -329
megadetector/data_management/importers/snapshot_safari_importer.py +0 -758
megadetector/data_management/importers/snapshot_serengeti_lila.py +0 -1067
megadetector/data_management/importers/snapshotserengeti/make_full_SS_json.py +0 -150
megadetector/data_management/importers/snapshotserengeti/make_per_season_SS_json.py +0 -153
megadetector/data_management/importers/sulross_get_exif.py +0 -65
megadetector/data_management/importers/timelapse_csv_set_to_json.py +0 -490
megadetector/data_management/importers/ubc_to_json.py +0 -399
megadetector/data_management/importers/umn_to_json.py +0 -507
megadetector/data_management/importers/wellington_to_json.py +0 -263
megadetector/data_management/importers/wi_to_json.py +0 -442
megadetector/data_management/importers/zamba_results_to_md_results.py +0 -180
megadetector/data_management/lila/add_locations_to_island_camera_traps.py +0 -101
megadetector/data_management/lila/add_locations_to_nacti.py +0 -151
megadetector/utils/azure_utils.py +0 -178
megadetector/utils/sas_blob_utils.py +0 -509
megadetector-5.0.28.dist-info/RECORD +0 -209
/megadetector/{api/batch_processing/__init__.py → __init__.py} +0 -0
{megadetector-5.0.28.dist-info → megadetector-10.0.0.dist-info}/licenses/LICENSE +0 -0
{megadetector-5.0.28.dist-info → megadetector-10.0.0.dist-info}/top_level.txt +0 -0

megadetector/taxonomy_mapping/preview_lila_taxonomy.py CHANGED Viewed

@@ -16,7 +16,7 @@ import os
 import pandas as pd
 # lila_taxonomy_file = r"c:\git\agentmorrisprivate\lila-taxonomy\lila-taxonomy-mapping.csv"
-lila_taxonomy_file = os.path.expanduser('~/lila/lila_additions_2025.03.24.csv')
+lila_taxonomy_file = os.path.expanduser('~/lila/lila_additions_2025.06.23.csv')
 preview_base = os.path.expanduser('~/lila/lila_taxonomy_preview')
 os.makedirs(preview_base,exist_ok=True)
@@ -27,20 +27,20 @@ html_output_file = os.path.join(preview_base,'index.html')
 def parse_taxonomy_string(taxonomy_string):
-    taxonomic_match = eval(taxonomy_string)
+    taxonomic_match = eval(taxonomy_string)
     matched_entity = taxonomic_match[0]
     assert len(matched_entity) == 4
     level = matched_entity[1]
     scientific_name = matched_entity[2]
     common_names = matched_entity[3]
     if len(common_names) == 1:
         common_name = common_names[0]
     else:
         common_name = str(common_names)
     return scientific_name,common_name,level,taxonomic_match
 def taxonomy_string_to_common_name(taxonomy_string):
@@ -79,14 +79,14 @@ n_taxonomy_changes = 0
 # Look for internal inconsistency
 for i_row,row in df.iterrows():
     sn = row['scientific_name']
     if not isinstance(sn,str):
         continue
-    ts = row['taxonomy_string']
+    ts = row['taxonomy_string']
     assert sn == taxonomy_string_to_scientific(ts)
     assert row['taxonomy_level'] == taxonomy_string_to_level(ts)
 # Look for outdated mappings
@@ -94,18 +94,18 @@ taxonomy_preference = 'inat'
 # i_row = 0; row = df.iloc[i_row]
 for i_row,row in tqdm(df.iterrows(),total=len(df)):
     sn = row['scientific_name']
     if not isinstance(sn,str):
         continue
     m = get_preferred_taxonomic_match(sn,taxonomy_preference)
     assert m.scientific_name == sn
     ts = row['taxonomy_string']
     assert m.taxonomy_string[0:50] == ts[0:50], 'Mismatch for {}:\n\n{}\n\n{}\n'.format(
         row['dataset_name'],ts,m.taxonomy_string)
     if ts != m.taxonomy_string:
         n_taxonomy_changes += 1
         df.loc[i_row,'taxonomy_string'] = m.taxonomy_string
@@ -161,45 +161,45 @@ suppress_multiple_matches = [
     ['porcupine','Snapshot Kruger','Idaho Camera Traps'],
     ['porcupine','Snapshot Mountain Zebra','Idaho Camera Traps'],
     ['porcupine','Snapshot Serengeti','Idaho Camera Traps'],
     ['porcupine','Snapshot Serengeti','Snapshot Mountain Zebra'],
     ['porcupine','Snapshot Serengeti','Snapshot Kruger'],
     ['porcupine','Snapshot Serengeti','Snapshot Kgalagadi'],
     ['porcupine','Snapshot Serengeti','Snapshot Karoo'],
     ['porcupine','Snapshot Serengeti','Snapshot Camdeboo'],
     ['porcupine','Snapshot Enonkishu','Snapshot Camdeboo'],
     ['porcupine','Snapshot Enonkishu','Snapshot Mountain Zebra'],
     ['porcupine','Snapshot Enonkishu','Snapshot Kruger'],
     ['porcupine','Snapshot Enonkishu','Snapshot Kgalagadi'],
     ['porcupine','Snapshot Enonkishu','Snapshot Karoo'],
     ['kudu','Snapshot Serengeti','Snapshot Mountain Zebra'],
     ['kudu','Snapshot Serengeti','Snapshot Kruger'],
     ['kudu','Snapshot Serengeti','Snapshot Kgalagadi'],
     ['kudu','Snapshot Serengeti','Snapshot Karoo'],
     ['kudu','Snapshot Serengeti','Snapshot Camdeboo'],
     ['fox','Caltech Camera Traps','Channel Islands Camera Traps'],
     ['fox','Idaho Camera Traps','Channel Islands Camera Traps'],
     ['fox','Idaho Camera Traps','Caltech Camera Traps'],
     ['pangolin','Snapshot Serengeti','SWG Camera Traps'],
     ['deer', 'Wellington Camera Traps', 'Idaho Camera Traps'],
     ['deer', 'Wellington Camera Traps', 'Caltech Camera Traps'],
     ['unknown cervid', 'WCS Camera Traps', 'Idaho Camera Traps']
 ]
 for i_row,row in df.iterrows():
     query = row['query']
     taxonomy_string = row['taxonomy_string']
     for previous_i_row in query_to_rows[query]:
         previous_row = df.iloc[previous_i_row]
         assert previous_row['query'] == query
         query_match = False
@@ -209,11 +209,11 @@ for i_row,row in df.iterrows():
             query_match = isnan(row['taxonomy_string'])
         else:
             query_match = previous_row['taxonomy_string'][0:10] == taxonomy_string[0:10]
         if not query_match:
             suppress = False
             # x = suppress_multiple_matches[-1]
             for x in suppress_multiple_matches:
                 if x[0] == query and \
@@ -225,18 +225,18 @@ for i_row,row in df.iterrows():
                     suppress = True
                     n_suppressed += 1
                     break
             if not suppress:
                 print('Query {} in {} and {}:\n\n{}\n\n{}\n'.format(
                     query, row['dataset_name'], previous_row['dataset_name'],
                     taxonomy_string, previous_row['taxonomy_string']))
             queries_with_multiple_mappings.add(query)
     # ...for each row where we saw this query
     query_to_rows[query].append(i_row)
 # ...for each row
 print('Found {} queries with multiple mappings ({} occurrences suppressed)'.format(
@@ -267,9 +267,9 @@ for i_row,row in df.iterrows():
         ) \
         and \
         ('species' in level):
         if query not in allowable_unknown_species:
             print('Warning: query {}:{} maps to {} {}'.format(
                 row['dataset_name'],
                 row['query'],
@@ -285,7 +285,7 @@ for i_row,row in df.iterrows():
         if 'source' in row:
             assert isinstance(row['source'],str)
         assert isinstance(row['taxonomy_level'],str)
 #%% Find WCS mappings that aren't species or aren't the same as the input
@@ -294,22 +294,22 @@ for i_row,row in df.iterrows():
 # row = df.iloc[-500]
 for i_row,row in df.iterrows():
     if not isinstance(row['scientific_name'],str):
         continue
     if 'WCS' not in row['dataset_name']:
         continue
     query = row['query']
     scientific_name = row['scientific_name']
     common_name = row['common_name']
-    level = row['taxonomy_level']
+    level = row['taxonomy_level']
     taxonomy_string = row['taxonomy_string']
-    common_name_from_taxonomy = taxonomy_string_to_common_name(taxonomy_string)
+    common_name_from_taxonomy = taxonomy_string_to_common_name(taxonomy_string)
     query_string = query.replace(' sp','')
     query_string = query_string.replace('unknown ','')
     # Anything marked "species" or "unknown" by definition doesn't map to a species,
     # so ignore these.
     if (' sp' not in query) and ('unknown' not in query) and \
@@ -317,7 +317,7 @@ for i_row,row in df.iterrows():
         print('WCS query {} ({}) remapped to {} {} ({})'.format(
             query,common_name,level,scientific_name,common_name_from_taxonomy))
-    if query_string != scientific_name:
+    if query_string != scientific_name:
         pass
         # print('WCS query {} ({}) remapped to {} ({})'.format(
         #     query,common_name,scientific_name,common_names_from_taxonomy))
@@ -345,20 +345,20 @@ min_valid_image_size = 3000
 #
 # i_row = 0; row = df.iloc[i_row]
 for i_row,row in df.iterrows():
     s = row['scientific_name']
     if (not isinstance(s,str)) or (len(s)==0):
         continue
     query = s.replace(' ','+')
     if query in remapped_queries:
         query = remapped_queries[query]
     query_folder = os.path.join(image_base,query)
     os.makedirs(query_folder,exist_ok=True)
     # Check whether we already have enough images for this query
     image_files = os.listdir(query_folder)
     image_fullpaths = [os.path.join(query_folder,fn) for fn in image_files]
@@ -371,7 +371,7 @@ for i_row,row in df.iterrows():
     # Check whether we've already run this query for a previous row
     if query in scientific_name_to_paths:
         continue
     print('Processing query {} of {} ({})'.format(i_row,len(df),query))
     paths = retrieve_sample_image.download_images(query=query,
                                              output_directory=image_base,
@@ -404,40 +404,40 @@ scientific_name_to_preferred_images = {}
 # s = list(scientific_name_to_paths.keys())[0]
 for s in list(df.scientific_name):
     if not isinstance(s,str):
         continue
     query = s.replace(' ','+')
     if query in remapped_queries:
         query = remapped_queries[query]
     query_folder = os.path.join(image_base,query)
     assert os.path.isdir(query_folder)
     image_files = os.listdir(query_folder)
-    image_fullpaths = [os.path.join(query_folder,fn) for fn in image_files]
+    image_fullpaths = [os.path.join(query_folder,fn) for fn in image_files]
     sizes = [os.path.getsize(p) for p in image_fullpaths]
     path_to_size = {}
     for i_fp,fp in enumerate(image_fullpaths):
         path_to_size[fp] = sizes[i_fp]
     paths_by_size = [x for _, x in sorted(zip(sizes, image_fullpaths),reverse=True)]
     # Be suspicious of duplicate sizes
     b_duplicate_sizes = [False] * len(paths_by_size)
     for i_path,p in enumerate(paths_by_size):
         if i_path == len(paths_by_size) - 1:
             continue
         if path_to_size[p] == path_to_size[paths_by_size[i_path+1]]:
             b_duplicate_sizes[i_path] = True
     paths_by_size_non_dup = [i for (i, v) in zip(paths_by_size, b_duplicate_sizes) if not v]
     preferred_paths = paths_by_size_non_dup[:max_images_per_query]
     scientific_name_to_preferred_images[s] = preferred_paths
-# ...for each scientific name
+# ...for each scientific name
 #%% Delete unused images
@@ -445,7 +445,7 @@ for s in list(df.scientific_name):
 used_images = []
 for images in scientific_name_to_preferred_images.values():
     used_images.extend(images)
 print('Using a total of {} images'.format(len(used_images)))
 used_images_set = set(used_images)
@@ -461,18 +461,18 @@ print('{} of {} files unused (diff {})'.format(len(unused_images),len(all_images
                                                len(all_images) - len(unused_images)))
 for fn in tqdm(unused_images):
-    os.remove(fn)
+    os.remove(fn)
 #%% Produce HTML preview
 with open(html_output_file, 'w', encoding='utf-8') as f:
     f.write('<html><head></head><body>\n')
     names = scientific_name_to_preferred_images.keys()
     names = sorted(names)
     f.write('<p class="speciesinfo_p" style="font-weight:bold;font-size:130%">'
             'dataset_name: <b><u>category</u></b> mapped to taxonomy_level scientific_name (taxonomic_common_name) (manual_common_name)</p>\n'
             '</p>')
@@ -481,10 +481,10 @@ with open(html_output_file, 'w', encoding='utf-8') as f:
     for i_row, row in tqdm(df.iterrows(), total=len(df)):
         s = row['scientific_name']
         taxonomy_string = row['taxonomy_string']
         if isinstance(taxonomy_string,str):
-            taxonomic_match = eval(taxonomy_string)
+            taxonomic_match = eval(taxonomy_string)
             matched_entity = taxonomic_match[0]
             assert len(matched_entity) == 4
             common_names = matched_entity[3]
@@ -499,7 +499,7 @@ with open(html_output_file, 'w', encoding='utf-8') as f:
         if isinstance(row.scientific_name,str):
             output_string = '{}: <b><u>{}</u></b> mapped to {} {} ({}) ({})</p>\n'.format(
-                row.dataset_name, row.query,
+                row.dataset_name, row.query,
                 row.taxonomy_level, row.scientific_name, common_name_string,
                 row.common_name)
             f.write(output_string)

megadetector/taxonomy_mapping/retrieve_sample_image.py CHANGED Viewed

@@ -17,21 +17,21 @@ import os
 output_folder = os.path.expanduser('~/tmp/image-download-test')
 os.makedirs(output_folder,exist_ok=True)
 method = 'simple_image_download' # 'google_images_download'
 if method == 'simple_image_download':
     from megadetector.taxonomy_mapping import simple_image_download
     google_image_downloader = simple_image_download.Downloader()
     google_image_downloader.directory = output_folder
 elif method == 'google_images_download':
     from google_images_download import google_images_download
 else:
     raise ValueError('Unrecognized method {}'.format(method))
@@ -39,33 +39,33 @@ else:
 def download_images(query,output_directory,limit=100,verbose=False):
-    query = query.replace(' ','+')
+    query = query.replace(' ','+')
     if method == 'simple_image_download':
         google_image_downloader.directory = output_directory
         paths = google_image_downloader.download(query, limit=limit,
           verbose=verbose, cache=False, download_cache=False)
         return paths
     elif method == 'google_images_download':
-        response = google_images_download.googleimagesdownload()
+        response = google_images_download.googleimagesdownload()
         arguments = {'keywords':query,'limit':limit,'print_urls':verbose,
                      'image-directory':output_directory}
         response.download(arguments)
         return None
     else:
         raise ValueError('Unrecognized method {}'.format(method))
 #%% Test driver
 if False:
     #%%
     paths = download_images(query='redunca',output_directory=output_folder,
-                    limit=20,verbose=True)
+                    limit=20,verbose=True)

megadetector/taxonomy_mapping/simple_image_download.py CHANGED Viewed

@@ -49,7 +49,7 @@ def generate_urls(search):
     """
     Generate Google search URLs for all tokens in the list [search]
     """
     return [(BASE_URL+quote(word)+GOOGLE_PICTURE_ID) for word in search]
@@ -60,7 +60,7 @@ def check_webpage(url):
         if 'html' not in str(request.content):
             checked_url = request
     except Exception as err:
-        print(err)
+        print(err)
     return checked_url
@@ -68,7 +68,7 @@ def scan_webpage(webpage, extensions, timer):
     """
     Scan for pictures to download based on keywords
     """
     global SCANNER_COUNTER
     scanner = webpage.find
     found = False
@@ -143,7 +143,7 @@ class Downloader:
         urls_ = generate_urls(search)
         timer = timer if timer else 1000
         # max_progressbar = count * (list(range(limit+1))[-1]+1)
         # bar = progressbar.ProgressBar(maxval=max_progressbar,
         #                               widgets=[progressbar.Bar('=', '[', ']'), ' ', progressbar.Percentage()]).start()
         i = 0
@@ -172,7 +172,7 @@ class Downloader:
             print('==='*15 + ' < ' + 'NO PICTURES FOUND' + ' > ' + '==='*15)
         return cache_out
-    def download(self, keywords=None, limit=1, verbose=False, cache=True, download_cache=False,
+    def download(self, keywords=None, limit=1, verbose=False, cache=True, download_cache=False,
                  timer=None):
         if not download_cache:
             content = self.search_urls(keywords, limit, verbose, cache, timer)
@@ -180,16 +180,16 @@ class Downloader:
             content = self._cached_urls
             if not content:
                 print('Downloader has not URLs saved in Memory yet, run Downloader.search_urls to find pics first')
-        paths = []
+        paths = []
         for name, (path, url) in content.items():
             fullpath = os.path.join(path, name)
             paths.append(fullpath)
             with open(fullpath, 'wb') as file:
                 file.write(url.content)
             if verbose:
-                print(f'File Name={name}, Downloaded from {url.url}')
+                print(f'File Name={name}, Downloaded from {url.url}')
         return paths
     def _create_directories(self, name):
         dir_path = os.path.join(self._directory, name)
         try:

megadetector 5.0.28__py3-none-any.whl → 10.0.0__py3-none-any.whl

Potentially problematic release.

megadetector 5.0.28__py3-none-any.whl → 10.0.0__py3-none-any.whl