megadetector 5.0.6__py3-none-any.whl → 5.0.7__py3-none-any.whl

This diff shows the changes between two publicly released versions of the package, as they appear in their public registry. It is provided for informational purposes only.

Potentially problematic release.
Files changed (62)
  1. api/batch_processing/data_preparation/manage_local_batch.py +278 -197
  2. api/batch_processing/data_preparation/manage_video_batch.py +7 -2
  3. api/batch_processing/postprocessing/add_max_conf.py +1 -0
  4. api/batch_processing/postprocessing/compare_batch_results.py +110 -60
  5. api/batch_processing/postprocessing/load_api_results.py +55 -69
  6. api/batch_processing/postprocessing/md_to_labelme.py +1 -0
  7. api/batch_processing/postprocessing/postprocess_batch_results.py +158 -50
  8. api/batch_processing/postprocessing/render_detection_confusion_matrix.py +625 -0
  9. api/batch_processing/postprocessing/repeat_detection_elimination/find_repeat_detections.py +71 -23
  10. api/batch_processing/postprocessing/repeat_detection_elimination/remove_repeat_detections.py +1 -1
  11. api/batch_processing/postprocessing/repeat_detection_elimination/repeat_detections_core.py +222 -74
  12. api/batch_processing/postprocessing/subset_json_detector_output.py +132 -5
  13. api/batch_processing/postprocessing/top_folders_to_bottom.py +1 -1
  14. classification/prepare_classification_script.py +191 -191
  15. data_management/coco_to_yolo.py +65 -44
  16. data_management/databases/integrity_check_json_db.py +7 -5
  17. data_management/generate_crops_from_cct.py +1 -1
  18. data_management/importers/animl_results_to_md_results.py +2 -2
  19. data_management/importers/noaa_seals_2019.py +1 -1
  20. data_management/importers/zamba_results_to_md_results.py +2 -2
  21. data_management/labelme_to_coco.py +34 -6
  22. data_management/labelme_to_yolo.py +1 -1
  23. data_management/lila/create_lila_blank_set.py +474 -0
  24. data_management/lila/create_lila_test_set.py +2 -1
  25. data_management/lila/create_links_to_md_results_files.py +1 -1
  26. data_management/lila/download_lila_subset.py +46 -21
  27. data_management/lila/generate_lila_per_image_labels.py +23 -14
  28. data_management/lila/get_lila_annotation_counts.py +16 -10
  29. data_management/lila/lila_common.py +14 -11
  30. data_management/lila/test_lila_metadata_urls.py +116 -0
  31. data_management/resize_coco_dataset.py +12 -10
  32. data_management/yolo_output_to_md_output.py +40 -13
  33. data_management/yolo_to_coco.py +34 -21
  34. detection/process_video.py +36 -14
  35. detection/pytorch_detector.py +1 -1
  36. detection/run_detector.py +73 -18
  37. detection/run_detector_batch.py +104 -24
  38. detection/run_inference_with_yolov5_val.py +127 -26
  39. detection/run_tiled_inference.py +153 -43
  40. detection/video_utils.py +3 -1
  41. md_utils/ct_utils.py +79 -3
  42. md_utils/md_tests.py +253 -15
  43. md_utils/path_utils.py +129 -24
  44. md_utils/process_utils.py +26 -7
  45. md_utils/split_locations_into_train_val.py +215 -0
  46. md_utils/string_utils.py +10 -0
  47. md_utils/url_utils.py +0 -2
  48. md_utils/write_html_image_list.py +1 -0
  49. md_visualization/visualization_utils.py +17 -2
  50. md_visualization/visualize_db.py +8 -0
  51. md_visualization/visualize_detector_output.py +185 -104
  52. {megadetector-5.0.6.dist-info → megadetector-5.0.7.dist-info}/METADATA +2 -2
  53. {megadetector-5.0.6.dist-info → megadetector-5.0.7.dist-info}/RECORD +62 -58
  54. {megadetector-5.0.6.dist-info → megadetector-5.0.7.dist-info}/WHEEL +1 -1
  55. taxonomy_mapping/map_lila_taxonomy_to_wi_taxonomy.py +1 -1
  56. taxonomy_mapping/map_new_lila_datasets.py +43 -39
  57. taxonomy_mapping/prepare_lila_taxonomy_release.py +5 -2
  58. taxonomy_mapping/preview_lila_taxonomy.py +27 -27
  59. taxonomy_mapping/species_lookup.py +33 -13
  60. taxonomy_mapping/taxonomy_csv_checker.py +7 -5
  61. {megadetector-5.0.6.dist-info → megadetector-5.0.7.dist-info}/LICENSE +0 -0
  62. {megadetector-5.0.6.dist-info → megadetector-5.0.7.dist-info}/top_level.txt +0 -0
@@ -0,0 +1,474 @@
+ ########
+ #
+ # create_lila_blank_set.py
+ #
+ # Create a folder of blank images sampled from LILA. We'll aim for diversity, so less-common
+ # locations will be oversampled relative to more common locations. We'll also run MegaDetector
+ # to minimize the chance that incorrectly-labeled non-empty images sneak into our blank set.
+ #
+ ########
+
+ #%% Constants and imports
+
+ import os
+ import random
+ import math
+ import json
+ import shutil
+
+ import numpy as np
+ from tqdm import tqdm
+ from multiprocessing.pool import ThreadPool
+ from urllib.parse import urlparse
+ from collections import defaultdict
+
+ from data_management.lila.lila_common import \
+     read_lila_all_images_file, azure_url_to_gcp_http_url
+ from md_utils.url_utils import download_url
+ from md_visualization import visualization_utils as vis_utils
+ from md_utils.path_utils import recursive_file_list
+
+ # We'll write images, metadata downloads, and temporary files here
+ lila_local_base = os.path.expanduser('~/lila')
+
+ metadata_dir = os.path.join(lila_local_base,'metadata')
+ os.makedirs(metadata_dir,exist_ok=True)
+
+ project_base = os.path.join(lila_local_base,'lila_blanks')
+
+ candidate_blanks_base = os.path.join(project_base,'candidate_blanks')
+ os.makedirs(candidate_blanks_base,exist_ok=True)
+
+ confirmed_blanks_base = os.path.join(project_base,'confirmed_blanks')
+ os.makedirs(confirmed_blanks_base,exist_ok=True)
+
+ md_possible_non_blanks_folder = os.path.join(project_base,'candidate_non_blanks')
+ os.makedirs(md_possible_non_blanks_folder,exist_ok=True)
+
+ preferred_image_download_source = 'gcp'
+
+ # Number of concurrent download threads
+ n_download_threads = 20
+
+ n_blanks = 100000
+
+ random.seed(0)
+
+
+ #%% Download and open the giant table of image URLs and labels
+
+ # ~60 seconds to download, unzip, and open
+ df = read_lila_all_images_file(metadata_dir)
+
+
+ #%% Explore blank labels
+
+ # Original labels we're treating as blank:
+ blank_original_labels = (
+     'empty','misfire'
+     )
+
+ # Some notable original labels we're *not* treating as blank:
+ nonblank_original_labels = (
+     'unclassifiable', 'unidentifiable', 'unidentified', 'unknown', 'fire',
+     'foggy lens', 'foggy weather', 'blurred', 'end', 'eye_shine', 'ignore',
+     'lens obscured', 'misdirected', 'other', 'start', 'sun', 'problem',
+     'tilted', 'vegetation obstruction', 'snow on lens', 'malfunction'
+     )
+
+ other_labels_without_common_names = (
+     'car', 'motorcycle', 'vehicle'
+     )
+
+ common_names = sorted(list(df['common_name'].unique()),
+                       key=lambda x:str(x) if isinstance(x,float) else x)
+ original_labels = sorted(list(df['original_label'].unique()),
+                          key=lambda x:str(x) if isinstance(x,float) else x)
+
+ # Blanks are represented as NaN in the "common_name" column (though not all NaN's are blanks)
+ assert '' not in common_names
+ assert all([s not in common_names for s in blank_original_labels])
+ assert all([s not in common_names for s in nonblank_original_labels])
+ assert np.nan in common_names
+
+ # Blanks are represented as "empty" or "misfire" in the "original_label" column
+ assert all([s in original_labels for s in blank_original_labels])
+ assert all([s in original_labels for s in nonblank_original_labels])
+ assert all([s in original_labels for s in other_labels_without_common_names])
+ assert all([s not in original_labels for s in ('','blank','none',np.nan)])
+
+
+ #%% Count empty labels and common names
+
+ common_names_with_empty_original_labels = set()
+ original_labels_with_nan_common_names = set()
+
+ common_name_to_count = defaultdict(int)
+ original_label_to_count = defaultdict(int)
+
+ # This loop takes ~10 mins
+ for i_row,row in tqdm(df.iterrows(),total=len(df)):
+
+     common_name = row['common_name']
+     original_label = row['original_label']
+
+     if isinstance(common_name,float):
+         assert np.isnan(common_name)
+         original_labels_with_nan_common_names.add(original_label)
+
+     common_name = str(common_name)
+
+     assert isinstance(original_label,str)
+     if original_label in blank_original_labels:
+         common_names_with_empty_original_labels.add(common_name)
+     common_name_to_count[common_name] += 1
+     original_label_to_count[original_label] += 1
+
+
+ #%% Look at the most common labels and common names
+
+ from md_utils.ct_utils import sort_dictionary_by_value
+ common_name_to_count = sort_dictionary_by_value(common_name_to_count,reverse=True)
+ original_label_to_count = sort_dictionary_by_value(original_label_to_count,reverse=True)
+
+ k = 10
+
+ print('\nMost frequent common names:\n')
+
+ i_label = 0
+ for i_label,s in enumerate(common_name_to_count):
+     if i_label >= k:
+         break
+     print('{}: {}'.format(s,common_name_to_count[s]))
+
+ print('\nMost frequent original labels:\n')
+
+ i_label = 0
+ for i_label,s in enumerate(original_label_to_count):
+     if i_label >= k:
+         break
+     print('{}: {}'.format(s,original_label_to_count[s]))
+
+
+ #%% Do some consistency checks over the empty labels and stats
+
+ # All images called 'empty' should have NaN as their common name
+ assert (len(common_names_with_empty_original_labels) == 1)
+ assert next(iter(common_names_with_empty_original_labels)) == 'nan'
+
+ # 'empty' should be the most frequent original label overall
+ assert next(iter(original_label_to_count)) == 'empty'
+
+ # NaN should be the most frequent common name overall
+ assert next(iter(common_name_to_count)) == 'nan'
+
+ for s in original_labels_with_nan_common_names:
+     assert \
+         (s in blank_original_labels) or \
+         (s in nonblank_original_labels) or \
+         (s in other_labels_without_common_names)
+
+
+ #%% Map locations to blank images
+
+ location_to_blank_image_urls_cache_file = os.path.join(project_base,
+                                                        'location_to_blank_image_urls.json')
+
+ force_map_locations = False
+
+ # Load from .json if available
+ if (not force_map_locations) and (os.path.isfile(location_to_blank_image_urls_cache_file)):
+
+     with open(location_to_blank_image_urls_cache_file,'r') as f:
+         location_to_blank_image_urls = json.load(f)
+
+ else:
+
+     location_to_blank_image_urls = defaultdict(list)
+
+     # i_row = 0; row = df.iloc[i_row]
+     for i_row,row in tqdm(df.iterrows(),total=len(df)):
+
+         location_id = row['location_id']
+         url = row['url']
+
+         original_label = row['original_label']
+         if original_label in blank_original_labels:
+             assert np.isnan(row['common_name'])
+             location_to_blank_image_urls[location_id].append(url)
+
+     with open(location_to_blank_image_urls_cache_file,'w') as f:
+         json.dump(location_to_blank_image_urls,f,indent=1)
+
+ n_locations_with_blanks = len(location_to_blank_image_urls)
+ print('Found {} locations with blank images'.format(n_locations_with_blanks))
+
+
+ #%% Sample blanks
+
+ random.seed(0)
+
+ # Make a fresh copy of the lists
+ location_to_unsampled_blank_image_urls = {}
+
+ # location = next(iter(location_to_blank_image_urls.keys()))
+ for location in location_to_blank_image_urls:
+     blank_image_urls_this_location = location_to_blank_image_urls[location]
+     unsampled_blank_image_urls_this_location = blank_image_urls_this_location.copy()
+     location_to_unsampled_blank_image_urls[location] = unsampled_blank_image_urls_this_location
+
+ # Put locations in a random order
+ location_ids = list(location_to_unsampled_blank_image_urls.keys())
+ random.shuffle(location_ids)
+
+ blank_urls = []
+ location_to_sampled_blanks = defaultdict(list)
+ fully_sampled_locations = set()
+
+ # Pick from each location until we hit our limit or have no blanks left
+ while(True):
+
+     found_sample = False
+
+     # location = location_ids[0]
+     for location in location_ids:
+
+         unsampled_images_this_location = location_to_unsampled_blank_image_urls[location]
+         if len(unsampled_images_this_location) == 0:
+             fully_sampled_locations.add(location)
+             continue
+
+         url = random.choice(unsampled_images_this_location)
+         blank_urls.append(url)
+         location_to_unsampled_blank_image_urls[location].remove(url)
+         location_to_sampled_blanks[location].append(url)
+         found_sample = True
+
+         if len(blank_urls) == n_blanks:
+             break
+
+     # ...for each location
+
+     if not found_sample:
+         print('Terminating after {} blanks, we ran out before hitting {}'.format(
+             len(blank_urls),n_blanks))
+
+     if len(blank_urls) == n_blanks:
+         break
+
+ # ...while(True)
+
+ assert len(blank_urls) <= n_blanks
+ min_blanks_per_location = math.floor(n_blanks/n_locations_with_blanks)
+ max_blanks_per_location = -1
+ for location in location_to_sampled_blanks:
+     n_blanks_this_location = len(location_to_sampled_blanks[location])
+     if n_blanks_this_location >= max_blanks_per_location:
+         max_blanks_per_location = n_blanks_this_location
+     assert (location in fully_sampled_locations) or \
+         n_blanks_this_location >= min_blanks_per_location
+
+ print('Choose {} blanks from {} locations'.format(n_blanks,len(location_ids)))
+ print('Fully sampled {} locations'.format(len(fully_sampled_locations)))
+ print('Max samples per location: {}'.format(max_blanks_per_location))
+
+
+ #%% Download those image files (prep)
+
+ container_to_url_base = {
+     'lilablobssc.blob.core.windows.net':'/',
+     'storage.googleapis.com':'/public-datasets-lila/'
+ }
+
+ def download_relative_filename(url, output_base, verbose=False, url_base=None, overwrite=False):
+     """
+     Download a URL to output_base, preserving relative path
+     """
+
+     result = {'status':'unknown','url':url,'destination_filename':None}
+
+     if url_base is None:
+         assert url.startswith('https://')
+         container = url.split('/')[2]
+         assert container in container_to_url_base
+         url_base = container_to_url_base[container]
+
+     assert url_base.startswith('/') and url_base.endswith('/')
+
+     p = urlparse(url)
+     relative_filename = str(p.path)
+     # remove the leading '/'
+     assert relative_filename.startswith(url_base)
+     relative_filename = relative_filename.replace(url_base,'',1)
+
+     destination_filename = os.path.join(output_base,relative_filename)
+     result['destination_filename'] = destination_filename
+
+     if ((os.path.isfile(destination_filename)) and (not overwrite)):
+         result['status'] = 'skipped'
+         return result
+     try:
+         download_url(url, destination_filename, verbose=verbose)
+     except Exception as e:
+         print('Warning: error downloading URL {}: {}'.format(
+             url,str(e)))
+         result['status'] = 'error: {}'.format(str(e))
+         return result
+
+     result['status'] = 'success'
+     return result
+
+ # Convert Azure URLs to GCP URLs if necessary
+ if preferred_image_download_source != 'azure':
+     assert preferred_image_download_source == 'gcp'
+     blank_urls = [azure_url_to_gcp_http_url(url) for url in blank_urls]
+
+
+ #%% Download those image files (execution)
+
+ print('Downloading {} images on {} workers'.format(len(blank_urls),n_download_threads))
+
+ if n_download_threads <= 1:
+
+     results = []
+
+     # url = all_urls[0]
+     for url in tqdm(blank_urls):
+         results.append(download_relative_filename(url,candidate_blanks_base,url_base=None))
+
+ else:
+
+     pool = ThreadPool(n_download_threads)
+     results = list(tqdm(pool.imap(lambda s: download_relative_filename(
+         s,candidate_blanks_base,url_base=None),
+         blank_urls), total=len(blank_urls)))
+
+     # pool.terminate()
+
+
+ #%% Review results
+
+ error_urls = []
+ for r in results:
+     if r['status'] != 'success':
+         error_urls.append(r['url'])
+
+ print('Errors on {} of {} downloads'.format(len(error_urls),len(results)))
+
+
+ #%% Run MegaDetector on the folder
+
+ md_results_file = os.path.join(project_base,'lila_blanks_md_results.json')
+
+ cmd = 'python run_detector_batch.py MDV5A "{}" "{}"'.format(
+     candidate_blanks_base,md_results_file)
+ cmd += ' --recursive --output_relative_filenames'
+
+ import clipboard; clipboard.copy(cmd); print(cmd)
+
+
+ #%% Review MD results that suggests images are non-empty
+
+ assert os.path.isfile(md_results_file)
+
+ category_name_to_threshold = {'animal':0.25,'person':0.25,'vehicle':0.25}
+ min_threshold = min(category_name_to_threshold.values())
+ with open(md_results_file,'r') as f:
+     md_results = json.load(f)
+
+ images_to_review_to_detections = {}
+
+ category_id_to_threshold = {}
+ for category_id in md_results['detection_categories']:
+     category_name = md_results['detection_categories'][category_id]
+     category_id_to_threshold[category_id] = category_name_to_threshold[category_name]
+
+ # im = md_results['images'][0]
+ for im in md_results['images']:
+
+     if 'detections' not in im:
+         continue
+
+     found_object = False
+     for det in im['detections']:
+         threshold = category_id_to_threshold[det['category']]
+         if det['conf'] >= threshold:
+             found_object = True
+             break
+     if found_object:
+         images_to_review_to_detections[im['file']] = im['detections']
+
+ print('Flagging {} of {} images for review'.format(len(images_to_review_to_detections),len(md_results['images'])))
+
+ output_file_to_source_file = {}
+
+ # i_fn = 0; source_file_relative = images_to_review[i_fn]
+ for i_fn,source_file_relative in tqdm(enumerate(images_to_review_to_detections),
+                                       total=len(images_to_review_to_detections)):
+
+     source_file_abs = os.path.join(candidate_blanks_base,source_file_relative)
+     assert os.path.isfile(source_file_abs)
+     ext = os.path.splitext(source_file_abs)[1]
+     target_file_relative = str(i_fn).zfill(8) + ext
+     target_file_abs = os.path.join(md_possible_non_blanks_folder,target_file_relative)
+     output_file_to_source_file[target_file_relative] = source_file_relative
+     # shutil.copyfile(source_file_abs,target_file_abs)
+     vis_utils.draw_bounding_boxes_on_file(input_file=source_file_abs,
+                                           output_file=target_file_abs,
+                                           detections=images_to_review_to_detections[source_file_relative],
+                                           confidence_threshold=min_threshold,
+                                           target_size=(1280,-1))
+
+ with open(os.path.join(project_base,'output_file_to_source_file.json'),'w') as f:
+     json.dump(output_file_to_source_file,f,indent=1)
+
+
+ #%% Manual review
+
+ # Delete images that are *not* empty
+
+
+ #%% Figure out which images are still there; these are the actually-blank ones
+
+ remaining_images = set(os.listdir(md_possible_non_blanks_folder))
+ print('Kept {} of {} candidate blank images'.format(len(remaining_images),
+                                                     len(images_to_review_to_detections)))
+
+ removed_blank_images_relative = []
+
+ # output_file = next(iter(output_file_to_source_file.keys()))
+ for output_file in tqdm(output_file_to_source_file.keys()):
+     if output_file not in remaining_images:
+         source_file_relative = output_file_to_source_file[output_file]
+         removed_blank_images_relative.append(source_file_relative)
+
+ assert len(removed_blank_images_relative) + len(remaining_images) == len(output_file_to_source_file)
+
+
+ #%% Copy all the confirmed blanks to the confirmed folder
+
+ all_candidate_blanks = recursive_file_list(candidate_blanks_base,return_relative_paths=True)
+ print('Found {} candidate blanks'.format(len(all_candidate_blanks)))
+
+ for source_fn_relative in tqdm(all_candidate_blanks):
+     source_fn_abs = os.path.join(candidate_blanks_base,source_fn_relative)
+     assert os.path.isfile(source_fn_abs)
+     target_fn_abs = os.path.join(confirmed_blanks_base,source_fn_relative)
+     os.makedirs(os.path.dirname(target_fn_abs),exist_ok=True)
+     shutil.copyfile(source_fn_abs,target_fn_abs)
+
+
+ #%% Record location information for each file
+
+ fn_relative_to_location = {}
+ for location in location_to_blank_image_urls:
+     urls_this_location = location_to_blank_image_urls[location]
+     for url in urls_this_location:
+         fn_relative = url.split('//')[1]
+         fn_relative_to_location[fn_relative] = location
+
+ all_confirmed_blanks = recursive_file_list(confirmed_blanks_base,return_relative_paths=True)
+ print('Found {} confirmed blanks'.format(len(all_confirmed_blanks)))
+
+ for fn_relative in all_confirmed_blanks:
+     assert fn_relative in fn_relative_to_location
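
As an aside (not part of the diff): the new create_lila_blank_set.py balances its sample across locations by visiting locations round-robin in a random order, so rarely-photographed locations are oversampled relative to their share of the data. Below is a minimal, self-contained sketch of that strategy; the names (sample_blanks_evenly, location_to_urls) are illustrative and do not appear in the package.

# Illustrative sketch of location-balanced sampling (names are hypothetical)
import random
from collections import defaultdict

def sample_blanks_evenly(location_to_urls, n_samples, seed=0):
    """Draw up to n_samples URLs, cycling through locations in random order."""
    rng = random.Random(seed)
    unsampled = {loc: list(urls) for loc, urls in location_to_urls.items()}
    location_ids = list(unsampled.keys())
    rng.shuffle(location_ids)
    per_location = defaultdict(list)
    selected = []
    while len(selected) < n_samples:
        found_sample = False
        # One pass over all locations, taking at most one image from each
        for loc in location_ids:
            if len(selected) >= n_samples:
                break
            if not unsampled[loc]:
                continue
            url = rng.choice(unsampled[loc])
            unsampled[loc].remove(url)
            per_location[loc].append(url)
            selected.append(url)
            found_sample = True
        if not found_sample:
            # Every location is exhausted; stop short of n_samples
            break
    return selected, per_location

# Example: locations of very different sizes end up with comparable counts
locations = {'A': ['a%d' % i for i in range(1000)],
             'B': ['b%d' % i for i in range(10)],
             'C': ['c%d' % i for i in range(3)]}
urls, per_location = sample_blanks_evenly(locations, 20)
print({loc: len(v) for loc, v in per_location.items()})  # roughly {'A': 9, 'B': 8, 'C': 3}
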
@@ -124,6 +124,8 @@ for ds_name in metadata_table.keys():

  #%% Download those image files

+ # TODO: trivially parallelizable
+ #
  # ds_name = (list(metadata_table.keys()))[0]
  for ds_name in metadata_table.keys():

@@ -147,4 +149,3 @@ for ds_name in metadata_table.keys():
      # ...for each url

  # ...for each dataset
-
@@ -57,7 +57,7 @@ for i_row,row in df.iterrows():
          df.loc[i_row,'mdv5a_results_raw'] = md_base_url + mdv5a_files[0]
          df.loc[i_row,'mdv5b_results_raw'] = md_base_url + mdv5b_files[0]
      else:
-         # Exclude single-season files for snpashot-serengeti
+         # Exclude single-season files for snapshot-serengeti
          if dataset_shortname == 'snapshot-serengeti':
              matching_files = [fn for fn in matching_files if '_S' not in fn]
          assert len(matching_files) == 2
@@ -24,11 +24,11 @@ from urllib.parse import urlparse
  from collections import defaultdict

  from data_management.lila.lila_common import \
-     read_lila_all_images_file, read_lila_metadata, is_empty, azure_url_to_gcp_http_url
+     read_lila_all_images_file, is_empty, azure_url_to_gcp_http_url
  from md_utils.url_utils import download_url

  # If any of these strings appear in the common name of a species, we'll download that image
- species_of_interest = ['grey fox','red fox','leopard cat']
+ species_of_interest = ['grey fox','red fox','leopard cat','kiwi']

  # We'll write images, metadata downloads, and temporary files here
  lila_local_base = os.path.expanduser('~/lila')
@@ -40,30 +40,28 @@ output_dir = os.path.join(lila_local_base,'lila_downloads_by_dataset')
  os.makedirs(output_dir,exist_ok=True)

  # Number of concurrent download threads
- n_download_threads = 50
+ n_download_threads = 20

  max_images_per_dataset = 10 # None

  # This impacts the data download, but not the metadata download
+ #
+ # "Azure" really means "Azure if available"; recent datasets are only available
+ # on GCP.
  image_download_source = 'azure' # 'azure' or 'gcp'

  random.seed(0)


- #%% Download and open the giant table of image metadata
+ #%% Download and open the giant table of image URLs and labels

- # Opening this huge .csv file make take ~30 seconds
+ # ~60 seconds to download, unzip, and open
  df = read_lila_all_images_file(metadata_dir)


- #%% Download and parse the metadata file
-
- metadata_table = read_lila_metadata(metadata_dir)
-
-
  #%% Find all the images we want to download

- # Searching over the giant table can take a couple of minutes
+ # ~2 minutes

  ds_name_to_urls = defaultdict(list)

@@ -106,13 +104,24 @@ else:

  #%% Download those image files

- def download_relative_filename(url, output_base, verbose=False, url_base=None):
+ container_to_url_base = {
+     'lilablobssc.blob.core.windows.net':'/',
+     'storage.googleapis.com':'/public-datasets-lila/'
+ }
+
+ def download_relative_filename(url, output_base, verbose=False, url_base=None, overwrite=False):
      """
      Download a URL to output_base, preserving relative path
      """

+     result = {'status':'unknown','url':url,'destination_filename':None}
+
      if url_base is None:
-         url_base = '/'
+         assert url.startswith('https://')
+         container = url.split('/')[2]
+         assert container in container_to_url_base
+         url_base = container_to_url_base[container]
+
      assert url_base.startswith('/') and url_base.endswith('/')

      p = urlparse(url)
@@ -122,29 +131,45 @@ def download_relative_filename(url, output_base, verbose=False, url_base=None):
      relative_filename = relative_filename.replace(url_base,'',1)

      destination_filename = os.path.join(output_base,relative_filename)
-     download_url(url, destination_filename, verbose=verbose)
+     result['destination_filename'] = destination_filename
+
+     if ((os.path.isfile(destination_filename)) and (not overwrite)):
+         result['status'] = 'skipped'
+         return result
+     try:
+         download_url(url, destination_filename, verbose=verbose)
+     except Exception as e:
+         print('Warning: error downloading URL {}: {}'.format(
+             url,str(e)))
+         result['status'] = 'error: {}'.format(str(e))
+         return result

+     result['status'] = 'success'
+     return result
+
+
+ # ds_name_to_urls maps dataset names to lists of URLs; flatten to a single list of URLs
  all_urls = list(ds_name_to_urls.values())
  all_urls = [item for sublist in all_urls for item in sublist]

- url_base = '/'
-
  # Convert Azure URLs to GCP URLs if necessary
  if image_download_source != 'azure':
      assert image_download_source == 'gcp'
-     url_base = '/public-datasets-lila/'
      all_urls = [azure_url_to_gcp_http_url(url) for url in all_urls]

- print('Downloading {} images with Python requests'.format(len(all_urls)))
+ print('Downloading {} images on {} workers'.format(len(all_urls),n_download_threads))

  if n_download_threads <= 1:

+     results = []
+
      # url = all_urls[0]
      for url in tqdm(all_urls):
-         download_relative_filename(url,output_dir,verbose=True,url_base=url_base)
+         results.append(download_relative_filename(url,output_dir,url_base=None))

  else:

      pool = ThreadPool(n_download_threads)
-     tqdm(pool.imap(lambda s: download_relative_filename(s,output_dir,verbose=False,url_base=url_base),
-          all_urls), total=len(all_urls))
+     results = list(tqdm(pool.imap(lambda s: download_relative_filename(
+         s,output_dir,url_base=None),
+         all_urls), total=len(all_urls)))
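
As a closing aside (not part of the diff): these changes give download_lila_subset.py, and the new create_lila_blank_set.py, the same download pattern: each worker returns a small status dict, files that already exist are skipped, errors are caught rather than raised, and failures are tallied at the end. Below is a minimal standalone sketch of that pattern; the helper names (download_one, download_all) are illustrative, and plain urllib stands in for md_utils.url_utils.download_url.

# Illustrative sketch of the error-tolerant, skip-existing, threaded download pattern
import os
import urllib.request
from multiprocessing.pool import ThreadPool
from urllib.parse import urlparse
from tqdm import tqdm

def download_one(url, output_base, overwrite=False):
    """Download url under output_base, preserving its relative path; never raises."""
    result = {'status': 'unknown', 'url': url, 'destination_filename': None}
    relative_filename = urlparse(url).path.lstrip('/')
    destination_filename = os.path.join(output_base, relative_filename)
    result['destination_filename'] = destination_filename
    if os.path.isfile(destination_filename) and not overwrite:
        result['status'] = 'skipped'
        return result
    try:
        os.makedirs(os.path.dirname(destination_filename), exist_ok=True)
        urllib.request.urlretrieve(url, destination_filename)
        result['status'] = 'success'
    except Exception as e:
        result['status'] = 'error: {}'.format(e)
    return result

def download_all(urls, output_base, n_workers=20):
    """Run download_one over every URL, serially or on a thread pool."""
    if n_workers <= 1:
        results = [download_one(u, output_base) for u in tqdm(urls)]
    else:
        pool = ThreadPool(n_workers)
        results = list(tqdm(pool.imap(lambda u: download_one(u, output_base), urls),
                            total=len(urls)))
    errors = [r for r in results if r['status'].startswith('error')]
    print('Errors on {} of {} downloads'.format(len(errors), len(results)))
    return results
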