PyPI - megadetector - Versions diffs - 5.0.9__py3-none-any.whl → 5.0.11__py3-none-any.whl - Mend

megadetector 5.0.9__py3-none-any.whl → 5.0.11__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of megadetector might be problematic. Click here for more details.

Files changed (226) hide show

{megadetector-5.0.9.dist-info → megadetector-5.0.11.dist-info}/LICENSE +0 -0
{megadetector-5.0.9.dist-info → megadetector-5.0.11.dist-info}/METADATA +12 -11
megadetector-5.0.11.dist-info/RECORD +5 -0
megadetector-5.0.11.dist-info/top_level.txt +1 -0
api/__init__.py +0 -0
api/batch_processing/__init__.py +0 -0
api/batch_processing/api_core/__init__.py +0 -0
api/batch_processing/api_core/batch_service/__init__.py +0 -0
api/batch_processing/api_core/batch_service/score.py +0 -439
api/batch_processing/api_core/server.py +0 -294
api/batch_processing/api_core/server_api_config.py +0 -98
api/batch_processing/api_core/server_app_config.py +0 -55
api/batch_processing/api_core/server_batch_job_manager.py +0 -220
api/batch_processing/api_core/server_job_status_table.py +0 -152
api/batch_processing/api_core/server_orchestration.py +0 -360
api/batch_processing/api_core/server_utils.py +0 -92
api/batch_processing/api_core_support/__init__.py +0 -0
api/batch_processing/api_core_support/aggregate_results_manually.py +0 -46
api/batch_processing/api_support/__init__.py +0 -0
api/batch_processing/api_support/summarize_daily_activity.py +0 -152
api/batch_processing/data_preparation/__init__.py +0 -0
api/batch_processing/data_preparation/manage_local_batch.py +0 -2391
api/batch_processing/data_preparation/manage_video_batch.py +0 -327
api/batch_processing/integration/digiKam/setup.py +0 -6
api/batch_processing/integration/digiKam/xmp_integration.py +0 -465
api/batch_processing/integration/eMammal/test_scripts/config_template.py +0 -5
api/batch_processing/integration/eMammal/test_scripts/push_annotations_to_emammal.py +0 -126
api/batch_processing/integration/eMammal/test_scripts/select_images_for_testing.py +0 -55
api/batch_processing/postprocessing/__init__.py +0 -0
api/batch_processing/postprocessing/add_max_conf.py +0 -64
api/batch_processing/postprocessing/categorize_detections_by_size.py +0 -163
api/batch_processing/postprocessing/combine_api_outputs.py +0 -249
api/batch_processing/postprocessing/compare_batch_results.py +0 -958
api/batch_processing/postprocessing/convert_output_format.py +0 -397
api/batch_processing/postprocessing/load_api_results.py +0 -195
api/batch_processing/postprocessing/md_to_coco.py +0 -310
api/batch_processing/postprocessing/md_to_labelme.py +0 -330
api/batch_processing/postprocessing/merge_detections.py +0 -401
api/batch_processing/postprocessing/postprocess_batch_results.py +0 -1904
api/batch_processing/postprocessing/remap_detection_categories.py +0 -170
api/batch_processing/postprocessing/render_detection_confusion_matrix.py +0 -661
api/batch_processing/postprocessing/repeat_detection_elimination/find_repeat_detections.py +0 -211
api/batch_processing/postprocessing/repeat_detection_elimination/remove_repeat_detections.py +0 -82
api/batch_processing/postprocessing/repeat_detection_elimination/repeat_detections_core.py +0 -1631
api/batch_processing/postprocessing/separate_detections_into_folders.py +0 -731
api/batch_processing/postprocessing/subset_json_detector_output.py +0 -696
api/batch_processing/postprocessing/top_folders_to_bottom.py +0 -223
api/synchronous/__init__.py +0 -0
api/synchronous/api_core/animal_detection_api/__init__.py +0 -0
api/synchronous/api_core/animal_detection_api/api_backend.py +0 -152
api/synchronous/api_core/animal_detection_api/api_frontend.py +0 -266
api/synchronous/api_core/animal_detection_api/config.py +0 -35
api/synchronous/api_core/animal_detection_api/data_management/annotations/annotation_constants.py +0 -47
api/synchronous/api_core/animal_detection_api/detection/detector_training/copy_checkpoints.py +0 -43
api/synchronous/api_core/animal_detection_api/detection/detector_training/model_main_tf2.py +0 -114
api/synchronous/api_core/animal_detection_api/detection/process_video.py +0 -543
api/synchronous/api_core/animal_detection_api/detection/pytorch_detector.py +0 -304
api/synchronous/api_core/animal_detection_api/detection/run_detector.py +0 -627
api/synchronous/api_core/animal_detection_api/detection/run_detector_batch.py +0 -1029
api/synchronous/api_core/animal_detection_api/detection/run_inference_with_yolov5_val.py +0 -581
api/synchronous/api_core/animal_detection_api/detection/run_tiled_inference.py +0 -754
api/synchronous/api_core/animal_detection_api/detection/tf_detector.py +0 -165
api/synchronous/api_core/animal_detection_api/detection/video_utils.py +0 -495
api/synchronous/api_core/animal_detection_api/md_utils/azure_utils.py +0 -174
api/synchronous/api_core/animal_detection_api/md_utils/ct_utils.py +0 -262
api/synchronous/api_core/animal_detection_api/md_utils/directory_listing.py +0 -251
api/synchronous/api_core/animal_detection_api/md_utils/matlab_porting_tools.py +0 -97
api/synchronous/api_core/animal_detection_api/md_utils/path_utils.py +0 -416
api/synchronous/api_core/animal_detection_api/md_utils/process_utils.py +0 -110
api/synchronous/api_core/animal_detection_api/md_utils/sas_blob_utils.py +0 -509
api/synchronous/api_core/animal_detection_api/md_utils/string_utils.py +0 -59
api/synchronous/api_core/animal_detection_api/md_utils/url_utils.py +0 -144
api/synchronous/api_core/animal_detection_api/md_utils/write_html_image_list.py +0 -226
api/synchronous/api_core/animal_detection_api/md_visualization/visualization_utils.py +0 -841
api/synchronous/api_core/tests/__init__.py +0 -0
api/synchronous/api_core/tests/load_test.py +0 -110
classification/__init__.py +0 -0
classification/aggregate_classifier_probs.py +0 -108
classification/analyze_failed_images.py +0 -227
classification/cache_batchapi_outputs.py +0 -198
classification/create_classification_dataset.py +0 -627
classification/crop_detections.py +0 -516
classification/csv_to_json.py +0 -226
classification/detect_and_crop.py +0 -855
classification/efficientnet/__init__.py +0 -9
classification/efficientnet/model.py +0 -415
classification/efficientnet/utils.py +0 -610
classification/evaluate_model.py +0 -520
classification/identify_mislabeled_candidates.py +0 -152
classification/json_to_azcopy_list.py +0 -63
classification/json_validator.py +0 -695
classification/map_classification_categories.py +0 -276
classification/merge_classification_detection_output.py +0 -506
classification/prepare_classification_script.py +0 -194
classification/prepare_classification_script_mc.py +0 -228
classification/run_classifier.py +0 -286
classification/save_mislabeled.py +0 -110
classification/train_classifier.py +0 -825
classification/train_classifier_tf.py +0 -724
classification/train_utils.py +0 -322
data_management/__init__.py +0 -0
data_management/annotations/__init__.py +0 -0
data_management/annotations/annotation_constants.py +0 -34
data_management/camtrap_dp_to_coco.py +0 -238
data_management/cct_json_utils.py +0 -395
data_management/cct_to_md.py +0 -176
data_management/cct_to_wi.py +0 -289
data_management/coco_to_labelme.py +0 -272
data_management/coco_to_yolo.py +0 -662
data_management/databases/__init__.py +0 -0
data_management/databases/add_width_and_height_to_db.py +0 -33
data_management/databases/combine_coco_camera_traps_files.py +0 -206
data_management/databases/integrity_check_json_db.py +0 -477
data_management/databases/subset_json_db.py +0 -115
data_management/generate_crops_from_cct.py +0 -149
data_management/get_image_sizes.py +0 -188
data_management/importers/add_nacti_sizes.py +0 -52
data_management/importers/add_timestamps_to_icct.py +0 -79
data_management/importers/animl_results_to_md_results.py +0 -158
data_management/importers/auckland_doc_test_to_json.py +0 -372
data_management/importers/auckland_doc_to_json.py +0 -200
data_management/importers/awc_to_json.py +0 -189
data_management/importers/bellevue_to_json.py +0 -273
data_management/importers/cacophony-thermal-importer.py +0 -796
data_management/importers/carrizo_shrubfree_2018.py +0 -268
data_management/importers/carrizo_trail_cam_2017.py +0 -287
data_management/importers/cct_field_adjustments.py +0 -57
data_management/importers/channel_islands_to_cct.py +0 -913
data_management/importers/eMammal/copy_and_unzip_emammal.py +0 -180
data_management/importers/eMammal/eMammal_helpers.py +0 -249
data_management/importers/eMammal/make_eMammal_json.py +0 -223
data_management/importers/ena24_to_json.py +0 -275
data_management/importers/filenames_to_json.py +0 -385
data_management/importers/helena_to_cct.py +0 -282
data_management/importers/idaho-camera-traps.py +0 -1407
data_management/importers/idfg_iwildcam_lila_prep.py +0 -294
data_management/importers/jb_csv_to_json.py +0 -150
data_management/importers/mcgill_to_json.py +0 -250
data_management/importers/missouri_to_json.py +0 -489
data_management/importers/nacti_fieldname_adjustments.py +0 -79
data_management/importers/noaa_seals_2019.py +0 -181
data_management/importers/pc_to_json.py +0 -365
data_management/importers/plot_wni_giraffes.py +0 -123
data_management/importers/prepare-noaa-fish-data-for-lila.py +0 -359
data_management/importers/prepare_zsl_imerit.py +0 -131
data_management/importers/rspb_to_json.py +0 -356
data_management/importers/save_the_elephants_survey_A.py +0 -320
data_management/importers/save_the_elephants_survey_B.py +0 -332
data_management/importers/snapshot_safari_importer.py +0 -758
data_management/importers/snapshot_safari_importer_reprise.py +0 -665
data_management/importers/snapshot_serengeti_lila.py +0 -1067
data_management/importers/snapshotserengeti/make_full_SS_json.py +0 -150
data_management/importers/snapshotserengeti/make_per_season_SS_json.py +0 -153
data_management/importers/sulross_get_exif.py +0 -65
data_management/importers/timelapse_csv_set_to_json.py +0 -490
data_management/importers/ubc_to_json.py +0 -399
data_management/importers/umn_to_json.py +0 -507
data_management/importers/wellington_to_json.py +0 -263
data_management/importers/wi_to_json.py +0 -441
data_management/importers/zamba_results_to_md_results.py +0 -181
data_management/labelme_to_coco.py +0 -548
data_management/labelme_to_yolo.py +0 -272
data_management/lila/__init__.py +0 -0
data_management/lila/add_locations_to_island_camera_traps.py +0 -97
data_management/lila/add_locations_to_nacti.py +0 -147
data_management/lila/create_lila_blank_set.py +0 -557
data_management/lila/create_lila_test_set.py +0 -151
data_management/lila/create_links_to_md_results_files.py +0 -106
data_management/lila/download_lila_subset.py +0 -177
data_management/lila/generate_lila_per_image_labels.py +0 -515
data_management/lila/get_lila_annotation_counts.py +0 -170
data_management/lila/get_lila_image_counts.py +0 -111
data_management/lila/lila_common.py +0 -300
data_management/lila/test_lila_metadata_urls.py +0 -132
data_management/ocr_tools.py +0 -874
data_management/read_exif.py +0 -681
data_management/remap_coco_categories.py +0 -84
data_management/remove_exif.py +0 -66
data_management/resize_coco_dataset.py +0 -189
data_management/wi_download_csv_to_coco.py +0 -246
data_management/yolo_output_to_md_output.py +0 -441
data_management/yolo_to_coco.py +0 -676
detection/__init__.py +0 -0
detection/detector_training/__init__.py +0 -0
detection/detector_training/model_main_tf2.py +0 -114
detection/process_video.py +0 -703
detection/pytorch_detector.py +0 -337
detection/run_detector.py +0 -779
detection/run_detector_batch.py +0 -1219
detection/run_inference_with_yolov5_val.py +0 -917
detection/run_tiled_inference.py +0 -935
detection/tf_detector.py +0 -188
detection/video_utils.py +0 -606
docs/source/conf.py +0 -43
md_utils/__init__.py +0 -0
md_utils/azure_utils.py +0 -174
md_utils/ct_utils.py +0 -612
md_utils/directory_listing.py +0 -246
md_utils/md_tests.py +0 -968
md_utils/path_utils.py +0 -1044
md_utils/process_utils.py +0 -157
md_utils/sas_blob_utils.py +0 -509
md_utils/split_locations_into_train_val.py +0 -228
md_utils/string_utils.py +0 -92
md_utils/url_utils.py +0 -323
md_utils/write_html_image_list.py +0 -225
md_visualization/__init__.py +0 -0
md_visualization/plot_utils.py +0 -293
md_visualization/render_images_with_thumbnails.py +0 -275
md_visualization/visualization_utils.py +0 -1537
md_visualization/visualize_db.py +0 -551
md_visualization/visualize_detector_output.py +0 -406
megadetector-5.0.9.dist-info/RECORD +0 -224
megadetector-5.0.9.dist-info/top_level.txt +0 -8
taxonomy_mapping/__init__.py +0 -0
taxonomy_mapping/map_lila_taxonomy_to_wi_taxonomy.py +0 -491
taxonomy_mapping/map_new_lila_datasets.py +0 -154
taxonomy_mapping/prepare_lila_taxonomy_release.py +0 -142
taxonomy_mapping/preview_lila_taxonomy.py +0 -591
taxonomy_mapping/retrieve_sample_image.py +0 -71
taxonomy_mapping/simple_image_download.py +0 -218
taxonomy_mapping/species_lookup.py +0 -834
taxonomy_mapping/taxonomy_csv_checker.py +0 -159
taxonomy_mapping/taxonomy_graph.py +0 -346
taxonomy_mapping/validate_lila_category_mappings.py +0 -83
{megadetector-5.0.9.dist-info → megadetector-5.0.11.dist-info}/WHEEL +0 -0

classification/crop_detections.py DELETED Viewed

@@ -1,516 +0,0 @@
-"""
-crop_detections.py
-Given a detections JSON file from MegaDetector, crops the bounding boxes above
-a certain confidence threshold.
-This script takes as input a detections JSON file, usually the output of
-detection/run_tf_detector_batch.py or the output of the Batch API in the
-"Batch processing API output format".
-See https://github.com/agentmorris/MegaDetector/tree/master/api/batch_processing.
-The script can crop images that are either available locally or that need to be
-downloaded from an Azure Blob Storage container.
-We assume that no image contains over 100 bounding boxes, and we always save
-crops as RGB .jpg files for consistency. For each image, each bounding box is
-cropped and saved to a file with a suffix "___cropXX_mdvY.Y.jpg" added to the
-filename as the original image. "XX" ranges from "00" to "99" and "Y.Y"
-indicates the MegaDetector version. Based on the given confidence threshold, we
-may skip saving certain bounding box crops, but we still increment the bounding
-box number for skipped boxes.
-Example cropped image path (with MegaDetector bbox):
-  "path/to/image.jpg___crop00_mdv4.1.jpg"
-By default, the images are cropped exactly per the given bounding box
-coordinates. However, if square crops are desired, pass the --square-crops
-flag. This will always generate a square crop whose size is the larger of the
-bounding box width or height. In the case that the square crop boundaries exceed
-the original image size, the crop is padded with 0s.
-This script outputs a log file to:
-   <output_dir>/crop_detections_log_{timestamp}.json
-...which contains images that failed to download and crop properly.
-"""
-#%% Imports
-from __future__ import annotations
-import argparse
-from collections.abc import Iterable, Mapping, Sequence
-from concurrent import futures
-from datetime import datetime
-import io
-import json
-import os
-from typing import Any, BinaryIO, Optional
-from azure.storage.blob import ContainerClient
-from PIL import Image, ImageOps
-from tqdm import tqdm
-#%% Example usage
-"""
-python crop_detections.py \
-    detections.json \
-    /path/to/crops \
-    --images-dir /path/to/images \
-    --container-url "https://account.blob.core.windows.net/container?sastoken" \
-    --detector-version "4.1" \
-    --threshold 0.8 \
-    --save-full-images --square-crops \
-    --threads 50 \
-    --logdir "."
-"""
-#%% Main function
-def main(detections_json_path: str,
-         cropped_images_dir: str,
-         images_dir: Optional[str],
-         container_url: Optional[str],
-         detector_version: Optional[str],
-         save_full_images: bool,
-         square_crops: bool,
-         check_crops_valid: bool,
-         confidence_threshold: float,
-         threads: int,
-         logdir: str) -> None:
-    """
-    Crops the detections listed in a detections JSON file and writes a log.
-    The JSON file is loaded, the detector version is resolved, each detection's
-    category ID is replaced by its category name, and the remaining images are
-    passed to download_and_crop(). A JSON log is then written to
-    <logdir>/crop_detections_log_{timestamp}.json.
-    Args:
-        detections_json_path: str, path to detections JSON file
-        cropped_images_dir: str, path to local directory where crops are saved
-        images_dir: optional str, path to local directory of full images
-        container_url: optional str, Azure Blob Storage container URL, passed
-            through to download_and_crop()
-        detector_version: optional str, detector version string; if the JSON
-            file records a version the two must match, and if neither source
-            provides one, 'unknown' is used
-        save_full_images: bool, passed through to download_and_crop();
-            requires images_dir, which is created if it does not exist
-        square_crops: bool, passed through to download_and_crop()
-        check_crops_valid: bool, passed through to download_and_crop()
-        confidence_threshold: float in [0, 1], passed through to
-            download_and_crop()
-        threads: int, passed through to download_and_crop()
-        logdir: str, directory for the log file, created if necessary
-    """
-    # validate the arguments before reading anything
-    assert 0 <= confidence_threshold <= 1, \
-            'Invalid confidence threshold {}'.format(confidence_threshold)
-    if save_full_images:
-        assert images_dir is not None, \
-            'save_full_images specified but no images_dir provided'
-        if not os.path.exists(images_dir):
-            os.makedirs(images_dir, exist_ok=True)
-            print(f'Created images_dir at {images_dir}')
-    # read the detector output and index the per-image entries by file name
-    with open(detections_json_path, 'r') as json_file:
-        js = json.load(json_file)
-    detections = {entry['file']: entry for entry in js['images']}
-    category_names = js['detection_categories']
-    # reconcile the caller's detector version with the one stored in the file
-    if 'info' in js and 'detector' in js['info']:
-        version_in_file = js['info']['detector']
-        if detector_version is None:
-            detector_version = version_in_file
-        else:
-            assert version_in_file == detector_version,\
-            '.json file specifies a detector version of {}, but the caller has specified {}'.format(
-            version_in_file, detector_version)
-    if detector_version is None:
-        detector_version = 'unknown'
-    # drop images without detections and translate category IDs to names;
-    # iterate over a snapshot of the keys because entries are deleted in-place
-    images_missing_detections = []
-    for img_path in list(detections):
-        entry = detections[img_path]
-        if entry.get('detections') is None:
-            images_missing_detections.append(img_path)
-            del detections[img_path]
-            continue
-        for det in entry['detections']:
-            category_id = det['category']
-            if category_id in category_names:
-                det['category'] = category_names[category_id]
-            else:
-                print('Warning: ignoring detection with category {} for image {}'.format(
-                    category_id, img_path))
-                # 'unsupported' never equals 'animal', so the crop step skips it
-                det['category'] = 'unsupported'
-    images_failed_dload_crop, download_count, crop_count = download_and_crop(
-        detections=detections,
-        cropped_images_dir=cropped_images_dir,
-        images_dir=images_dir,
-        container_url=container_url,
-        detector_version=detector_version,
-        confidence_threshold=confidence_threshold,
-        save_full_images=save_full_images,
-        square_crops=square_crops,
-        check_crops_valid=check_crops_valid,
-        threads=threads)
-    print(f'{len(images_failed_dload_crop)} images failed to download or crop.')
-    # record which images could not be processed, plus the new-file counts
-    log = {
-        'images_missing_detections': images_missing_detections,
-        'images_failed_download_or_crop': images_failed_dload_crop,
-        'num_new_downloads': download_count,
-        'num_new_crops': crop_count
-    }
-    os.makedirs(logdir, exist_ok=True)
-    date = datetime.now().strftime('%Y%m%d_%H%M%S')  # e.g., '20200722_110816'
-    with open(os.path.join(logdir, f'crop_detections_log_{date}.json'), 'w') as log_file:
-        json.dump(log, log_file, indent=1)
-#%% Support functions
-def download_and_crop(
-        detections: Mapping[str, Mapping[str, Any]],
-        cropped_images_dir: str,
-        images_dir: Optional[str],
-        container_url: Optional[str],
-        detector_version: str,
-        confidence_threshold: float,
-        save_full_images: bool,
-        square_crops: bool,
-        check_crops_valid: bool,
-        threads: int = 1
-        ) -> tuple[list[str], int, int]:
-    """
-    Crops every image in <detections> on a thread pool, one task per image.
-    Saves crops to a file with the same name as the original image with an
-    additional suffix appended, starting with 3 underscores:
-    - if image has ground truth bboxes: "___cropXX.jpg", where "XX" indicates
-        the bounding box index
-    - if image has bboxes from MegaDetector: "___cropXX_<detector_version>.jpg",
-        where <detector_version> is the string passed to this function
-    Args:
-        detections: dict, maps image paths to info dict
-            {
-                "detections": [{
-                    "category": "animal",  # must be name, not "1" or "2"
-                    "conf": 0.926,
-                    "bbox": [0.0, 0.2762, 0.1539, 0.2825],
-                }],
-                "is_ground_truth": True  # whether bboxes are ground truth
-            }
-        cropped_images_dir: str, path to folder where cropped images are saved
-        images_dir: optional str, path to folder where full images are saved
-        container_url: optional str, URL (with SAS token, if necessary) of Azure
-            Blob Storage container to download images from, if images are not
-            all already locally available in <images_dir>
-        detector_version: str, detector version string, e.g., '4.1'
-        confidence_threshold: float, passed through to load_and_crop()
-        save_full_images: bool, whether to save downloaded images to images_dir,
-            images_dir must be given and must exist if save_full_images=True
-        square_crops: bool, whether to crop bounding boxes as squares
-        check_crops_valid: bool, whether to load each crop to ensure the file is
-            valid (i.e., not truncated)
-        threads: int, number of worker threads in the pool
-    Returns:
-        images_failed_download: list of str, images whose task raised an
-            exception (the exception is printed, not re-raised)
-        total_downloads: int, number of images downloaded
-        total_new_crops: int, number of new crops saved to cropped_images_dir
-    """
-    # True for ground truth, False for MegaDetector
-    # always save as .jpg for consistency
-    crop_path_template = {
-        True: os.path.join(cropped_images_dir, '{img_path}___crop{n:>02d}.jpg'),
-        False: os.path.join(
-            cropped_images_dir,
-            '{img_path}___crop{n:>02d}_' + f'{detector_version}.jpg')
-    }
-    images_failed_download = []
-    total_downloads = 0
-    total_new_crops = 0
-    container_client = None
-    if container_url is not None:
-        container_client = ContainerClient.from_container_url(container_url)
-    try:
-        # the executor's context manager shuts the pool down even if submitting
-        # a task raises (e.g. an info dict without a 'detections' key)
-        with futures.ThreadPoolExecutor(max_workers=threads) as pool:
-            future_to_img_path = {}
-            print(f'Getting bbox info for {len(detections)} images...')
-            for img_path in tqdm(sorted(detections.keys())):
-                # the caller is expected to have validated the info dicts
-                info_dict = detections[img_path]
-                bbox_dicts = info_dict['detections']
-                is_ground_truth = info_dict.get('is_ground_truth', False)
-                # get the image, either from disk or from Blob Storage
-                future = pool.submit(
-                    load_and_crop, img_path, images_dir, container_client,
-                    bbox_dicts, confidence_threshold,
-                    crop_path_template[is_ground_truth],
-                    save_full_images, square_crops, check_crops_valid)
-                future_to_img_path[future] = img_path
-            total = len(future_to_img_path)
-            print(f'Reading/downloading {total} images and cropping...')
-            for future in tqdm(futures.as_completed(future_to_img_path), total=total):
-                img_path = future_to_img_path[future]
-                try:
-                    did_download, num_new_crops = future.result()
-                    total_downloads += did_download
-                    total_new_crops += num_new_crops
-                except Exception as e:  # pylint: disable=broad-except
-                    # one bad image must not abort the whole batch
-                    exception_type = type(e).__name__
-                    tqdm.write(f'{img_path} - generated {exception_type}: {e}')
-                    images_failed_download.append(img_path)
-    finally:
-        if container_client is not None:
-            # entering and leaving the client's context manager closes it
-            with container_client:
-                pass
-    print(f'Downloaded {total_downloads} images.')
-    print(f'Made {total_new_crops} new crops.')
-    return images_failed_download, total_downloads, total_new_crops
-def load_local_image(img_path: str |  BinaryIO) -> Optional[Image.Image]:
-    """
-    Opens an image from a path or binary stream and loads its pixel data.
-    Returns the image, or None if PIL raised an OSError while opening or
-    loading it; in that case a message is printed via tqdm.write().
-    """
-    try:
-        with Image.open(img_path) as loaded_img:
-            # read the pixel data before the context manager exits
-            loaded_img.load()
-    except OSError as e:  # PIL.UnidentifiedImageError is a subclass of OSError
-        exception_type = type(e).__name__
-        tqdm.write(f'Unable to load {img_path}. {exception_type}: {e}.')
-        return None
-    return loaded_img
-def load_and_crop(img_path: str,
-                  images_dir: Optional[str],
-                  container_client: Optional[ContainerClient],
-                  bbox_dicts: Iterable[Mapping[str, Any]],
-                  confidence_threshold: float,
-                  crop_path_template: str,
-                  save_full_image: bool,
-                  square_crops: bool,
-                  check_crops_valid: bool) -> tuple[bool, int]:
-    """
-    Given an image and a list of bounding boxes, checks if the crops already
-    exist. If not, loads the image from the local directory or from Azure Blob
-    Storage, then crops it.
-    local image path: <images_dir>/<img_path>
-    Azure storage: <img_path> as the blob name inside the container
-    An image is only downloaded from Azure Blob Storage if it could not be
-    loaded locally and if at least 1 of its crops still needs to be written.
-    Args:
-        img_path: str, image path
-        images_dir: optional str, path to local directory of images, and where
-            full images are saved if save_full_image=True
-        container_client: optional ContainerClient, this function does not
-            use container_client in any context manager
-        bbox_dicts: list of dicts, each dict contains info on a bounding box
-        confidence_threshold: float, bounding boxes with a "conf" below this
-            value are skipped; boxes without a "conf" key are never skipped
-            for confidence
-        crop_path_template: str, contains placeholders {img_path} and {n}
-        save_full_image: bool, whether to save downloaded images to images_dir,
-            images_dir must be given if save_full_image=True
-        square_crops: bool, whether to crop bounding boxes as squares
-        check_crops_valid: bool, whether to load each existing crop to ensure
-            the file is valid (i.e., not truncated)
-    Returns:
-        did_download: bool, whether image was downloaded from Azure Blob Storage
-        num_new_crops: int, number of new crops successfully saved
-    Raises:
-        ValueError: if a download is needed with save_full_image=True but
-            images_dir is None
-        AssertionError: if the image could be neither loaded nor downloaded
-    """
-    did_download = False
-    num_new_crops = 0
-    # crop_path => normalized bbox coordinates [xmin, ymin, width, height]
-    bboxes_tocrop: dict[str, list[float]] = {}
-    for i, bbox_dict in enumerate(bbox_dicts):
-        # only ground-truth bboxes do not have a "confidence" value
-        if 'conf' in bbox_dict and bbox_dict['conf'] < confidence_threshold:
-            continue
-        if bbox_dict['category'] != 'animal':
-            continue
-        # n is the index in the full list, so skipped boxes still use up a number
-        crop_path = crop_path_template.format(img_path=img_path, n=i)
-        if not os.path.exists(crop_path) or (
-                check_crops_valid and load_local_image(crop_path) is None):
-            bboxes_tocrop[crop_path] = bbox_dict['bbox']
-    if not bboxes_tocrop:
-        return did_download, num_new_crops
-    img = None
-    # both names get a value up front so that the failure paths below report a
-    # meaningful error instead of an UnboundLocalError
-    debug_path = img_path
-    full_img_path = None
-    # try loading image from local directory
-    if images_dir is not None:
-        full_img_path = os.path.join(images_dir, img_path)
-        debug_path = full_img_path
-        if os.path.exists(full_img_path):
-            img = load_local_image(full_img_path)
-    # try to download image from Blob Storage
-    if img is None and container_client is not None:
-        if save_full_image and full_img_path is None:
-            raise ValueError(
-                'save_full_image specified but no images_dir provided')
-        debug_path = img_path
-        with io.BytesIO() as stream:
-            container_client.download_blob(img_path).readinto(stream)
-            stream.seek(0)
-            if save_full_image:
-                os.makedirs(os.path.dirname(full_img_path), exist_ok=True)
-                with open(full_img_path, 'wb') as f:
-                    f.write(stream.read())
-                # rewind so the image can be decoded from the same buffer
-                stream.seek(0)
-            img = load_local_image(stream)
-        did_download = True
-    assert img is not None, 'image "{}" failed to load or download properly'.format(
-        debug_path)
-    if img.mode != 'RGB':
-        img = img.convert(mode='RGB')  # always save as RGB for consistency
-    # crop the image
-    for crop_path, bbox in bboxes_tocrop.items():
-        num_new_crops += save_crop(
-            img, bbox_norm=bbox, square_crop=square_crops, save=crop_path)
-    return did_download, num_new_crops
-def save_crop(img: Image.Image, bbox_norm: Sequence[float], square_crop: bool,
-              save: str) -> bool:
-    """
-    Cuts one bounding box out of an image and writes it to disk.
-    Args:
-        img: PIL.Image.Image object, already loaded
-        bbox_norm: list or tuple of float, [xmin, ymin, width, height] all in
-            normalized coordinates
-        square_crop: bool, whether to widen the box to a square whose side is
-            the larger of the box width and height
-        save: str, destination path; parent directories are created as needed
-    Returns: bool, True if a crop was saved, False if the box had zero width
-        or height in pixels and was skipped
-    """
-    img_w, img_h = img.size
-    # convert the normalized box to whole pixels
-    left = int(bbox_norm[0] * img_w)
-    top = int(bbox_norm[1] * img_h)
-    box_w = int(bbox_norm[2] * img_w)
-    box_h = int(bbox_norm[3] * img_h)
-    side = None
-    if square_crop:
-        # grow the shorter dimension around the box, keeping the origin and
-        # the final width/height within the image limits
-        side = max(box_w, box_h)
-        shifted_left = left - int((side - box_w) / 2)
-        shifted_top = top - int((side - box_h) / 2)
-        left = max(0, min(shifted_left, img_w - box_w))
-        top = max(0, min(shifted_top, img_h - box_h))
-        box_w = min(img_w, side)
-        box_h = min(img_h, side)
-    if box_w == 0 or box_h == 0:
-        tqdm.write(f'Skipping size-0 crop (w={box_w}, h={box_h}) at {save}')
-        return False
-    # Image.crop() takes box=[left, upper, right, lower]
-    crop = img.crop(box=[left, top, left + box_w, top + box_h])
-    if square_crop and (box_w != box_h):
-        # the image was smaller than the square, so pad the rest with 0s
-        crop = ImageOps.pad(crop, size=(side, side), color=0)
-    os.makedirs(os.path.dirname(save), exist_ok=True)
-    crop.save(save)
-    return True
-#%% Command-line driver
-def _parse_args() -> argparse.Namespace:
-    """
-    Declares the command-line interface of this script and parses the
-    arguments it was invoked with.
-    Returns: argparse.Namespace holding one attribute per option
-    """
-    cli = argparse.ArgumentParser(
-        description='Crop detections from MegaDetector.',
-        formatter_class=argparse.ArgumentDefaultsHelpFormatter)
-    # required positional arguments
-    cli.add_argument('detections_json', help='path to detections JSON file')
-    cli.add_argument(
-        'cropped_images_dir',
-        help='path to local directory for saving crops of bounding boxes')
-    # where the full images come from
-    cli.add_argument(
-        '-i', '--images-dir',
-        help='path to directory where full images are already available, '
-             'or where images will be written if --save-full-images is set')
-    cli.add_argument(
-        '-c', '--container-url',
-        help='URL (including SAS token, if necessary) of Azure Blob Storage '
-             'container to download images from, if images are not all already '
-             'locally available in <images_dir>')
-    cli.add_argument(
-        '-v', '--detector-version',
-        help='detector version string, e.g., "4.1", used if detector version '
-             'cannot be inferred from detections JSON')
-    # boolean switches, all off unless given
-    switches = (
-        ('--save-full-images',
-         'forces downloading of full images to --images-dir'),
-        ('--square-crops',
-         'crop bounding boxes as squares'),
-        ('--check-crops-valid',
-         'load each crop to ensure file is valid (i.e., not truncated)'),
-    )
-    for switch, description in switches:
-        cli.add_argument(switch, action='store_true', help=description)
-    # tuning and logging options
-    cli.add_argument(
-        '-t', '--threshold', type=float, default=0.0,
-        help='confidence threshold above which to crop bounding boxes')
-    cli.add_argument(
-        '-n', '--threads', type=int, default=1,
-        help='number of threads to use for downloading and cropping images')
-    cli.add_argument(
-        '--logdir', default='.',
-        help='path to directory to save log file')
-    return cli.parse_args()
-if __name__ == '__main__':
-    # script entry point: forward every command-line option to main()
-    cli_args = _parse_args()
-    main(
-        detections_json_path=cli_args.detections_json,
-        cropped_images_dir=cli_args.cropped_images_dir,
-        images_dir=cli_args.images_dir,
-        container_url=cli_args.container_url,
-        detector_version=cli_args.detector_version,
-        save_full_images=cli_args.save_full_images,
-        square_crops=cli_args.square_crops,
-        check_crops_valid=cli_args.check_crops_valid,
-        confidence_threshold=cli_args.threshold,
-        threads=cli_args.threads,
-        logdir=cli_args.logdir)

megadetector 5.0.9__py3-none-any.whl → 5.0.11__py3-none-any.whl

Potentially problematic release.

megadetector 5.0.9__py3-none-any.whl → 5.0.11__py3-none-any.whl