megadetector 5.0.10__py3-none-any.whl → 5.0.11__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of megadetector might be problematic. Click here for more details.
- {megadetector-5.0.10.dist-info → megadetector-5.0.11.dist-info}/LICENSE +0 -0
- {megadetector-5.0.10.dist-info → megadetector-5.0.11.dist-info}/METADATA +12 -11
- megadetector-5.0.11.dist-info/RECORD +5 -0
- megadetector-5.0.11.dist-info/top_level.txt +1 -0
- api/__init__.py +0 -0
- api/batch_processing/__init__.py +0 -0
- api/batch_processing/api_core/__init__.py +0 -0
- api/batch_processing/api_core/batch_service/__init__.py +0 -0
- api/batch_processing/api_core/batch_service/score.py +0 -439
- api/batch_processing/api_core/server.py +0 -294
- api/batch_processing/api_core/server_api_config.py +0 -98
- api/batch_processing/api_core/server_app_config.py +0 -55
- api/batch_processing/api_core/server_batch_job_manager.py +0 -220
- api/batch_processing/api_core/server_job_status_table.py +0 -152
- api/batch_processing/api_core/server_orchestration.py +0 -360
- api/batch_processing/api_core/server_utils.py +0 -92
- api/batch_processing/api_core_support/__init__.py +0 -0
- api/batch_processing/api_core_support/aggregate_results_manually.py +0 -46
- api/batch_processing/api_support/__init__.py +0 -0
- api/batch_processing/api_support/summarize_daily_activity.py +0 -152
- api/batch_processing/data_preparation/__init__.py +0 -0
- api/batch_processing/data_preparation/manage_local_batch.py +0 -2391
- api/batch_processing/data_preparation/manage_video_batch.py +0 -327
- api/batch_processing/integration/digiKam/setup.py +0 -6
- api/batch_processing/integration/digiKam/xmp_integration.py +0 -465
- api/batch_processing/integration/eMammal/test_scripts/config_template.py +0 -5
- api/batch_processing/integration/eMammal/test_scripts/push_annotations_to_emammal.py +0 -126
- api/batch_processing/integration/eMammal/test_scripts/select_images_for_testing.py +0 -55
- api/batch_processing/postprocessing/__init__.py +0 -0
- api/batch_processing/postprocessing/add_max_conf.py +0 -64
- api/batch_processing/postprocessing/categorize_detections_by_size.py +0 -163
- api/batch_processing/postprocessing/combine_api_outputs.py +0 -249
- api/batch_processing/postprocessing/compare_batch_results.py +0 -958
- api/batch_processing/postprocessing/convert_output_format.py +0 -397
- api/batch_processing/postprocessing/load_api_results.py +0 -195
- api/batch_processing/postprocessing/md_to_coco.py +0 -310
- api/batch_processing/postprocessing/md_to_labelme.py +0 -330
- api/batch_processing/postprocessing/merge_detections.py +0 -401
- api/batch_processing/postprocessing/postprocess_batch_results.py +0 -1904
- api/batch_processing/postprocessing/remap_detection_categories.py +0 -170
- api/batch_processing/postprocessing/render_detection_confusion_matrix.py +0 -661
- api/batch_processing/postprocessing/repeat_detection_elimination/find_repeat_detections.py +0 -211
- api/batch_processing/postprocessing/repeat_detection_elimination/remove_repeat_detections.py +0 -82
- api/batch_processing/postprocessing/repeat_detection_elimination/repeat_detections_core.py +0 -1631
- api/batch_processing/postprocessing/separate_detections_into_folders.py +0 -731
- api/batch_processing/postprocessing/subset_json_detector_output.py +0 -696
- api/batch_processing/postprocessing/top_folders_to_bottom.py +0 -223
- api/synchronous/__init__.py +0 -0
- api/synchronous/api_core/animal_detection_api/__init__.py +0 -0
- api/synchronous/api_core/animal_detection_api/api_backend.py +0 -152
- api/synchronous/api_core/animal_detection_api/api_frontend.py +0 -266
- api/synchronous/api_core/animal_detection_api/config.py +0 -35
- api/synchronous/api_core/animal_detection_api/data_management/annotations/annotation_constants.py +0 -47
- api/synchronous/api_core/animal_detection_api/detection/detector_training/copy_checkpoints.py +0 -43
- api/synchronous/api_core/animal_detection_api/detection/detector_training/model_main_tf2.py +0 -114
- api/synchronous/api_core/animal_detection_api/detection/process_video.py +0 -543
- api/synchronous/api_core/animal_detection_api/detection/pytorch_detector.py +0 -304
- api/synchronous/api_core/animal_detection_api/detection/run_detector.py +0 -627
- api/synchronous/api_core/animal_detection_api/detection/run_detector_batch.py +0 -1029
- api/synchronous/api_core/animal_detection_api/detection/run_inference_with_yolov5_val.py +0 -581
- api/synchronous/api_core/animal_detection_api/detection/run_tiled_inference.py +0 -754
- api/synchronous/api_core/animal_detection_api/detection/tf_detector.py +0 -165
- api/synchronous/api_core/animal_detection_api/detection/video_utils.py +0 -495
- api/synchronous/api_core/animal_detection_api/md_utils/azure_utils.py +0 -174
- api/synchronous/api_core/animal_detection_api/md_utils/ct_utils.py +0 -262
- api/synchronous/api_core/animal_detection_api/md_utils/directory_listing.py +0 -251
- api/synchronous/api_core/animal_detection_api/md_utils/matlab_porting_tools.py +0 -97
- api/synchronous/api_core/animal_detection_api/md_utils/path_utils.py +0 -416
- api/synchronous/api_core/animal_detection_api/md_utils/process_utils.py +0 -110
- api/synchronous/api_core/animal_detection_api/md_utils/sas_blob_utils.py +0 -509
- api/synchronous/api_core/animal_detection_api/md_utils/string_utils.py +0 -59
- api/synchronous/api_core/animal_detection_api/md_utils/url_utils.py +0 -144
- api/synchronous/api_core/animal_detection_api/md_utils/write_html_image_list.py +0 -226
- api/synchronous/api_core/animal_detection_api/md_visualization/visualization_utils.py +0 -841
- api/synchronous/api_core/tests/__init__.py +0 -0
- api/synchronous/api_core/tests/load_test.py +0 -110
- classification/__init__.py +0 -0
- classification/aggregate_classifier_probs.py +0 -108
- classification/analyze_failed_images.py +0 -227
- classification/cache_batchapi_outputs.py +0 -198
- classification/create_classification_dataset.py +0 -627
- classification/crop_detections.py +0 -516
- classification/csv_to_json.py +0 -226
- classification/detect_and_crop.py +0 -855
- classification/efficientnet/__init__.py +0 -9
- classification/efficientnet/model.py +0 -415
- classification/efficientnet/utils.py +0 -610
- classification/evaluate_model.py +0 -520
- classification/identify_mislabeled_candidates.py +0 -152
- classification/json_to_azcopy_list.py +0 -63
- classification/json_validator.py +0 -695
- classification/map_classification_categories.py +0 -276
- classification/merge_classification_detection_output.py +0 -506
- classification/prepare_classification_script.py +0 -194
- classification/prepare_classification_script_mc.py +0 -228
- classification/run_classifier.py +0 -286
- classification/save_mislabeled.py +0 -110
- classification/train_classifier.py +0 -825
- classification/train_classifier_tf.py +0 -724
- classification/train_utils.py +0 -322
- data_management/__init__.py +0 -0
- data_management/annotations/__init__.py +0 -0
- data_management/annotations/annotation_constants.py +0 -34
- data_management/camtrap_dp_to_coco.py +0 -238
- data_management/cct_json_utils.py +0 -395
- data_management/cct_to_md.py +0 -176
- data_management/cct_to_wi.py +0 -289
- data_management/coco_to_labelme.py +0 -272
- data_management/coco_to_yolo.py +0 -662
- data_management/databases/__init__.py +0 -0
- data_management/databases/add_width_and_height_to_db.py +0 -33
- data_management/databases/combine_coco_camera_traps_files.py +0 -206
- data_management/databases/integrity_check_json_db.py +0 -477
- data_management/databases/subset_json_db.py +0 -115
- data_management/generate_crops_from_cct.py +0 -149
- data_management/get_image_sizes.py +0 -188
- data_management/importers/add_nacti_sizes.py +0 -52
- data_management/importers/add_timestamps_to_icct.py +0 -79
- data_management/importers/animl_results_to_md_results.py +0 -158
- data_management/importers/auckland_doc_test_to_json.py +0 -372
- data_management/importers/auckland_doc_to_json.py +0 -200
- data_management/importers/awc_to_json.py +0 -189
- data_management/importers/bellevue_to_json.py +0 -273
- data_management/importers/cacophony-thermal-importer.py +0 -796
- data_management/importers/carrizo_shrubfree_2018.py +0 -268
- data_management/importers/carrizo_trail_cam_2017.py +0 -287
- data_management/importers/cct_field_adjustments.py +0 -57
- data_management/importers/channel_islands_to_cct.py +0 -913
- data_management/importers/eMammal/copy_and_unzip_emammal.py +0 -180
- data_management/importers/eMammal/eMammal_helpers.py +0 -249
- data_management/importers/eMammal/make_eMammal_json.py +0 -223
- data_management/importers/ena24_to_json.py +0 -275
- data_management/importers/filenames_to_json.py +0 -385
- data_management/importers/helena_to_cct.py +0 -282
- data_management/importers/idaho-camera-traps.py +0 -1407
- data_management/importers/idfg_iwildcam_lila_prep.py +0 -294
- data_management/importers/jb_csv_to_json.py +0 -150
- data_management/importers/mcgill_to_json.py +0 -250
- data_management/importers/missouri_to_json.py +0 -489
- data_management/importers/nacti_fieldname_adjustments.py +0 -79
- data_management/importers/noaa_seals_2019.py +0 -181
- data_management/importers/pc_to_json.py +0 -365
- data_management/importers/plot_wni_giraffes.py +0 -123
- data_management/importers/prepare-noaa-fish-data-for-lila.py +0 -359
- data_management/importers/prepare_zsl_imerit.py +0 -131
- data_management/importers/rspb_to_json.py +0 -356
- data_management/importers/save_the_elephants_survey_A.py +0 -320
- data_management/importers/save_the_elephants_survey_B.py +0 -332
- data_management/importers/snapshot_safari_importer.py +0 -758
- data_management/importers/snapshot_safari_importer_reprise.py +0 -665
- data_management/importers/snapshot_serengeti_lila.py +0 -1067
- data_management/importers/snapshotserengeti/make_full_SS_json.py +0 -150
- data_management/importers/snapshotserengeti/make_per_season_SS_json.py +0 -153
- data_management/importers/sulross_get_exif.py +0 -65
- data_management/importers/timelapse_csv_set_to_json.py +0 -490
- data_management/importers/ubc_to_json.py +0 -399
- data_management/importers/umn_to_json.py +0 -507
- data_management/importers/wellington_to_json.py +0 -263
- data_management/importers/wi_to_json.py +0 -441
- data_management/importers/zamba_results_to_md_results.py +0 -181
- data_management/labelme_to_coco.py +0 -548
- data_management/labelme_to_yolo.py +0 -272
- data_management/lila/__init__.py +0 -0
- data_management/lila/add_locations_to_island_camera_traps.py +0 -97
- data_management/lila/add_locations_to_nacti.py +0 -147
- data_management/lila/create_lila_blank_set.py +0 -557
- data_management/lila/create_lila_test_set.py +0 -151
- data_management/lila/create_links_to_md_results_files.py +0 -106
- data_management/lila/download_lila_subset.py +0 -177
- data_management/lila/generate_lila_per_image_labels.py +0 -515
- data_management/lila/get_lila_annotation_counts.py +0 -170
- data_management/lila/get_lila_image_counts.py +0 -111
- data_management/lila/lila_common.py +0 -300
- data_management/lila/test_lila_metadata_urls.py +0 -132
- data_management/ocr_tools.py +0 -874
- data_management/read_exif.py +0 -681
- data_management/remap_coco_categories.py +0 -84
- data_management/remove_exif.py +0 -66
- data_management/resize_coco_dataset.py +0 -189
- data_management/wi_download_csv_to_coco.py +0 -246
- data_management/yolo_output_to_md_output.py +0 -441
- data_management/yolo_to_coco.py +0 -676
- detection/__init__.py +0 -0
- detection/detector_training/__init__.py +0 -0
- detection/detector_training/model_main_tf2.py +0 -114
- detection/process_video.py +0 -703
- detection/pytorch_detector.py +0 -337
- detection/run_detector.py +0 -779
- detection/run_detector_batch.py +0 -1219
- detection/run_inference_with_yolov5_val.py +0 -917
- detection/run_tiled_inference.py +0 -935
- detection/tf_detector.py +0 -188
- detection/video_utils.py +0 -606
- docs/source/conf.py +0 -43
- md_utils/__init__.py +0 -0
- md_utils/azure_utils.py +0 -174
- md_utils/ct_utils.py +0 -612
- md_utils/directory_listing.py +0 -246
- md_utils/md_tests.py +0 -968
- md_utils/path_utils.py +0 -1044
- md_utils/process_utils.py +0 -157
- md_utils/sas_blob_utils.py +0 -509
- md_utils/split_locations_into_train_val.py +0 -228
- md_utils/string_utils.py +0 -92
- md_utils/url_utils.py +0 -323
- md_utils/write_html_image_list.py +0 -225
- md_visualization/__init__.py +0 -0
- md_visualization/plot_utils.py +0 -293
- md_visualization/render_images_with_thumbnails.py +0 -275
- md_visualization/visualization_utils.py +0 -1537
- md_visualization/visualize_db.py +0 -551
- md_visualization/visualize_detector_output.py +0 -406
- megadetector-5.0.10.dist-info/RECORD +0 -224
- megadetector-5.0.10.dist-info/top_level.txt +0 -8
- taxonomy_mapping/__init__.py +0 -0
- taxonomy_mapping/map_lila_taxonomy_to_wi_taxonomy.py +0 -491
- taxonomy_mapping/map_new_lila_datasets.py +0 -154
- taxonomy_mapping/prepare_lila_taxonomy_release.py +0 -142
- taxonomy_mapping/preview_lila_taxonomy.py +0 -591
- taxonomy_mapping/retrieve_sample_image.py +0 -71
- taxonomy_mapping/simple_image_download.py +0 -218
- taxonomy_mapping/species_lookup.py +0 -834
- taxonomy_mapping/taxonomy_csv_checker.py +0 -159
- taxonomy_mapping/taxonomy_graph.py +0 -346
- taxonomy_mapping/validate_lila_category_mappings.py +0 -83
- {megadetector-5.0.10.dist-info → megadetector-5.0.11.dist-info}/WHEEL +0 -0
data_management/read_exif.py
DELETED
|
@@ -1,681 +0,0 @@
|
|
|
1
|
-
"""
|
|
2
|
-
|
|
3
|
-
read_exif.py
|
|
4
|
-
|
|
5
|
-
Given a folder of images, reads relevant metadata (EXIF/IPTC/XMP) fields from all images,
|
|
6
|
-
and writes them to a .json or .csv file.
|
|
7
|
-
|
|
8
|
-
This module can use either PIL (which can only reliably read EXIF data) or exiftool (which
|
|
9
|
-
can read everything). The latter approach expects that exiftool is available on the system
|
|
10
|
-
path. No attempt is made to be consistent in format across the two approaches.
|
|
11
|
-
|
|
12
|
-
"""
|
|
13
|
-
|
|
14
|
-
#%% Imports and constants
|
|
15
|
-
|
|
16
|
-
import os
|
|
17
|
-
import subprocess
|
|
18
|
-
import json
|
|
19
|
-
from datetime import datetime
|
|
20
|
-
|
|
21
|
-
from multiprocessing.pool import ThreadPool as ThreadPool
|
|
22
|
-
from multiprocessing.pool import Pool as Pool
|
|
23
|
-
|
|
24
|
-
from tqdm import tqdm
|
|
25
|
-
from PIL import Image, ExifTags
|
|
26
|
-
|
|
27
|
-
from md_utils.path_utils import find_images, is_executable
|
|
28
|
-
from md_utils.ct_utils import args_to_object
|
|
29
|
-
|
|
30
|
-
debug_max_images = None
|
|
31
|
-
|
|
32
|
-
|
|
33
|
-
#%% Options
|
|
34
|
-
|
|
35
|
-
class ReadExifOptions:
    """
    Parameters controlling metadata extraction.
    """

    #: Print extra debug information to the console
    verbose = False

    #: When True, if an output file was requested from read_exif_from_folder
    #: and serialization fails, return the results rather than raising.
    allow_write_error = False

    #: Worker count for parallel extraction; values <= 1 run serially
    n_workers = 1

    #: Parallelize with threads (True) or processes (False).
    #:
    #: Ignored when n_workers is <= 1.
    use_threads = True

    #: ExifTool groups whose tags we skip: "File" and "ExifTool" carry
    #: file-level information (e.g. file size) rather than EXIF data.
    tag_types_to_ignore = {'File','ExifTool'}

    #: Restrict output to these tags (mutually exclusive with tags_to_exclude).
    #:
    #: A handy subset for typical camera-trap queries:
    #:
    #: options.tags_to_include = ['DateTime','Model','Make','ExifImageWidth','ExifImageHeight','DateTime',
    #:                            'DateTimeOriginal','Orientation']
    tags_to_include = None

    #: Drop these tags from output (mutually exclusive with tags_to_include)
    tags_to_exclude = None

    #: Command used to invoke exiftool; either an absolute path to the
    #: executable or just "exiftool" if it's on the system path.
    exiftool_command_name = 'exiftool'

    #: Policy for byte-valued EXIF tags:
    #:
    #: 'convert_to_string': convert to a Python string
    #: 'delete': don't include at all
    #: 'raw': include as a byte string
    byte_handling = 'convert_to_string' # 'convert_to_string','delete','raw'

    #: Extraction backend: 'pil' or 'exiftool'
    processing_library = 'pil' # 'exiftool','pil'
|
|
86
|
-
#%% Functions
|
|
87
|
-
|
|
88
|
-
def _get_exif_ifd(exif):
    """
    Read tags from the EXIF IFD by finding the EXIF offset tag and reading
    the corresponding IFD directly.

    See https://github.com/python-pillow/Pillow/issues/5863

    Args:
        exif (PIL.Image.Exif): EXIF object, as returned by Image.getexif()

    Returns:
        dict: a dict mapping tag names (or raw tag IDs for unrecognized tags)
        to values
    """

    # Find the tag ID of the "ExifOffset" pointer (0x8769 in the EXIF
    # standard).  The original implementation used the leaked loop variable
    # from a for/break search, which would silently use the *last* tag ID if
    # "ExifOffset" were ever missing from ExifTags.TAGS; fall back to the
    # standard constant instead.
    exif_offset_key = next(
        (tag_id for tag_id, tag_name in ExifTags.TAGS.items()
         if tag_name == 'ExifOffset'),
        0x8769)

    info = exif.get_ifd(exif_offset_key)
    return {
        ExifTags.TAGS.get(tag_id, tag_id): value
        for tag_id, value in info.items()
    }
|
|
106
|
-
def read_pil_exif(im,options=None):
    """
    Read all the EXIF data we know how to read from an image, using PIL. This is primarily
    an internal function; the main entry point for single-image EXIF information is
    read_exif_tags_for_image().

    Args:
        im (str or PIL.Image.Image): image (as a filename or an Image object) from which
            we should read EXIF data.
        options (ReadExifOptions, optional): parameters controlling metadata extraction

    Returns:
        dict: a dictionary mapping EXIF tag names to their values
    """

    if options is None:
        options = ReadExifOptions()

    image_name = '[image]'

    # If we were handed a filename, open the image ourselves; remember to close
    # it when we're done (the original implementation leaked this file handle).
    opened_image = False
    if isinstance(im,str):
        image_name = im
        im = Image.open(im)
        opened_image = True

    try:
        exif_tags = {}
        try:
            exif_info = im.getexif()
        except Exception:
            exif_info = None

        if exif_info is None:
            return exif_tags

        for k, v in exif_info.items():
            assert isinstance(k,str) or isinstance(k,int), \
                'Invalid EXIF key {}'.format(str(k))
            if k in ExifTags.TAGS:
                exif_tags[ExifTags.TAGS[k]] = str(v)
            else:
                # Unrecognized tag; keep the raw key
                exif_tags[k] = str(v)

        # Also pull tags from the EXIF IFD, which getexif() does not surface
        exif_ifd_tags = _get_exif_ifd(exif_info)

        for k in exif_ifd_tags.keys():
            v = exif_ifd_tags[k]
            if k in exif_tags:
                if options.verbose:
                    print('Warning: redundant EXIF values for {} in {}:\n{}\n{}'.format(
                        k,image_name,exif_tags[k],v))
            else:
                exif_tags[k] = v

        exif_tag_names = list(exif_tags.keys())

        # Type conversion and cleanup
        #
        # Most quirky types will get serialized to string when we write to .json.
        for k in exif_tag_names:

            if isinstance(exif_tags[k],bytes):

                if options.byte_handling == 'delete':
                    del exif_tags[k]
                elif options.byte_handling == 'raw':
                    pass
                else:
                    assert options.byte_handling == 'convert_to_string'
                    exif_tags[k] = str(exif_tags[k])

            elif isinstance(exif_tags[k],str):

                exif_tags[k] = exif_tags[k].strip()

        return exif_tags

    finally:
        # Only close images we opened here; Image objects passed in by the
        # caller remain the caller's responsibility.
        if opened_image:
            im.close()

# ...read_pil_exif()
181
|
-
|
|
182
|
-
|
|
183
|
-
def format_datetime_as_exif_datetime_string(dt):
    """
    Render a Python datetime object using the standard EXIF datetime
    string format ('%Y:%m:%d %H:%M:%S').

    Args:
        dt (datetime): the datetime to render

    Returns:
        str: [dt] formatted as an EXIF-style datetime string
    """

    return dt.strftime('%Y:%m:%d %H:%M:%S')
|
191
|
-
|
|
192
|
-
def parse_exif_datetime_string(s,verbose=False):
    """
    Exif datetimes are strings, but in a standard format:

    %Y:%m:%d %H:%M:%S

    Parses one of those strings into a Python datetime object.

    Args:
        s (str): datetime string to parse, should be in standard EXIF datetime format
        verbose (bool, optional): enable additional debug output

    Returns:
        datetime: the datetime object created from [s], or None if parsing failed
    """

    # The original docstring opened with four quote characters (""""), which
    # left a stray quote in the rendered documentation; fixed here.
    dt = None
    try:
        dt = datetime.strptime(s, '%Y:%m:%d %H:%M:%S')
    except Exception:
        if verbose:
            print('Warning: could not parse datetime {}'.format(str(s)))
    return dt
|
-
|
|
217
|
-
def _filter_tags(tags,options):
|
|
218
|
-
"""
|
|
219
|
-
Internal function used to include/exclude specific tags from the exif_tags
|
|
220
|
-
dict.
|
|
221
|
-
"""
|
|
222
|
-
|
|
223
|
-
if options is None:
|
|
224
|
-
return tags
|
|
225
|
-
if options.tags_to_include is None and options.tags_to_exclude is None:
|
|
226
|
-
return tags
|
|
227
|
-
if options.tags_to_include is not None:
|
|
228
|
-
assert options.tags_to_exclude is None, "tags_to_include and tags_to_exclude are incompatible"
|
|
229
|
-
tags_to_return = {}
|
|
230
|
-
for tag_name in tags.keys():
|
|
231
|
-
if tag_name in options.tags_to_include:
|
|
232
|
-
tags_to_return[tag_name] = tags[tag_name]
|
|
233
|
-
return tags_to_return
|
|
234
|
-
if options.tags_to_exclude is not None:
|
|
235
|
-
assert options.tags_to_include is None, "tags_to_include and tags_to_exclude are incompatible"
|
|
236
|
-
tags_to_return = {}
|
|
237
|
-
for tag_name in tags.keys():
|
|
238
|
-
if tag_name not in options.tags_to_exclude:
|
|
239
|
-
tags_to_return[tag_name] = tags[tag_name]
|
|
240
|
-
return tags_to_return
|
|
241
|
-
|
|
242
|
-
|
|
243
|
-
def read_exif_tags_for_image(file_path,options=None):
    """
    Get relevant fields from EXIF data for an image.

    Args:
        file_path (str): image file to read
        options (ReadExifOptions, optional): parameters controlling metadata extraction

    Returns:
        dict: a dict with fields 'status' (str) and 'tags'. The exact format of 'tags'
        depends on options.processing_library:

        - For exiftool, 'tags' is a list of lists, where each element is (type/tag/value)
        - For PIL, 'tags' is a dict (str:str)
    """

    if options is None:
        options = ReadExifOptions()

    result = {'status':'unknown','tags':[]}

    if options.processing_library == 'pil':

        try:
            exif_tags = read_pil_exif(file_path,options)

        except Exception as e:
            if options.verbose:
                print('Read failure for image {}: {}'.format(
                    file_path,str(e)))
            result['status'] = 'read_failure'
            result['error'] = str(e)

        if result['status'] == 'unknown':
            if exif_tags is None:
                result['status'] = 'empty_read'
            else:
                result['status'] = 'success'
                result['tags'] = _filter_tags(exif_tags,options)

        return result

    elif options.processing_library == 'exiftool':

        # -G means "Print group name for each tag", e.g. print:
        #
        # [File] Bits Per Sample : 8
        #
        # ...instead of:
        #
        # Bits Per Sample : 8
        proc = subprocess.Popen([options.exiftool_command_name, '-G', file_path],
                                stdout=subprocess.PIPE, encoding='utf8')

        exif_lines = proc.stdout.readlines()

        # Reap the child process; the original implementation never waited on
        # [proc], which left a zombie process behind until garbage collection.
        # readlines() has already drained stdout, so this cannot deadlock.
        proc.wait()

        exif_lines = [s.strip() for s in exif_lines]
        if ( (exif_lines is None) or (len(exif_lines) == 0) or not \
            any([s.lower().startswith('[exif]') for s in exif_lines])):
            result['status'] = 'failure'
            return result

        # A list of three-element lists (type/tag/value)
        exif_tags = []

        # line_raw = exif_lines[0]
        for line_raw in exif_lines:

            # A typical line:
            #
            # [ExifTool] ExifTool Version Number : 12.13

            line = line_raw.strip()

            # Split on the first occurrence of ":"
            tokens = line.split(':',1)
            assert(len(tokens) == 2), 'EXIF tokenization failure ({} tokens, expected 2)'.format(
                len(tokens))

            field_value = tokens[1].strip()

            # The left side is "[Type] Tag Name"; split off the bracketed type
            field_name_type = tokens[0].strip()
            field_name_type_tokens = field_name_type.split(None,1)
            assert len(field_name_type_tokens) == 2, 'EXIF tokenization failure'

            field_type = field_name_type_tokens[0].strip()
            assert field_type.startswith('[') and field_type.endswith(']'), \
                'Invalid EXIF field {}'.format(field_type)
            field_type = field_type[1:-1]

            if field_type in options.tag_types_to_ignore:
                if options.verbose:
                    print('Ignoring tag with type {}'.format(field_type))
                continue

            field_name = field_name_type_tokens[1].strip()
            if options.tags_to_exclude is not None and field_name in options.tags_to_exclude:
                continue
            if options.tags_to_include is not None and field_name not in options.tags_to_include:
                continue
            tag = [field_type,field_name,field_value]

            exif_tags.append(tag)

        # ...for each output line

        result['status'] = 'success'
        result['tags'] = exif_tags
        return result

    else:

        raise ValueError('Unknown processing library {}'.format(
            options.processing_library))

    # ...which processing library are we using?

# ...read_exif_tags_for_image()
|
|
358
|
-
|
|
359
|
-
def _populate_exif_data(im, image_base, options=None):
    """
    Populate EXIF data into the 'exif_tags' field in the image object [im].

    im['file_name'] should be prepopulated, relative to image_base.

    Returns a modified version of [im], also modifies [im] in place.
    """

    if options is None:
        options = ReadExifOptions()

    relative_path = im['file_name']
    if options.verbose:
        print('Processing {}'.format(relative_path))

    try:

        absolute_path = os.path.join(image_base,relative_path)
        assert os.path.isfile(absolute_path), 'Could not find file {}'.format(absolute_path)

        result = read_exif_tags_for_image(absolute_path,options)

        # Store tags on success, None on any other status; always propagate
        # the status string.
        if result['status'] == 'success':
            im['exif_tags'] = result['tags']
        else:
            im['exif_tags'] = None
        im['status'] = result['status']

        if 'error' in result:
            im['error'] = result['error']
            if options.verbose:
                print('Error reading EXIF data for {}'.format(absolute_path))

    except Exception as e:

        error_string = 'Error on {}: {}'.format(relative_path,str(e))
        print(error_string)
        im['error'] = error_string
        # NOTE(review): 'read failure' (with a space) differs from the
        # 'read_failure' status used in read_exif_tags_for_image; preserved
        # as-is in case downstream code compares against this exact string.
        im['status'] = 'read failure'
        im['exif_tags'] = None

    return im

# ..._populate_exif_data()
402
|
-
|
|
403
|
-
|
|
404
|
-
def _create_image_objects(image_files,recursive=True):
    """
    Create empty image objects for every image in [image_files], which can be a
    list of relative paths (which will get stored without processing, so the base
    path doesn't matter here), or a folder name.

    Returns a list of dicts with field 'file_name' (a relative path).

    "recursive" is ignored if "image_files" is a list.
    """

    # If we were given a folder rather than a list, enumerate *relative* paths
    if isinstance(image_files,str):
        print('Enumerating image files in {}'.format(image_files))
        assert os.path.isdir(image_files), 'Invalid image folder {}'.format(image_files)
        image_files = find_images(image_files,
                                  recursive=recursive,
                                  return_relative_paths=True,
                                  convert_slashes=True)

    images = [{'file_name':fn} for fn in image_files]

    # Optionally trim the list when debugging
    if debug_max_images is not None:
        print('Trimming input list to {} images'.format(debug_max_images))
        images = images[0:debug_max_images]

    return images
435
|
-
|
|
436
|
-
|
|
437
|
-
def _populate_exif_for_images(image_base,images,options=None):
    """
    Main worker loop: read EXIF data for each image object in [images] and
    populate the image objects.

    Args:
        image_base (str): base folder to which 'file_name' fields are relative
        images (list): list of dicts with the field 'file_name' containing
            a relative path (relative to 'image_base')
        options (ReadExifOptions, optional): parameters controlling metadata extraction

    Returns:
        list: the (modified in place) image objects
    """

    if options is None:
        options = ReadExifOptions()

    if options.n_workers == 1:

        results = []
        for im in tqdm(images):
            results.append(_populate_exif_data(im,image_base,options))

    else:

        from functools import partial
        if options.use_threads:
            print('Starting parallel thread pool with {} workers'.format(options.n_workers))
            pool = ThreadPool(options.n_workers)
        else:
            print('Starting parallel process pool with {} workers'.format(options.n_workers))
            pool = Pool(options.n_workers)

        # Make sure the worker threads/processes get shut down; the original
        # implementation never closed the pool, leaking workers.
        try:
            results = list(tqdm(pool.imap(partial(_populate_exif_data,image_base=image_base,
                                                  options=options),images),total=len(images)))
        finally:
            pool.close()
            pool.join()

    return results
|
-
|
|
470
|
-
|
|
471
|
-
def _write_exif_results(results,output_file):
|
|
472
|
-
"""
|
|
473
|
-
Write EXIF information to [output_file].
|
|
474
|
-
|
|
475
|
-
'results' is a list of dicts with fields 'exif_tags' and 'file_name'.
|
|
476
|
-
|
|
477
|
-
Writes to .csv or .json depending on the extension of 'output_file'.
|
|
478
|
-
"""
|
|
479
|
-
|
|
480
|
-
if output_file.endswith('.json'):
|
|
481
|
-
|
|
482
|
-
with open(output_file,'w') as f:
|
|
483
|
-
json.dump(results,f,indent=1,default=str)
|
|
484
|
-
|
|
485
|
-
elif output_file.endswith('.csv'):
|
|
486
|
-
|
|
487
|
-
# Find all EXIF tags that exist in any image
|
|
488
|
-
all_keys = set()
|
|
489
|
-
for im in results:
|
|
490
|
-
|
|
491
|
-
keys_this_image = set()
|
|
492
|
-
exif_tags = im['exif_tags']
|
|
493
|
-
file_name = im['file_name']
|
|
494
|
-
for tag in exif_tags:
|
|
495
|
-
tag_name = tag[1]
|
|
496
|
-
assert tag_name not in keys_this_image, \
|
|
497
|
-
'Error: tag {} appears twice in image {}'.format(
|
|
498
|
-
tag_name,file_name)
|
|
499
|
-
all_keys.add(tag_name)
|
|
500
|
-
|
|
501
|
-
# ...for each tag in this image
|
|
502
|
-
|
|
503
|
-
# ...for each image
|
|
504
|
-
|
|
505
|
-
all_keys = sorted(list(all_keys))
|
|
506
|
-
|
|
507
|
-
header = ['File Name']
|
|
508
|
-
header.extend(all_keys)
|
|
509
|
-
|
|
510
|
-
import csv
|
|
511
|
-
with open(output_file,'w') as csvfile:
|
|
512
|
-
|
|
513
|
-
writer = csv.writer(csvfile)
|
|
514
|
-
|
|
515
|
-
# Write header
|
|
516
|
-
writer.writerow(header)
|
|
517
|
-
|
|
518
|
-
for im in results:
|
|
519
|
-
|
|
520
|
-
row = [im['file_name']]
|
|
521
|
-
kvp_this_image = {tag[1]:tag[2] for tag in im['exif_tags']}
|
|
522
|
-
|
|
523
|
-
for i_key,key in enumerate(all_keys):
|
|
524
|
-
value = ''
|
|
525
|
-
if key in kvp_this_image:
|
|
526
|
-
value = kvp_this_image[key]
|
|
527
|
-
row.append(value)
|
|
528
|
-
# ...for each key that *might* be present in this image
|
|
529
|
-
|
|
530
|
-
assert len(row) == len(header)
|
|
531
|
-
|
|
532
|
-
writer.writerow(row)
|
|
533
|
-
|
|
534
|
-
# ...for each image
|
|
535
|
-
|
|
536
|
-
# ...with open()
|
|
537
|
-
|
|
538
|
-
else:
|
|
539
|
-
|
|
540
|
-
raise ValueError('Could not determine output type from file {}'.format(
|
|
541
|
-
output_file))
|
|
542
|
-
|
|
543
|
-
# ...if we're writing to .json/.csv
|
|
544
|
-
|
|
545
|
-
print('Wrote results to {}'.format(output_file))
|
|
546
|
-
|
|
547
|
-
|
|
548
|
-
def read_exif_from_folder(input_folder,output_file=None,options=None,filenames=None,recursive=True):
    """
    Read EXIF data for a folder of images.

    Args:
        input_folder (str): folder to process; if this is None, [filenames] should
            be a list of absolute paths
        output_file (str, optional): .json or .csv file to which we should write
            results; if this is None, results are returned but not written to disk
        options (ReadExifOptions, optional): parameters controlling metadata extraction
        filenames (list, optional): allowlist of relative filenames (if [input_folder]
            is not None) or a list of absolute filenames (if [input_folder] is None)
        recursive (bool, optional): whether to recurse into [input_folder]; not
            relevant if [input_folder] is None

    Returns:
        dict: a dictionary mapping relative filenames to EXIF data, whose format
        depends on whether we're using PIL or exiftool.
    """

    if options is None:
        options = ReadExifOptions()

    # The include and exclude lists are mutually exclusive
    if options.tags_to_include is not None:
        assert options.tags_to_exclude is None, "tags_to_include and tags_to_exclude are incompatible"
    if options.tags_to_exclude is not None:
        assert options.tags_to_include is None, "tags_to_include and tags_to_exclude are incompatible"

    # Normalize "no folder" to an empty string, then validate the folder if given
    if input_folder is None:
        input_folder = ''
    if input_folder:
        assert os.path.isdir(input_folder), \
            '{} is not a valid folder'.format(input_folder)

    assert input_folder or (filenames is not None), \
        'Must specify either a folder or a list of files'

    if output_file is not None:

        assert output_file.lower().endswith(('.json','.csv')), \
            'I only know how to write results to .json or .csv'

        # Fail early if the output file isn't writable, rather than after a
        # long extraction pass
        try:
            with open(output_file, 'a') as f:
                if not f.writable():
                    raise IOError('File not writable')
        except Exception:
            print('Could not write to file {}'.format(output_file))
            raise

    if options.processing_library == 'exif':
        assert is_executable(options.exiftool_command_name), 'exiftool not available'

    # Build the list of image objects, either by enumerating the folder or
    # from the caller-supplied list
    if filenames is None:
        image_objects = _create_image_objects(input_folder,recursive=recursive)
    else:
        assert isinstance(filenames,list)
        image_objects = _create_image_objects(filenames)

    exif_results = _populate_exif_for_images(input_folder,image_objects,options)

    if output_file is not None:
        try:
            _write_exif_results(exif_results,output_file)
        except Exception as e:
            if not options.allow_write_error:
                raise
            print('Warning: error serializing EXIF data: {}'.format(str(e)))

    return exif_results
|
|
620
|
-
|
|
621
|
-
|
|
622
|
-
#%% Interactive driver

# Scratch cells for interactive use in an IDE; guarded by "if False" so
# nothing here runs when the module is imported or executed as a script.

if False:

    #%%

    # Configure and run EXIF extraction on a local test folder
    input_folder = r'C:\temp\md-name-testing'
    output_file = None # r'C:\temp\md-name-testing\exif.json'
    options = ReadExifOptions()
    options.verbose = False
    options.n_workers = 10
    options.use_threads = False
    options.processing_library = 'pil'
    # options.processing_library = 'exiftool'
    options.tags_to_include = ['DateTime','Model','Make','ExifImageWidth','ExifImageHeight','DateTime','DateTimeOriginal','Orientation']
    # options.tags_to_exclude = ['MakerNote']

    results = read_exif_from_folder(input_folder,output_file,options)

    #%%

    # Reload the serialized results (assumes output_file was set to a real
    # path above — TODO confirm before running this cell)
    with open(output_file,'r') as f:
        d = json.load(f)
|
|
645
|
-
|
|
646
|
-
|
|
647
|
-
#%% Command-line driver
|
|
648
|
-
|
|
649
|
-
import argparse
|
|
650
|
-
import sys
|
|
651
|
-
|
|
652
|
-
def main():
    """
    Command-line driver: read EXIF information from all images in a folder,
    and write the results to a .json or .csv file.
    """

    options = ReadExifOptions()

    parser = argparse.ArgumentParser(description=('Read EXIF information from all images in' + \
                                     ' a folder, and write the results to .csv or .json'))

    parser.add_argument('input_folder', type=str,
                        help='Folder of images from which we should read EXIF information')
    # Bug fix: this help string previously said ".json" only, but .csv output
    # is also supported (and is accepted by read_exif_from_folder)
    parser.add_argument('output_file', type=str,
                        help='Output file (.json or .csv) to which we should write EXIF information')
    parser.add_argument('--n_workers', type=int, default=1,
                        help='Number of concurrent workers to use (defaults to 1)')
    parser.add_argument('--use_threads', action='store_true',
                        help='Use threads (instead of processes) for multitasking')
    parser.add_argument('--processing_library', type=str, default=options.processing_library,
                        help='Processing library (exif or pil)')

    # With no arguments, print help and exit rather than erroring out
    if len(sys.argv[1:]) == 0:
        parser.print_help()
        parser.exit()

    args = parser.parse_args()

    # Copy parsed arguments onto the options object (matching field names)
    args_to_object(args, options)
    options.processing_library = options.processing_library.lower()

    read_exif_from_folder(args.input_folder,args.output_file,options)
|
|
679
|
-
|
|
680
|
-
# Script entry point: run the command-line driver
if __name__ == '__main__':
    main()
|