PyPI - megadetector - Versions diffs - 5.0.9__py3-none-any.whl → 5.0.11__py3-none-any.whl - Mend

megadetector 5.0.9-py3-none-any.whl → 5.0.11-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of megadetector might be problematic. Click here for more details.

Files changed (226) hide show

{megadetector-5.0.9.dist-info → megadetector-5.0.11.dist-info}/LICENSE +0 -0
{megadetector-5.0.9.dist-info → megadetector-5.0.11.dist-info}/METADATA +12 -11
megadetector-5.0.11.dist-info/RECORD +5 -0
megadetector-5.0.11.dist-info/top_level.txt +1 -0
api/__init__.py +0 -0
api/batch_processing/__init__.py +0 -0
api/batch_processing/api_core/__init__.py +0 -0
api/batch_processing/api_core/batch_service/__init__.py +0 -0
api/batch_processing/api_core/batch_service/score.py +0 -439
api/batch_processing/api_core/server.py +0 -294
api/batch_processing/api_core/server_api_config.py +0 -98
api/batch_processing/api_core/server_app_config.py +0 -55
api/batch_processing/api_core/server_batch_job_manager.py +0 -220
api/batch_processing/api_core/server_job_status_table.py +0 -152
api/batch_processing/api_core/server_orchestration.py +0 -360
api/batch_processing/api_core/server_utils.py +0 -92
api/batch_processing/api_core_support/__init__.py +0 -0
api/batch_processing/api_core_support/aggregate_results_manually.py +0 -46
api/batch_processing/api_support/__init__.py +0 -0
api/batch_processing/api_support/summarize_daily_activity.py +0 -152
api/batch_processing/data_preparation/__init__.py +0 -0
api/batch_processing/data_preparation/manage_local_batch.py +0 -2391
api/batch_processing/data_preparation/manage_video_batch.py +0 -327
api/batch_processing/integration/digiKam/setup.py +0 -6
api/batch_processing/integration/digiKam/xmp_integration.py +0 -465
api/batch_processing/integration/eMammal/test_scripts/config_template.py +0 -5
api/batch_processing/integration/eMammal/test_scripts/push_annotations_to_emammal.py +0 -126
api/batch_processing/integration/eMammal/test_scripts/select_images_for_testing.py +0 -55
api/batch_processing/postprocessing/__init__.py +0 -0
api/batch_processing/postprocessing/add_max_conf.py +0 -64
api/batch_processing/postprocessing/categorize_detections_by_size.py +0 -163
api/batch_processing/postprocessing/combine_api_outputs.py +0 -249
api/batch_processing/postprocessing/compare_batch_results.py +0 -958
api/batch_processing/postprocessing/convert_output_format.py +0 -397
api/batch_processing/postprocessing/load_api_results.py +0 -195
api/batch_processing/postprocessing/md_to_coco.py +0 -310
api/batch_processing/postprocessing/md_to_labelme.py +0 -330
api/batch_processing/postprocessing/merge_detections.py +0 -401
api/batch_processing/postprocessing/postprocess_batch_results.py +0 -1904
api/batch_processing/postprocessing/remap_detection_categories.py +0 -170
api/batch_processing/postprocessing/render_detection_confusion_matrix.py +0 -661
api/batch_processing/postprocessing/repeat_detection_elimination/find_repeat_detections.py +0 -211
api/batch_processing/postprocessing/repeat_detection_elimination/remove_repeat_detections.py +0 -82
api/batch_processing/postprocessing/repeat_detection_elimination/repeat_detections_core.py +0 -1631
api/batch_processing/postprocessing/separate_detections_into_folders.py +0 -731
api/batch_processing/postprocessing/subset_json_detector_output.py +0 -696
api/batch_processing/postprocessing/top_folders_to_bottom.py +0 -223
api/synchronous/__init__.py +0 -0
api/synchronous/api_core/animal_detection_api/__init__.py +0 -0
api/synchronous/api_core/animal_detection_api/api_backend.py +0 -152
api/synchronous/api_core/animal_detection_api/api_frontend.py +0 -266
api/synchronous/api_core/animal_detection_api/config.py +0 -35
api/synchronous/api_core/animal_detection_api/data_management/annotations/annotation_constants.py +0 -47
api/synchronous/api_core/animal_detection_api/detection/detector_training/copy_checkpoints.py +0 -43
api/synchronous/api_core/animal_detection_api/detection/detector_training/model_main_tf2.py +0 -114
api/synchronous/api_core/animal_detection_api/detection/process_video.py +0 -543
api/synchronous/api_core/animal_detection_api/detection/pytorch_detector.py +0 -304
api/synchronous/api_core/animal_detection_api/detection/run_detector.py +0 -627
api/synchronous/api_core/animal_detection_api/detection/run_detector_batch.py +0 -1029
api/synchronous/api_core/animal_detection_api/detection/run_inference_with_yolov5_val.py +0 -581
api/synchronous/api_core/animal_detection_api/detection/run_tiled_inference.py +0 -754
api/synchronous/api_core/animal_detection_api/detection/tf_detector.py +0 -165
api/synchronous/api_core/animal_detection_api/detection/video_utils.py +0 -495
api/synchronous/api_core/animal_detection_api/md_utils/azure_utils.py +0 -174
api/synchronous/api_core/animal_detection_api/md_utils/ct_utils.py +0 -262
api/synchronous/api_core/animal_detection_api/md_utils/directory_listing.py +0 -251
api/synchronous/api_core/animal_detection_api/md_utils/matlab_porting_tools.py +0 -97
api/synchronous/api_core/animal_detection_api/md_utils/path_utils.py +0 -416
api/synchronous/api_core/animal_detection_api/md_utils/process_utils.py +0 -110
api/synchronous/api_core/animal_detection_api/md_utils/sas_blob_utils.py +0 -509
api/synchronous/api_core/animal_detection_api/md_utils/string_utils.py +0 -59
api/synchronous/api_core/animal_detection_api/md_utils/url_utils.py +0 -144
api/synchronous/api_core/animal_detection_api/md_utils/write_html_image_list.py +0 -226
api/synchronous/api_core/animal_detection_api/md_visualization/visualization_utils.py +0 -841
api/synchronous/api_core/tests/__init__.py +0 -0
api/synchronous/api_core/tests/load_test.py +0 -110
classification/__init__.py +0 -0
classification/aggregate_classifier_probs.py +0 -108
classification/analyze_failed_images.py +0 -227
classification/cache_batchapi_outputs.py +0 -198
classification/create_classification_dataset.py +0 -627
classification/crop_detections.py +0 -516
classification/csv_to_json.py +0 -226
classification/detect_and_crop.py +0 -855
classification/efficientnet/__init__.py +0 -9
classification/efficientnet/model.py +0 -415
classification/efficientnet/utils.py +0 -610
classification/evaluate_model.py +0 -520
classification/identify_mislabeled_candidates.py +0 -152
classification/json_to_azcopy_list.py +0 -63
classification/json_validator.py +0 -695
classification/map_classification_categories.py +0 -276
classification/merge_classification_detection_output.py +0 -506
classification/prepare_classification_script.py +0 -194
classification/prepare_classification_script_mc.py +0 -228
classification/run_classifier.py +0 -286
classification/save_mislabeled.py +0 -110
classification/train_classifier.py +0 -825
classification/train_classifier_tf.py +0 -724
classification/train_utils.py +0 -322
data_management/__init__.py +0 -0
data_management/annotations/__init__.py +0 -0
data_management/annotations/annotation_constants.py +0 -34
data_management/camtrap_dp_to_coco.py +0 -238
data_management/cct_json_utils.py +0 -395
data_management/cct_to_md.py +0 -176
data_management/cct_to_wi.py +0 -289
data_management/coco_to_labelme.py +0 -272
data_management/coco_to_yolo.py +0 -662
data_management/databases/__init__.py +0 -0
data_management/databases/add_width_and_height_to_db.py +0 -33
data_management/databases/combine_coco_camera_traps_files.py +0 -206
data_management/databases/integrity_check_json_db.py +0 -477
data_management/databases/subset_json_db.py +0 -115
data_management/generate_crops_from_cct.py +0 -149
data_management/get_image_sizes.py +0 -188
data_management/importers/add_nacti_sizes.py +0 -52
data_management/importers/add_timestamps_to_icct.py +0 -79
data_management/importers/animl_results_to_md_results.py +0 -158
data_management/importers/auckland_doc_test_to_json.py +0 -372
data_management/importers/auckland_doc_to_json.py +0 -200
data_management/importers/awc_to_json.py +0 -189
data_management/importers/bellevue_to_json.py +0 -273
data_management/importers/cacophony-thermal-importer.py +0 -796
data_management/importers/carrizo_shrubfree_2018.py +0 -268
data_management/importers/carrizo_trail_cam_2017.py +0 -287
data_management/importers/cct_field_adjustments.py +0 -57
data_management/importers/channel_islands_to_cct.py +0 -913
data_management/importers/eMammal/copy_and_unzip_emammal.py +0 -180
data_management/importers/eMammal/eMammal_helpers.py +0 -249
data_management/importers/eMammal/make_eMammal_json.py +0 -223
data_management/importers/ena24_to_json.py +0 -275
data_management/importers/filenames_to_json.py +0 -385
data_management/importers/helena_to_cct.py +0 -282
data_management/importers/idaho-camera-traps.py +0 -1407
data_management/importers/idfg_iwildcam_lila_prep.py +0 -294
data_management/importers/jb_csv_to_json.py +0 -150
data_management/importers/mcgill_to_json.py +0 -250
data_management/importers/missouri_to_json.py +0 -489
data_management/importers/nacti_fieldname_adjustments.py +0 -79
data_management/importers/noaa_seals_2019.py +0 -181
data_management/importers/pc_to_json.py +0 -365
data_management/importers/plot_wni_giraffes.py +0 -123
data_management/importers/prepare-noaa-fish-data-for-lila.py +0 -359
data_management/importers/prepare_zsl_imerit.py +0 -131
data_management/importers/rspb_to_json.py +0 -356
data_management/importers/save_the_elephants_survey_A.py +0 -320
data_management/importers/save_the_elephants_survey_B.py +0 -332
data_management/importers/snapshot_safari_importer.py +0 -758
data_management/importers/snapshot_safari_importer_reprise.py +0 -665
data_management/importers/snapshot_serengeti_lila.py +0 -1067
data_management/importers/snapshotserengeti/make_full_SS_json.py +0 -150
data_management/importers/snapshotserengeti/make_per_season_SS_json.py +0 -153
data_management/importers/sulross_get_exif.py +0 -65
data_management/importers/timelapse_csv_set_to_json.py +0 -490
data_management/importers/ubc_to_json.py +0 -399
data_management/importers/umn_to_json.py +0 -507
data_management/importers/wellington_to_json.py +0 -263
data_management/importers/wi_to_json.py +0 -441
data_management/importers/zamba_results_to_md_results.py +0 -181
data_management/labelme_to_coco.py +0 -548
data_management/labelme_to_yolo.py +0 -272
data_management/lila/__init__.py +0 -0
data_management/lila/add_locations_to_island_camera_traps.py +0 -97
data_management/lila/add_locations_to_nacti.py +0 -147
data_management/lila/create_lila_blank_set.py +0 -557
data_management/lila/create_lila_test_set.py +0 -151
data_management/lila/create_links_to_md_results_files.py +0 -106
data_management/lila/download_lila_subset.py +0 -177
data_management/lila/generate_lila_per_image_labels.py +0 -515
data_management/lila/get_lila_annotation_counts.py +0 -170
data_management/lila/get_lila_image_counts.py +0 -111
data_management/lila/lila_common.py +0 -300
data_management/lila/test_lila_metadata_urls.py +0 -132
data_management/ocr_tools.py +0 -874
data_management/read_exif.py +0 -681
data_management/remap_coco_categories.py +0 -84
data_management/remove_exif.py +0 -66
data_management/resize_coco_dataset.py +0 -189
data_management/wi_download_csv_to_coco.py +0 -246
data_management/yolo_output_to_md_output.py +0 -441
data_management/yolo_to_coco.py +0 -676
detection/__init__.py +0 -0
detection/detector_training/__init__.py +0 -0
detection/detector_training/model_main_tf2.py +0 -114
detection/process_video.py +0 -703
detection/pytorch_detector.py +0 -337
detection/run_detector.py +0 -779
detection/run_detector_batch.py +0 -1219
detection/run_inference_with_yolov5_val.py +0 -917
detection/run_tiled_inference.py +0 -935
detection/tf_detector.py +0 -188
detection/video_utils.py +0 -606
docs/source/conf.py +0 -43
md_utils/__init__.py +0 -0
md_utils/azure_utils.py +0 -174
md_utils/ct_utils.py +0 -612
md_utils/directory_listing.py +0 -246
md_utils/md_tests.py +0 -968
md_utils/path_utils.py +0 -1044
md_utils/process_utils.py +0 -157
md_utils/sas_blob_utils.py +0 -509
md_utils/split_locations_into_train_val.py +0 -228
md_utils/string_utils.py +0 -92
md_utils/url_utils.py +0 -323
md_utils/write_html_image_list.py +0 -225
md_visualization/__init__.py +0 -0
md_visualization/plot_utils.py +0 -293
md_visualization/render_images_with_thumbnails.py +0 -275
md_visualization/visualization_utils.py +0 -1537
md_visualization/visualize_db.py +0 -551
md_visualization/visualize_detector_output.py +0 -406
megadetector-5.0.9.dist-info/RECORD +0 -224
megadetector-5.0.9.dist-info/top_level.txt +0 -8
taxonomy_mapping/__init__.py +0 -0
taxonomy_mapping/map_lila_taxonomy_to_wi_taxonomy.py +0 -491
taxonomy_mapping/map_new_lila_datasets.py +0 -154
taxonomy_mapping/prepare_lila_taxonomy_release.py +0 -142
taxonomy_mapping/preview_lila_taxonomy.py +0 -591
taxonomy_mapping/retrieve_sample_image.py +0 -71
taxonomy_mapping/simple_image_download.py +0 -218
taxonomy_mapping/species_lookup.py +0 -834
taxonomy_mapping/taxonomy_csv_checker.py +0 -159
taxonomy_mapping/taxonomy_graph.py +0 -346
taxonomy_mapping/validate_lila_category_mappings.py +0 -83
{megadetector-5.0.9.dist-info → megadetector-5.0.11.dist-info}/WHEEL +0 -0

data_management/coco_to_yolo.py DELETED Viewed

@@ -1,662 +0,0 @@
-"""
-coco_to_yolo.py
-Converts a COCO-formatted dataset to a YOLO-formatted dataset, flattening
-the dataset (to a single folder) in the process.
-If the input and output folders are the same, writes .txt files to the input folder,
-and neither moves nor modifies images.
-Currently ignores segmentation masks, and errors if an annotation has a
-segmentation polygon but no bbox.
-Has only been tested on a handful of COCO Camera Traps data sets; if you
-use it for more general COCO conversion, YMMV.
-"""
-#%% Imports and constants
-import json
-import os
-import shutil
-from collections import defaultdict
-from tqdm import tqdm
-from md_utils.path_utils import safe_create_link,find_images
-#%% Support functions
-def write_yolo_dataset_file(yolo_dataset_file,
-                            dataset_base_dir,
-                            class_list,
-                            train_folder_relative=None,
-                            val_folder_relative=None,
-                            test_folder_relative=None):
-    """
-    Write a YOLOv5 dataset.yaml file to the absolute path [yolo_dataset_file] (should
-    have a .yaml extension, though it's only a warning if it doesn't).
-    Args:
-        yolo_dataset_file (str): the file, typically ending in .yaml or .yml, to write.
-            Does not have to be within dataset_base_dir.
-        dataset_base_dir (str): the absolute base path of the YOLO dataset
-        class_list (list or str): an ordered list of class names (the first item will be class 0,
-            etc.), or the name of a text file containing an ordered list of class names (one per
-            line, starting from class zero).
-        train_folder_relative (str, optional): value written as the 'train' entry; the entry
-            is omitted if this is None.  Presumably relative to [dataset_base_dir], per the
-            parameter name; this function writes the value as-is.
-        val_folder_relative (str, optional): value written as the 'val' entry; the entry is
-            omitted if this is None
-        test_folder_relative (str, optional): value written as the 'test' entry; the entry is
-            omitted if this is None
-    """
-    # Read class names
-    if isinstance(class_list,str):
-        # [class_list] is a filename: one class name per line, blank lines are ignored
-        with open(class_list,'r') as f:
-            class_lines = [s.strip() for s in f.readlines()]
-        class_list = [s for s in class_lines if len(s) > 0]
-    if not yolo_dataset_file.endswith(('.yml','.yaml')):
-        print('Warning: writing dataset file to a non-yml/yaml extension:\n{}'.format(
-            yolo_dataset_file))
-    # Write dataset.yaml
-    with open(yolo_dataset_file,'w') as f:
-        f.write('# Train/val sets\n')
-        f.write('path: {}\n'.format(dataset_base_dir))
-        if train_folder_relative is not None:
-            f.write('train: {}\n'.format(train_folder_relative))
-        if val_folder_relative is not None:
-            f.write('val: {}\n'.format(val_folder_relative))
-        if test_folder_relative is not None:
-            # This entry was previously written with the key 'val', which produced a
-            # duplicate 'val' key and no 'test' key whenever a test folder was supplied.
-            f.write('test: {}\n'.format(test_folder_relative))
-        f.write('\n')
-        f.write('# Classes\n')
-        f.write('names:\n')
-        for i_class,class_name in enumerate(class_list):
-            f.write('  {}: {}\n'.format(i_class,class_name))
-# ...def write_yolo_dataset_file(...)
-def coco_to_yolo(input_image_folder,
-                 output_folder,
-                 input_file,
-                 source_format='coco',
-                 overwrite_images=False,
-                 create_image_and_label_folders=False,
-                 class_file_name='classes.txt',
-                 allow_empty_annotations=False,
-                 clip_boxes=False,
-                 image_id_to_output_image_json_file=None,
-                 images_to_exclude=None,
-                 path_replacement_char='#',
-                 category_names_to_exclude=None,
-                 category_names_to_include=None,
-                 write_output=True,
-                 flatten_paths=True):
-    """
-    Converts a COCO-formatted dataset to a YOLO-formatted dataset, optionally flattening the
-    dataset to a single folder in the process.
-    If the input and output folders are the same, writes .txt files to the input folder,
-    and neither moves nor modifies images.
-    Currently ignores segmentation masks, and errors if an annotation has a
-    segmentation polygon but no bbox.
-    Args:
-        input_image_folder (str): the folder where images live; filenames in the COCO .json
-            file [input_file] should be relative to this folder
-        output_folder (str): the base folder for the YOLO dataset
-        input_file (str): a .json file in COCO format; can be the same as [input_image_folder], in which case
-            images are left alone.
-        source_format (str, optional): can be 'coco' (default) or 'coco_camera_traps'.  The only difference
-            is that when source_format is 'coco_camera_traps', we treat an image with a non-bbox
-            annotation with a category id of 0 as a special case, i.e. that's how an empty image
-            is indicated.  The original COCO standard is a little ambiguous on this issue.  If
-            source_format is 'coco', we either treat images as empty or error, depending on the value
-            of [allow_empty_annotations].  [allow_empty_annotations] has no effect if source_format is
-            'coco_camera_traps'.
-        create_image_and_label_folder (bool, optional): whether to create separate folders called 'images' and
-            'labels' in the YOLO output folder.  If create_image_and_label_folders is False,
-            a/b/c/image001.jpg will become a#b#c#image001.jpg, and the corresponding text file will
-            be a#b#c#image001.txt.  If create_image_and_label_folders is True, a/b/c/image001.jpg will become
-            images/a#b#c#image001.jpg, and the corresponding text file will be
-            labels/a#b#c#image001.txt.
-        clip_boxes (bool, optional): whether to clip bounding box coordinates to the range [0,1] before
-            converting to YOLO xywh format
-        image_id_to_output_image_json_file (str, optional): an optional *output* file, to which we will write
-            a mapping from image IDs to output file names
-        images_to_exclude (list, optional): a list of image files (relative paths in the input folder) that we
-            should ignore
-        path_replacement_char (str, optional): only relevant if [flatten_paths] is True; this is used to replace
-            path separators, e.g. if [path_replacement_char] is '#' and [flatten_paths] is True, a/b/c/d.jpg
-            becomes a#b#c#d.jpg
-        category_names_to_exclude (str, optional): category names that should not be represented in the
-            YOLO output; only impacts annotations, does not prevent copying images.  There's almost no reason
-            you would want to specify this and [category_names_to_include].
-        category_names_to_include (str, optional): allow-list of category names that should be represented in the
-            YOLO output; only impacts annotations, does not prevent copying images.  There's almost no reason
-            you would want to specify this and [category_names_to_exclude].
-        write_output (bool, optional): determines whether we actually copy images and write annotations;
-            setting this to False mostly puts this function in "dry run" "mode.  The class list
-            file is written regardless of the value of write_output.
-    Returns:
-        dict: information about the coco --> yolo mapping, containing at least the fields:
-        - class_list_filename: the filename to which we wrote the flat list of class names required
-          by the YOLO format.
-        - source_image_to_dest_image: a dict mapping source images to destination images
-        - coco_id_to_yolo_id: a dict mapping COCO category IDs to YOLO category IDs
-    """
-    ## Validate input
-    if category_names_to_include is not None and category_names_to_exclude is not None:
-        raise ValueError('category_names_to_include and category_names_to_exclude are mutually exclusive')
-    if output_folder is None:
-        output_folder = input_image_folder
-    if images_to_exclude is not None:
-        images_to_exclude = set(images_to_exclude)
-    if category_names_to_exclude is None:
-        category_names_to_exclude = {}
-    assert os.path.isdir(input_image_folder)
-    assert os.path.isfile(input_file)
-    os.makedirs(output_folder,exist_ok=True)
-    if (output_folder == input_image_folder) and (overwrite_images) and \
-        (not create_image_and_label_folders) and (not flatten_paths):
-            print('Warning: output folder and input folder are the same, disabling overwrite_images')
-            overwrite_images = False
-    ## Read input data
-    with open(input_file,'r') as f:
-        data = json.load(f)
-    ## Parse annotations
-    image_id_to_annotations = defaultdict(list)
-    # i_ann = 0; ann = data['annotations'][0]
-    for i_ann,ann in enumerate(data['annotations']):
-        # Make sure no annotations have *only* segmentation data
-        if ( \
-            ('segmentation' in ann.keys()) and \
-            (ann['segmentation'] is not None) and \
-            (len(ann['segmentation']) > 0) ) \
-            and \
-            (('bbox' not in ann.keys()) or (ann['bbox'] is None) or (len(ann['bbox'])==0)):
-                raise ValueError('Oops: segmentation data present without bbox information, ' + \
-                                 'this script isn\'t ready for this dataset')
-        image_id_to_annotations[ann['image_id']].append(ann)
-    print('Parsed annotations for {} images'.format(len(image_id_to_annotations)))
-    # Re-map class IDs to make sure they run from 0...n-classes-1
-    #
-    # Note: this allows unused categories in the output data set.  This is OK for
-    # some training pipelines, not for others.
-    next_category_id = 0
-    coco_id_to_yolo_id = {}
-    coco_id_to_name = {}
-    yolo_id_to_name = {}
-    coco_category_ids_to_exclude = set()
-    for category in data['categories']:
-        coco_id_to_name[category['id']] = category['name']
-        if (category_names_to_include is not None) and \
-            (category['name'] not in category_names_to_include):
-            coco_category_ids_to_exclude.add(category['id'])
-            continue
-        elif (category['name'] in category_names_to_exclude):
-            coco_category_ids_to_exclude.add(category['id'])
-            continue
-        assert category['id'] not in coco_id_to_yolo_id
-        coco_id_to_yolo_id[category['id']] = next_category_id
-        yolo_id_to_name[next_category_id] = category['name']
-        next_category_id += 1
-    ## Process images (everything but I/O)
-    # List of dictionaries with keys 'source_image','dest_image','bboxes','dest_txt'
-    images_to_copy = []
-    missing_images = []
-    excluded_images = []
-    image_names = set()
-    typical_image_extensions = set(['.jpg','.jpeg','.png','.gif','.tif','.bmp'])
-    printed_empty_annotation_warning = False
-    image_id_to_output_image_name = {}
-    print('Processing annotations')
-    n_clipped_boxes = 0
-    n_total_boxes = 0
-    # i_image = 0; im = data['images'][i_image]
-    for i_image,im in tqdm(enumerate(data['images']),total=len(data['images'])):
-        output_info = {}
-        source_image = os.path.join(input_image_folder,im['file_name'])
-        output_info['source_image'] = source_image
-        if images_to_exclude is not None and im['file_name'] in images_to_exclude:
-            excluded_images.append(im['file_name'])
-            continue
-        tokens = os.path.splitext(im['file_name'])
-        if tokens[1].lower() not in typical_image_extensions:
-            print('Warning: unusual image file name {}'.format(im['file_name']))
-        if flatten_paths:
-            image_name = tokens[0].replace('\\','/').replace('/',path_replacement_char) + \
-                '_' + str(i_image).zfill(6)
-        else:
-            image_name = tokens[0]
-        assert image_name not in image_names, 'Image name collision for {}'.format(image_name)
-        image_names.add(image_name)
-        assert im['id'] not in image_id_to_output_image_name
-        image_id_to_output_image_name[im['id']] = image_name
-        dest_image_relative = image_name + tokens[1]
-        output_info['dest_image_relative'] = dest_image_relative
-        dest_txt_relative = image_name + '.txt'
-        output_info['dest_txt_relative'] = dest_txt_relative
-        output_info['bboxes'] = []
-        # assert os.path.isfile(source_image), 'Could not find image {}'.format(source_image)
-        if not os.path.isfile(source_image):
-            print('Warning: could not find image {}'.format(source_image))
-            missing_images.append(im['file_name'])
-            continue
-        image_id = im['id']
-        image_bboxes = []
-        if image_id in image_id_to_annotations:
-            for ann in image_id_to_annotations[image_id]:
-                # If this annotation has no bounding boxes...
-                if 'bbox' not in ann or ann['bbox'] is None or len(ann['bbox']) == 0:
-                    if source_format == 'coco':
-                        if not allow_empty_annotations:
-                            # This is not entirely clear from the COCO spec, but it seems to be consensus
-                            # that if you want to specify an image with no objects, you don't include any
-                            # annotations for that image.
-                            raise ValueError('If an annotation exists, it should have content')
-                        else:
-                            continue
-                    elif source_format == 'coco_camera_traps':
-                        # We allow empty bbox lists in COCO camera traps; this is typically a negative
-                        # example in a dataset that has bounding boxes, and 0 is typically the empty
-                        # category.
-                        if ann['category_id'] != 0:
-                            if not printed_empty_annotation_warning:
-                                printed_empty_annotation_warning = True
-                                print('Warning: non-bbox annotation found with category {}'.format(
-                                    ann['category_id']))
-                        continue
-                    else:
-                        raise ValueError('Unrecognized COCO variant: {}'.format(source_format))
-                # ...if this is an empty annotation
-                coco_bbox = ann['bbox']
-                # This category isn't in our category list.  This typically corresponds to whole sets
-                # of images that were excluded from the YOLO set.
-                if ann['category_id'] in coco_category_ids_to_exclude:
-                    continue
-                yolo_category_id = coco_id_to_yolo_id[ann['category_id']]
-                # COCO: [x_min, y_min, width, height] in absolute coordinates
-                # YOLO: [class, x_center, y_center, width, height] in normalized coordinates
-                # Convert from COCO coordinates to YOLO coordinates
-                img_w = im['width']
-                img_h = im['height']
-                if source_format in ('coco','coco_camera_traps'):
-                    x_min_absolute = coco_bbox[0]
-                    y_min_absolute = coco_bbox[1]
-                    box_w_absolute = coco_bbox[2]
-                    box_h_absolute = coco_bbox[3]
-                    x_center_absolute = (x_min_absolute + (x_min_absolute + box_w_absolute)) / 2
-                    y_center_absolute = (y_min_absolute + (y_min_absolute + box_h_absolute)) / 2
-                    x_center_relative = x_center_absolute / img_w
-                    y_center_relative = y_center_absolute / img_h
-                    box_w_relative = box_w_absolute / img_w
-                    box_h_relative = box_h_absolute / img_h
-                else:
-                    raise ValueError('Unrecognized source format {}'.format(source_format))
-                if clip_boxes:
-                    clipped_box = False
-                    box_right = x_center_relative + (box_w_relative / 2.0)
-                    if box_right > 1.0:
-                        clipped_box = True
-                        overhang = box_right - 1.0
-                        box_w_relative -= overhang
-                        x_center_relative -= (overhang / 2.0)
-                    box_bottom = y_center_relative + (box_h_relative / 2.0)
-                    if box_bottom > 1.0:
-                        clipped_box = True
-                        overhang = box_bottom - 1.0
-                        box_h_relative -= overhang
-                        y_center_relative -= (overhang / 2.0)
-                    box_left = x_center_relative - (box_w_relative / 2.0)
-                    if box_left < 0.0:
-                        clipped_box = True
-                        overhang = abs(box_left)
-                        box_w_relative -= overhang
-                        x_center_relative += (overhang / 2.0)
-                    box_top = y_center_relative - (box_h_relative / 2.0)
-                    if box_top < 0.0:
-                        clipped_box = True
-                        overhang = abs(box_top)
-                        box_h_relative -= overhang
-                        y_center_relative += (overhang / 2.0)
-                    if clipped_box:
-                        n_clipped_boxes += 1
-                yolo_box = [yolo_category_id,
-                            x_center_relative, y_center_relative,
-                            box_w_relative, box_h_relative]
-                image_bboxes.append(yolo_box)
-                n_total_boxes += 1
-            # ...for each annotation
-        # ...if this image has annotations
-        output_info['bboxes'] = image_bboxes
-        images_to_copy.append(output_info)
-    # ...for each image
-    print('\nWriting {} boxes ({} clipped) for {} images'.format(n_total_boxes,
-                                                               n_clipped_boxes,len(images_to_copy)))
-    print('{} missing images (of {})'.format(len(missing_images),len(data['images'])))
-    if images_to_exclude is not None:
-        print('{} excluded images (of {})'.format(len(excluded_images),len(data['images'])))
-    ## Write output
-    print('Generating class list')
-    class_list_filename = os.path.join(output_folder,class_file_name)
-    with open(class_list_filename, 'w') as f:
-        print('Writing class list to {}'.format(class_list_filename))
-        for i_class in range(0,len(yolo_id_to_name)):
-            # Category IDs should range from 0..N-1
-            assert i_class in yolo_id_to_name
-            f.write(yolo_id_to_name[i_class] + '\n')
-    if image_id_to_output_image_json_file is not None:
-        print('Writing image ID mapping to {}'.format(image_id_to_output_image_json_file))
-        with open(image_id_to_output_image_json_file,'w') as f:
-            json.dump(image_id_to_output_image_name,f,indent=1)
-    if (output_folder == input_image_folder) and (not create_image_and_label_folders):
-        print('Creating annotation files (not copying images, input and output folder are the same)')
-    else:
-        print('Copying images and creating annotation files')
-    if create_image_and_label_folders:
-        dest_image_folder = os.path.join(output_folder,'images')
-        dest_txt_folder = os.path.join(output_folder,'labels')
-    else:
-        dest_image_folder = output_folder
-        dest_txt_folder = output_folder
-    source_image_to_dest_image = {}
-    # TODO: parallelize this loop
-    #
-    # output_info = images_to_copy[0]
-    for output_info in tqdm(images_to_copy):
-        source_image = output_info['source_image']
-        dest_image_relative = output_info['dest_image_relative']
-        dest_txt_relative = output_info['dest_txt_relative']
-        dest_image = os.path.join(dest_image_folder,dest_image_relative)
-        dest_txt = os.path.join(dest_txt_folder,dest_txt_relative)
-        source_image_to_dest_image[source_image] = dest_image
-        if write_output:
-            os.makedirs(os.path.dirname(dest_image),exist_ok=True)
-            os.makedirs(os.path.dirname(dest_txt),exist_ok=True)
-            if not create_image_and_label_folders:
-                assert os.path.dirname(dest_image) == os.path.dirname(dest_txt)
-            if (not os.path.isfile(dest_image)) or (overwrite_images):
-                shutil.copyfile(source_image,dest_image)
-            bboxes = output_info['bboxes']
-            # Only write an annotation file if there are bounding boxes.  Images with
-            # no .txt files are treated as hard negatives, at least by YOLOv5:
-            #
-            # https://github.com/ultralytics/yolov5/issues/3218
-            #
-            # I think this is also true for images with empty .txt files, but
-            # I'm using the convention suggested on that issue, i.e. hard
-            # negatives are expressed as images without .txt files.
-            if len(bboxes) > 0:
-                with open(dest_txt,'w') as f:
-                    # bbox = bboxes[0]
-                    for bbox in bboxes:
-                        assert len(bbox) == 5
-                        s = '{} {} {} {} {}'.format(bbox[0],bbox[1],bbox[2],bbox[3],bbox[4])
-                        f.write(s + '\n')
-        # ...if we're actually writing output
-    # ...for each image
-    coco_to_yolo_info = {}
-    coco_to_yolo_info['class_list_filename'] = class_list_filename
-    coco_to_yolo_info['source_image_to_dest_image'] = source_image_to_dest_image
-    coco_to_yolo_info['coco_id_to_yolo_id'] = coco_id_to_yolo_id
-    return coco_to_yolo_info
-# ...def coco_to_yolo(...)
-def create_yolo_symlinks(source_folder,images_folder,labels_folder,
-                         class_list_file=None,
-                         class_list_output_name='object.data',
-                         force_lowercase_image_extension=False):
-    """
-    Given a YOLO-formatted folder of images and .txt files, creates a folder
-    of symlinks to all the images, and a folder of symlinks to all the labels.
-    Used to support preview/editing tools that assume images and labels are in separate
-    folders.
-    :meta private:
-    """
-    assert source_folder != images_folder and source_folder != labels_folder
-    os.makedirs(images_folder,exist_ok=True)
-    os.makedirs(labels_folder,exist_ok=True)
-    image_files_relative = find_images(source_folder,recursive=True,return_relative_paths=True)
-    # image_fn_relative = image_files_relative[0]=
-    for image_fn_relative in tqdm(image_files_relative):
-        source_file_abs = os.path.join(source_folder,image_fn_relative)
-        target_file_abs = os.path.join(images_folder,image_fn_relative)
-        if force_lowercase_image_extension:
-            tokens = os.path.splitext(target_file_abs)
-            target_file_abs = tokens[0] + tokens[1].lower()
-        os.makedirs(os.path.dirname(target_file_abs),exist_ok=True)
-        safe_create_link(source_file_abs,target_file_abs)
-        source_annotation_file_abs = os.path.splitext(source_file_abs)[0] + '.txt'
-        if os.path.isfile(source_annotation_file_abs):
-            target_annotation_file_abs = \
-                os.path.splitext(os.path.join(labels_folder,image_fn_relative))[0] + '.txt'
-            os.makedirs(os.path.dirname(target_annotation_file_abs),exist_ok=True)
-            safe_create_link(source_annotation_file_abs,target_annotation_file_abs)
-    # ...for each image
-    if class_list_file is not None:
-        target_class_list_file = os.path.join(labels_folder,class_list_output_name)
-        safe_create_link(class_list_file,target_class_list_file)
-# ...def create_yolo_symlinks(...)
-#%% Interactive driver
-if False:
-    pass
-    #%% Options
-    input_file = os.path.expanduser('~/data/md-test-coco.json')
-    image_folder = os.path.expanduser('~/data/md-test')
-    output_folder = os.path.expanduser('~/data/md-test-yolo')
-    create_image_and_label_folders=False
-    class_file_name='classes.txt'
-    allow_empty_annotations=False
-    clip_boxes=False
-    image_id_to_output_image_json_file=None
-    images_to_exclude=None
-    path_replacement_char='#'
-    category_names_to_exclude=None
-    #%% Programmatic execution
-    coco_to_yolo_results = coco_to_yolo(image_folder,output_folder,input_file,
-                     source_format='coco',
-                     overwrite_images=False,
-                     create_image_and_label_folders=create_image_and_label_folders,
-                     class_file_name=class_file_name,
-                     allow_empty_annotations=allow_empty_annotations,
-                     clip_boxes=clip_boxes)
-    create_yolo_symlinks(source_folder=output_folder,
-                         images_folder=output_folder + '/images',
-                         labels_folder=output_folder + '/labels',
-                         class_list_file=coco_to_yolo_results['class_list_filename'],
-                         class_list_output_name='object.data',
-                         force_lowercase_image_extension=True)
-    #%% Prepare command-line example
-    s = 'python coco_to_yolo.py {} {} {} --create_bounding_box_editor_symlinks'.format(
-        image_folder,output_folder,input_file)
-    print(s)
-    import clipboard; clipboard.copy(s)
-#%% Command-line driver
-import sys,argparse
-def main():
-    parser = argparse.ArgumentParser(
-        description='Convert COCO-formatted data to YOLO format, flattening the image structure')
-    # input_image_folder,output_folder,input_file
-    parser.add_argument(
-        'input_folder',
-        type=str,
-        help='Path to input images')
-    parser.add_argument(
-        'output_folder',
-        type=str,
-        help='Path to flat, YOLO-formatted dataset')
-    parser.add_argument(
-        'input_file',
-        type=str,
-        help='Path to COCO dataset file (.json)')
-    parser.add_argument(
-        '--create_bounding_box_editor_symlinks',
-        action='store_true',
-        help='Prepare symlinks so the whole folder appears to contain "images" and "labels" folderss')
-    if len(sys.argv[1:]) == 0:
-        parser.print_help()
-        parser.exit()
-    args = parser.parse_args()
-    coco_to_yolo_results = coco_to_yolo(args.input_folder,args.output_folder,args.input_file)
-    if args.create_bounding_box_editor_symlinks:
-        create_yolo_symlinks(source_folder=args.output_folder,
-                             images_folder=args.output_folder + '/images',
-                             labels_folder=args.output_folder + '/labels',
-                             class_list_file=coco_to_yolo_results['class_list_filename'],
-                             class_list_output_name='object.data',
-                             force_lowercase_image_extension=True)
-if __name__ == '__main__':
-    main()

data_management/databases/__init__.py DELETED Viewed

File without changes

data_management/databases/add_width_and_height_to_db.py DELETED Viewed

@@ -1,33 +0,0 @@
-"""
-add_width_and_height_to_db.py
-Grabs width and height from actual image files for a .json database that is missing w/h.
-TODO: this is a one-off script waiting to be cleaned up for more general use.
-"""
-#%% Imports and constants
-import json
-from PIL import Image
-datafile = '/datadrive/snapshotserengeti/databases/snapshotserengeti.json'
-image_base = '/datadrive/snapshotserengeti/images/'
-def main():
-    with open(datafile,'r') as f:
-        data = json.load(f)
-    for im in data['images']:
-        if 'height' not in im:
-            im_w, im_h = Image.open(image_base+im['file_name']).size
-            im['height'] = im_h
-            im['width'] = im_w
-    json.dump(data, open(datafile,'w'))
-if __name__ == '__main__':
-    main()

megadetector 5.0.9__py3-none-any.whl → 5.0.11__py3-none-any.whl

Potentially problematic release.

megadetector 5.0.9py3-none-any.whl → 5.0.11py3-none-any.whl