PyPI - megadetector - Versions diffs - 5.0.28__py3-none-any.whl → 10.0.0__py3-none-any.whl - Mend

megadetector 5.0.28-py3-none-any.whl → 10.0.0-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of megadetector might be problematic. Click here for more details.

Files changed (197) hide show

megadetector/api/batch_processing/integration/digiKam/xmp_integration.py +2 -2
megadetector/api/batch_processing/integration/eMammal/test_scripts/push_annotations_to_emammal.py +1 -1
megadetector/api/batch_processing/integration/eMammal/test_scripts/select_images_for_testing.py +1 -1
megadetector/classification/aggregate_classifier_probs.py +3 -3
megadetector/classification/analyze_failed_images.py +5 -5
megadetector/classification/cache_batchapi_outputs.py +5 -5
megadetector/classification/create_classification_dataset.py +11 -12
megadetector/classification/crop_detections.py +10 -10
megadetector/classification/csv_to_json.py +8 -8
megadetector/classification/detect_and_crop.py +13 -15
megadetector/classification/efficientnet/model.py +8 -8
megadetector/classification/efficientnet/utils.py +6 -5
megadetector/classification/evaluate_model.py +7 -7
megadetector/classification/identify_mislabeled_candidates.py +6 -6
megadetector/classification/json_to_azcopy_list.py +1 -1
megadetector/classification/json_validator.py +29 -32
megadetector/classification/map_classification_categories.py +9 -9
megadetector/classification/merge_classification_detection_output.py +12 -9
megadetector/classification/prepare_classification_script.py +19 -19
megadetector/classification/prepare_classification_script_mc.py +26 -26
megadetector/classification/run_classifier.py +4 -4
megadetector/classification/save_mislabeled.py +6 -6
megadetector/classification/train_classifier.py +1 -1
megadetector/classification/train_classifier_tf.py +9 -9
megadetector/classification/train_utils.py +10 -10
megadetector/data_management/annotations/annotation_constants.py +1 -2
megadetector/data_management/camtrap_dp_to_coco.py +79 -46
megadetector/data_management/cct_json_utils.py +103 -103
megadetector/data_management/cct_to_md.py +49 -49
megadetector/data_management/cct_to_wi.py +33 -33
megadetector/data_management/coco_to_labelme.py +75 -75
megadetector/data_management/coco_to_yolo.py +210 -193
megadetector/data_management/databases/add_width_and_height_to_db.py +86 -12
megadetector/data_management/databases/combine_coco_camera_traps_files.py +40 -40
megadetector/data_management/databases/integrity_check_json_db.py +228 -200
megadetector/data_management/databases/subset_json_db.py +33 -33
megadetector/data_management/generate_crops_from_cct.py +88 -39
megadetector/data_management/get_image_sizes.py +54 -49
megadetector/data_management/labelme_to_coco.py +133 -125
megadetector/data_management/labelme_to_yolo.py +159 -73
megadetector/data_management/lila/create_lila_blank_set.py +81 -83
megadetector/data_management/lila/create_lila_test_set.py +32 -31
megadetector/data_management/lila/create_links_to_md_results_files.py +18 -18
megadetector/data_management/lila/download_lila_subset.py +21 -24
megadetector/data_management/lila/generate_lila_per_image_labels.py +365 -107
megadetector/data_management/lila/get_lila_annotation_counts.py +35 -33
megadetector/data_management/lila/get_lila_image_counts.py +22 -22
megadetector/data_management/lila/lila_common.py +73 -70
megadetector/data_management/lila/test_lila_metadata_urls.py +28 -19
megadetector/data_management/mewc_to_md.py +344 -340
megadetector/data_management/ocr_tools.py +262 -255
megadetector/data_management/read_exif.py +249 -227
megadetector/data_management/remap_coco_categories.py +90 -28
megadetector/data_management/remove_exif.py +81 -21
megadetector/data_management/rename_images.py +187 -187
megadetector/data_management/resize_coco_dataset.py +588 -120
megadetector/data_management/speciesnet_to_md.py +41 -41
megadetector/data_management/wi_download_csv_to_coco.py +55 -55
megadetector/data_management/yolo_output_to_md_output.py +248 -122
megadetector/data_management/yolo_to_coco.py +333 -191
megadetector/detection/change_detection.py +832 -0
megadetector/detection/process_video.py +340 -337
megadetector/detection/pytorch_detector.py +358 -278
megadetector/detection/run_detector.py +399 -186
megadetector/detection/run_detector_batch.py +404 -377
megadetector/detection/run_inference_with_yolov5_val.py +340 -327
megadetector/detection/run_tiled_inference.py +257 -249
megadetector/detection/tf_detector.py +24 -24
megadetector/detection/video_utils.py +332 -295
megadetector/postprocessing/add_max_conf.py +19 -11
megadetector/postprocessing/categorize_detections_by_size.py +45 -45
megadetector/postprocessing/classification_postprocessing.py +468 -433
megadetector/postprocessing/combine_batch_outputs.py +23 -23
megadetector/postprocessing/compare_batch_results.py +590 -525
megadetector/postprocessing/convert_output_format.py +106 -102
megadetector/postprocessing/create_crop_folder.py +347 -147
megadetector/postprocessing/detector_calibration.py +173 -168
megadetector/postprocessing/generate_csv_report.py +508 -499
megadetector/postprocessing/load_api_results.py +48 -27
megadetector/postprocessing/md_to_coco.py +133 -102
megadetector/postprocessing/md_to_labelme.py +107 -90
megadetector/postprocessing/md_to_wi.py +40 -40
megadetector/postprocessing/merge_detections.py +92 -114
megadetector/postprocessing/postprocess_batch_results.py +319 -301
megadetector/postprocessing/remap_detection_categories.py +91 -38
megadetector/postprocessing/render_detection_confusion_matrix.py +214 -205
megadetector/postprocessing/repeat_detection_elimination/find_repeat_detections.py +57 -57
megadetector/postprocessing/repeat_detection_elimination/remove_repeat_detections.py +27 -28
megadetector/postprocessing/repeat_detection_elimination/repeat_detections_core.py +704 -679
megadetector/postprocessing/separate_detections_into_folders.py +226 -211
megadetector/postprocessing/subset_json_detector_output.py +265 -262
megadetector/postprocessing/top_folders_to_bottom.py +45 -45
megadetector/postprocessing/validate_batch_results.py +70 -70
megadetector/taxonomy_mapping/map_lila_taxonomy_to_wi_taxonomy.py +52 -52
megadetector/taxonomy_mapping/map_new_lila_datasets.py +18 -19
megadetector/taxonomy_mapping/prepare_lila_taxonomy_release.py +54 -33
megadetector/taxonomy_mapping/preview_lila_taxonomy.py +67 -67
megadetector/taxonomy_mapping/retrieve_sample_image.py +16 -16
megadetector/taxonomy_mapping/simple_image_download.py +8 -8
megadetector/taxonomy_mapping/species_lookup.py +156 -74
megadetector/taxonomy_mapping/taxonomy_csv_checker.py +14 -14
megadetector/taxonomy_mapping/taxonomy_graph.py +10 -10
megadetector/taxonomy_mapping/validate_lila_category_mappings.py +13 -13
megadetector/utils/ct_utils.py +1049 -211
megadetector/utils/directory_listing.py +21 -77
megadetector/utils/gpu_test.py +22 -22
megadetector/utils/md_tests.py +632 -529
megadetector/utils/path_utils.py +1520 -431
megadetector/utils/process_utils.py +41 -41
megadetector/utils/split_locations_into_train_val.py +62 -62
megadetector/utils/string_utils.py +148 -27
megadetector/utils/url_utils.py +489 -176
megadetector/utils/wi_utils.py +2658 -2526
megadetector/utils/write_html_image_list.py +137 -137
megadetector/visualization/plot_utils.py +34 -30
megadetector/visualization/render_images_with_thumbnails.py +39 -74
megadetector/visualization/visualization_utils.py +487 -435
megadetector/visualization/visualize_db.py +232 -198
megadetector/visualization/visualize_detector_output.py +82 -76
{megadetector-5.0.28.dist-info → megadetector-10.0.0.dist-info}/METADATA +5 -2
megadetector-10.0.0.dist-info/RECORD +139 -0
{megadetector-5.0.28.dist-info → megadetector-10.0.0.dist-info}/WHEEL +1 -1
megadetector/api/batch_processing/api_core/__init__.py +0 -0
megadetector/api/batch_processing/api_core/batch_service/__init__.py +0 -0
megadetector/api/batch_processing/api_core/batch_service/score.py +0 -439
megadetector/api/batch_processing/api_core/server.py +0 -294
megadetector/api/batch_processing/api_core/server_api_config.py +0 -97
megadetector/api/batch_processing/api_core/server_app_config.py +0 -55
megadetector/api/batch_processing/api_core/server_batch_job_manager.py +0 -220
megadetector/api/batch_processing/api_core/server_job_status_table.py +0 -149
megadetector/api/batch_processing/api_core/server_orchestration.py +0 -360
megadetector/api/batch_processing/api_core/server_utils.py +0 -88
megadetector/api/batch_processing/api_core_support/__init__.py +0 -0
megadetector/api/batch_processing/api_core_support/aggregate_results_manually.py +0 -46
megadetector/api/batch_processing/api_support/__init__.py +0 -0
megadetector/api/batch_processing/api_support/summarize_daily_activity.py +0 -152
megadetector/api/batch_processing/data_preparation/__init__.py +0 -0
megadetector/api/synchronous/__init__.py +0 -0
megadetector/api/synchronous/api_core/animal_detection_api/__init__.py +0 -0
megadetector/api/synchronous/api_core/animal_detection_api/api_backend.py +0 -151
megadetector/api/synchronous/api_core/animal_detection_api/api_frontend.py +0 -263
megadetector/api/synchronous/api_core/animal_detection_api/config.py +0 -35
megadetector/api/synchronous/api_core/tests/__init__.py +0 -0
megadetector/api/synchronous/api_core/tests/load_test.py +0 -110
megadetector/data_management/importers/add_nacti_sizes.py +0 -52
megadetector/data_management/importers/add_timestamps_to_icct.py +0 -79
megadetector/data_management/importers/animl_results_to_md_results.py +0 -158
megadetector/data_management/importers/auckland_doc_test_to_json.py +0 -373
megadetector/data_management/importers/auckland_doc_to_json.py +0 -201
megadetector/data_management/importers/awc_to_json.py +0 -191
megadetector/data_management/importers/bellevue_to_json.py +0 -272
megadetector/data_management/importers/cacophony-thermal-importer.py +0 -793
megadetector/data_management/importers/carrizo_shrubfree_2018.py +0 -269
megadetector/data_management/importers/carrizo_trail_cam_2017.py +0 -289
megadetector/data_management/importers/cct_field_adjustments.py +0 -58
megadetector/data_management/importers/channel_islands_to_cct.py +0 -913
megadetector/data_management/importers/eMammal/copy_and_unzip_emammal.py +0 -180
megadetector/data_management/importers/eMammal/eMammal_helpers.py +0 -249
megadetector/data_management/importers/eMammal/make_eMammal_json.py +0 -223
megadetector/data_management/importers/ena24_to_json.py +0 -276
megadetector/data_management/importers/filenames_to_json.py +0 -386
megadetector/data_management/importers/helena_to_cct.py +0 -283
megadetector/data_management/importers/idaho-camera-traps.py +0 -1407
megadetector/data_management/importers/idfg_iwildcam_lila_prep.py +0 -294
megadetector/data_management/importers/import_desert_lion_conservation_camera_traps.py +0 -387
megadetector/data_management/importers/jb_csv_to_json.py +0 -150
megadetector/data_management/importers/mcgill_to_json.py +0 -250
megadetector/data_management/importers/missouri_to_json.py +0 -490
megadetector/data_management/importers/nacti_fieldname_adjustments.py +0 -79
megadetector/data_management/importers/noaa_seals_2019.py +0 -181
megadetector/data_management/importers/osu-small-animals-to-json.py +0 -364
megadetector/data_management/importers/pc_to_json.py +0 -365
megadetector/data_management/importers/plot_wni_giraffes.py +0 -123
megadetector/data_management/importers/prepare_zsl_imerit.py +0 -131
megadetector/data_management/importers/raic_csv_to_md_results.py +0 -416
megadetector/data_management/importers/rspb_to_json.py +0 -356
megadetector/data_management/importers/save_the_elephants_survey_A.py +0 -320
megadetector/data_management/importers/save_the_elephants_survey_B.py +0 -329
megadetector/data_management/importers/snapshot_safari_importer.py +0 -758
megadetector/data_management/importers/snapshot_serengeti_lila.py +0 -1067
megadetector/data_management/importers/snapshotserengeti/make_full_SS_json.py +0 -150
megadetector/data_management/importers/snapshotserengeti/make_per_season_SS_json.py +0 -153
megadetector/data_management/importers/sulross_get_exif.py +0 -65
megadetector/data_management/importers/timelapse_csv_set_to_json.py +0 -490
megadetector/data_management/importers/ubc_to_json.py +0 -399
megadetector/data_management/importers/umn_to_json.py +0 -507
megadetector/data_management/importers/wellington_to_json.py +0 -263
megadetector/data_management/importers/wi_to_json.py +0 -442
megadetector/data_management/importers/zamba_results_to_md_results.py +0 -180
megadetector/data_management/lila/add_locations_to_island_camera_traps.py +0 -101
megadetector/data_management/lila/add_locations_to_nacti.py +0 -151
megadetector/utils/azure_utils.py +0 -178
megadetector/utils/sas_blob_utils.py +0 -509
megadetector-5.0.28.dist-info/RECORD +0 -209
/megadetector/{api/batch_processing/__init__.py → __init__.py} +0 -0
{megadetector-5.0.28.dist-info → megadetector-10.0.0.dist-info}/licenses/LICENSE +0 -0
{megadetector-5.0.28.dist-info → megadetector-10.0.0.dist-info}/top_level.txt +0 -0

megadetector/data_management/coco_to_yolo.py CHANGED Viewed

@@ -8,7 +8,7 @@ the dataset (to a single folder) in the process.
 If the input and output folders are the same, writes .txt files to the input folder,
 and neither moves nor modifies images.
-Currently ignores segmentation masks, and errors if an annotation has a
+Currently ignores segmentation masks, and errors if an annotation has a
 segmentation polygon but no bbox.
 Has only been tested on a handful of COCO Camera Traps data sets; if you
@@ -21,6 +21,8 @@ use it for more general COCO conversion, YMMV.
 import json
 import os
 import shutil
+import sys
+import argparse
 from collections import defaultdict
 from tqdm import tqdm
@@ -38,34 +40,40 @@ def write_yolo_dataset_file(yolo_dataset_file,
                             test_folder_relative=None):
     """
     Write a YOLOv5 dataset.yaml file to the absolute path [yolo_dataset_file] (should
-    have a .yaml extension, though it's only a warning if it doesn't).
+    have a .yaml extension, though it's only a warning if it doesn't).
     Args:
-        yolo_dataset_file (str): the file, typically ending in .yaml or .yml, to write.
+        yolo_dataset_file (str): the file, typically ending in .yaml or .yml, to write.
             Does not have to be within dataset_base_dir.
         dataset_base_dir (str): the absolute base path of the YOLO dataset
-        class_list (list or str): an ordered list of class names (the first item will be class 0,
-            etc.), or the name of a text file containing an ordered list of class names (one per
+        class_list (list or str): an ordered list of class names (the first item will be class 0,
+            etc.), or the name of a text file containing an ordered list of class names (one per
             line, starting from class zero).
-        train_folder_relative (str, optional): train folder name, used only to populate dataset.yaml
-        val_folder_relative (str, optional): val folder name, used only to populate dataset.yaml
-        test_folder_relative (str, optional): test folder name, used only to populate dataset.yaml
+        train_folder_relative (str, optional): train folder name, used only to
+            populate dataset.yaml.  Can also be a filename (e.g. a .txt file with image
+            files).
+        val_folder_relative (str, optional): val folder name, used only to
+            populate dataset.yaml.  Can also be a filename (e.g. a .txt file with image
+            files).
+        test_folder_relative (str, optional): test folder name, used only to
+            populate dataset.yaml.  Can also be a filename (e.g. a .txt file with image
+            files).
     """
     # Read class names
     if isinstance(class_list,str):
         with open(class_list,'r') as f:
             class_lines = f.readlines()
-        class_lines = [s.strip() for s in class_lines]
+        class_lines = [s.strip() for s in class_lines]
         class_list = [s for s in class_lines if len(s) > 0]
     if not (yolo_dataset_file.endswith('.yml') or yolo_dataset_file.endswith('.yaml')):
         print('Warning: writing dataset file to a non-yml/yaml extension:\n{}'.format(
             yolo_dataset_file))
     # Write dataset.yaml
     with open(yolo_dataset_file,'w') as f:
         f.write('# Train/val sets\n')
         f.write('path: {}\n'.format(dataset_base_dir))
         if train_folder_relative is not None:
@@ -74,9 +82,9 @@ def write_yolo_dataset_file(yolo_dataset_file,
             f.write('val: {}\n'.format(val_folder_relative))
         if test_folder_relative is not None:
             f.write('val: {}\n'.format(test_folder_relative))
         f.write('\n')
         f.write('# Classes\n')
         f.write('names:\n')
         for i_class,class_name in enumerate(class_list):
@@ -84,7 +92,7 @@ def write_yolo_dataset_file(yolo_dataset_file,
 # ...def write_yolo_dataset_file(...)
 def coco_to_yolo(input_image_folder,
                  output_folder,
                  input_file,
@@ -102,15 +110,15 @@ def coco_to_yolo(input_image_folder,
                  write_output=True,
                  flatten_paths=False):
     """
-    Converts a COCO-formatted dataset to a YOLO-formatted dataset, optionally flattening the
+    Converts a COCO-formatted dataset to a YOLO-formatted dataset, optionally flattening the
     dataset to a single folder in the process.
     If the input and output folders are the same, writes .txt files to the input folder,
     and neither moves nor modifies images.
-    Currently ignores segmentation masks, and errors if an annotation has a
+    Currently ignores segmentation masks, and errors if an annotation has a
     segmentation polygon but no bbox.
     Args:
         input_image_folder (str): the folder where images live; filenames in the COCO .json
             file [input_file] should be relative to this folder
@@ -119,88 +127,88 @@ def coco_to_yolo(input_image_folder,
             images are left alone.
         source_format (str, optional): can be 'coco' (default) or 'coco_camera_traps'.  The only difference
             is that when source_format is 'coco_camera_traps', we treat an image with a non-bbox
-            annotation as a special case, i.e. that's how an empty image is indicated.  The original
-            COCO standard is a little ambiguous on this issue.  If source_format is 'coco', we
+            annotation as a special case, i.e. that's how an empty image is indicated.  The original
+            COCO standard is a little ambiguous on this issue.  If source_format is 'coco', we
             either treat images as empty or error, depending on the value of [allow_empty_annotations].
             [allow_empty_annotations] has no effect if source_format is 'coco_camera_traps'.
         overwrite_images (bool, optional): over-write images in the output folder if they exist
-        create_image_and_label_folder (bool, optional): whether to create separate folders called 'images' and
-            'labels' in the YOLO output folder.  If create_image_and_label_folders is False,
-            a/b/c/image001.jpg will become a#b#c#image001.jpg, and the corresponding text file will
-            be a#b#c#image001.txt.  If create_image_and_label_folders is True, a/b/c/image001.jpg will become
-            images/a#b#c#image001.jpg, and the corresponding text file will be
-            labels/a#b#c#image001.txt.
-        class_file_name (str, optional): .txt file (relative to the output folder) that we should
+        create_image_and_label_folders (bool, optional): whether to create separate folders called 'images' and
+            'labels' in the YOLO output folder.  If create_image_and_label_folders is False,
+            a/b/c/image001.jpg will become a#b#c#image001.jpg, and the corresponding text file will
+            be a#b#c#image001.txt.  If create_image_and_label_folders is True, a/b/c/image001.jpg will become
+            images/a#b#c#image001.jpg, and the corresponding text file will be
+            labels/a#b#c#image001.txt.
+        class_file_name (str, optional): .txt file (relative to the output folder) that we should
             populate with a list of classes (or None to omit)
-        allow_empty_annotations (bool, optional): if this is False and [source_format] is 'coco',
+        allow_empty_annotations (bool, optional): if this is False and [source_format] is 'coco',
             we'll error on annotations that have no 'bbox' field
         clip_boxes (bool, optional): whether to clip bounding box coordinates to the range [0,1] before
             converting to YOLO xywh format
         image_id_to_output_image_json_file (str, optional): an optional *output* file, to which we will write
             a mapping from image IDs to output file names
-        images_to_exclude (list, optional): a list of image files (relative paths in the input folder) that we
+        images_to_exclude (list, optional): a list of image files (relative paths in the input folder) that we
             should ignore
         path_replacement_char (str, optional): only relevant if [flatten_paths] is True; this is used to replace
             path separators, e.g. if [path_replacement_char] is '#' and [flatten_paths] is True, a/b/c/d.jpg
             becomes a#b#c#d.jpg
         category_names_to_exclude (str, optional): category names that should not be represented in the
             YOLO output; only impacts annotations, does not prevent copying images.  There's almost no reason
-            you would want to specify this and [category_names_to_include].
-        category_names_to_include (str, optional): allow-list of category names that should be represented
-            in the YOLO output; only impacts annotations, does not prevent copying images.  There's almost
-            no reason you would want to specify this and [category_names_to_exclude].
+            you would want to specify this and [category_names_to_include].
+        category_names_to_include (str, optional): allow-list of category names that should be represented
+            in the YOLO output; only impacts annotations, does not prevent copying images.  There's almost
+            no reason you would want to specify this and [category_names_to_exclude].
         write_output (bool, optional): determines whether we actually copy images and write annotations;
             setting this to False mostly puts this function in "dry run" "mode.  The class list
             file is written regardless of the value of write_output.
         flatten_paths (bool, optional): replace /'s in image filenames with [path_replacement_char],
             which ensures that the output folder is a single flat folder.
     Returns:
         dict: information about the coco --> yolo mapping, containing at least the fields:
-        - class_list_filename: the filename to which we wrote the flat list of class names required
+        - class_list_filename: the filename to which we wrote the flat list of class names required
           by the YOLO format.
         - source_image_to_dest_image: a dict mapping source images to destination images
-        - coco_id_to_yolo_id: a dict mapping COCO category IDs to YOLO category IDs
+        - coco_id_to_yolo_id: a dict mapping COCO category IDs to YOLO category IDs
     """
     ## Validate input
     if category_names_to_include is not None and category_names_to_exclude is not None:
         raise ValueError('category_names_to_include and category_names_to_exclude are mutually exclusive')
     if output_folder is None:
         output_folder = input_image_folder
     if images_to_exclude is not None:
         images_to_exclude = set(images_to_exclude)
     if category_names_to_exclude is None:
         category_names_to_exclude = {}
     assert os.path.isdir(input_image_folder)
     assert os.path.isfile(input_file)
     os.makedirs(output_folder,exist_ok=True)
     if (output_folder == input_image_folder) and (overwrite_images) and \
         (not create_image_and_label_folders) and (not flatten_paths):
             print('Warning: output folder and input folder are the same, disabling overwrite_images')
             overwrite_images = False
     ## Read input data
     with open(input_file,'r') as f:
         data = json.load(f)
     ## Parse annotations
     image_id_to_annotations = defaultdict(list)
     # i_ann = 0; ann = data['annotations'][0]
     for i_ann,ann in enumerate(data['annotations']):
-        # Make sure no annotations have *only* segmentation data
+        # Make sure no annotations have *only* segmentation data
         if ( \
             ('segmentation' in ann.keys()) and \
             (ann['segmentation'] is not None) and \
@@ -209,21 +217,21 @@ def coco_to_yolo(input_image_folder,
             (('bbox' not in ann.keys()) or (ann['bbox'] is None) or (len(ann['bbox'])==0)):
                 raise ValueError('Oops: segmentation data present without bbox information, ' + \
                                  'this script isn\'t ready for this dataset')
         image_id_to_annotations[ann['image_id']].append(ann)
     print('Parsed annotations for {} images'.format(len(image_id_to_annotations)))
     # Re-map class IDs to make sure they run from 0...n-classes-1
     #
     # Note: this allows unused categories in the output data set.  This is OK for
     # some training pipelines, not for others.
     next_category_id = 0
-    coco_id_to_yolo_id = {}
+    coco_id_to_yolo_id = {}
     coco_id_to_name = {}
     yolo_id_to_name = {}
     coco_category_ids_to_exclude = set()
     for category in data['categories']:
         coco_id_to_name[category['id']] = category['name']
         if (category_names_to_include is not None) and \
@@ -232,86 +240,86 @@ def coco_to_yolo(input_image_folder,
             continue
         elif (category['name'] in category_names_to_exclude):
             coco_category_ids_to_exclude.add(category['id'])
-            continue
+            continue
         assert category['id'] not in coco_id_to_yolo_id
         coco_id_to_yolo_id[category['id']] = next_category_id
         yolo_id_to_name[next_category_id] = category['name']
         next_category_id += 1
     ## Process images (everything but I/O)
     # List of dictionaries with keys 'source_image','dest_image','bboxes','dest_txt'
     images_to_copy = []
     missing_images = []
     excluded_images = []
     image_names = set()
     typical_image_extensions = set(['.jpg','.jpeg','.png','.gif','.tif','.bmp'])
     printed_empty_annotation_warning = False
     image_id_to_output_image_name = {}
     print('Processing annotations')
     n_clipped_boxes = 0
     n_total_boxes = 0
     # i_image = 0; im = data['images'][i_image]
     for i_image,im in tqdm(enumerate(data['images']),total=len(data['images'])):
         output_info = {}
-        source_image = os.path.join(input_image_folder,im['file_name'])
+        source_image = os.path.join(input_image_folder,im['file_name'])
         output_info['source_image'] = source_image
         if images_to_exclude is not None and im['file_name'] in images_to_exclude:
             excluded_images.append(im['file_name'])
             continue
         tokens = os.path.splitext(im['file_name'])
         if tokens[1].lower() not in typical_image_extensions:
             print('Warning: unusual image file name {}'.format(im['file_name']))
         if flatten_paths:
             image_name = tokens[0].replace('\\','/').replace('/',path_replacement_char) + \
-                '_' + str(i_image).zfill(6)
+                '_' + str(i_image).zfill(6)
         else:
             image_name = tokens[0]
         assert image_name not in image_names, 'Image name collision for {}'.format(image_name)
         image_names.add(image_name)
         assert im['id'] not in image_id_to_output_image_name
         image_id_to_output_image_name[im['id']] = image_name
         dest_image_relative = image_name + tokens[1]
         output_info['dest_image_relative'] = dest_image_relative
         dest_txt_relative = image_name + '.txt'
         output_info['dest_txt_relative'] = dest_txt_relative
         output_info['bboxes'] = []
         # assert os.path.isfile(source_image), 'Could not find image {}'.format(source_image)
         if not os.path.isfile(source_image):
             print('Warning: could not find image {}'.format(source_image))
             missing_images.append(im['file_name'])
             continue
         image_id = im['id']
         image_bboxes = []
         if image_id in image_id_to_annotations:
             for ann in image_id_to_annotations[image_id]:
                 # If this annotation has no bounding boxes...
                 if 'bbox' not in ann or ann['bbox'] is None or len(ann['bbox']) == 0:
                     if source_format == 'coco':
                         if not allow_empty_annotations:
                             # This is not entirely clear from the COCO spec, but it seems to be consensus
                             # that if you want to specify an image with no objects, you don't include any
@@ -319,11 +327,11 @@ def coco_to_yolo(input_image_folder,
                             raise ValueError('If an annotation exists, it should have content')
                         else:
                             continue
                     elif source_format == 'coco_camera_traps':
-                        # We allow empty bbox lists in COCO camera traps files; this is typically a
-                        # negative example in a dataset that has bounding boxes, and 0 is typically
+                        # We allow empty bbox lists in COCO camera traps files; this is typically a
+                        # negative example in a dataset that has bounding boxes, and 0 is typically
                         # the empty category, which is typically 0.
                         if ann['category_id'] != 0:
                             if not printed_empty_annotation_warning:
@@ -331,113 +339,113 @@ def coco_to_yolo(input_image_folder,
                                 print('Warning: non-bbox annotation found with category {}'.format(
                                     ann['category_id']))
                         continue
                     else:
                         raise ValueError('Unrecognized COCO variant: {}'.format(source_format))
                 # ...if this is an empty annotation
                 coco_bbox = ann['bbox']
                 # This category isn't in our category list.  This typically corresponds to whole sets
                 # of images that were excluded from the YOLO set.
                 if ann['category_id'] in coco_category_ids_to_exclude:
                     continue
                 yolo_category_id = coco_id_to_yolo_id[ann['category_id']]
                 # COCO: [x_min, y_min, width, height] in absolute coordinates
                 # YOLO: [class, x_center, y_center, width, height] in normalized coordinates
                 # Convert from COCO coordinates to YOLO coordinates
                 img_w = im['width']
                 img_h = im['height']
                 if source_format in ('coco','coco_camera_traps'):
                     x_min_absolute = coco_bbox[0]
                     y_min_absolute = coco_bbox[1]
                     box_w_absolute = coco_bbox[2]
                     box_h_absolute = coco_bbox[3]
                     x_center_absolute = (x_min_absolute + (x_min_absolute + box_w_absolute)) / 2
                     y_center_absolute = (y_min_absolute + (y_min_absolute + box_h_absolute)) / 2
                     x_center_relative = x_center_absolute / img_w
                     y_center_relative = y_center_absolute / img_h
                     box_w_relative = box_w_absolute / img_w
                     box_h_relative = box_h_absolute / img_h
                 else:
                     raise ValueError('Unrecognized source format {}'.format(source_format))
                 if clip_boxes:
                     clipped_box = False
-                    box_right = x_center_relative + (box_w_relative / 2.0)
+                    box_right = x_center_relative + (box_w_relative / 2.0)
                     if box_right > 1.0:
                         clipped_box = True
                         overhang = box_right - 1.0
                         box_w_relative -= overhang
                         x_center_relative -= (overhang / 2.0)
-                    box_bottom = y_center_relative + (box_h_relative / 2.0)
+                    box_bottom = y_center_relative + (box_h_relative / 2.0)
                     if box_bottom > 1.0:
                         clipped_box = True
                         overhang = box_bottom - 1.0
                         box_h_relative -= overhang
                         y_center_relative -= (overhang / 2.0)
                     box_left = x_center_relative - (box_w_relative / 2.0)
                     if box_left < 0.0:
                         clipped_box = True
                         overhang = abs(box_left)
                         box_w_relative -= overhang
                         x_center_relative += (overhang / 2.0)
                     box_top = y_center_relative - (box_h_relative / 2.0)
                     if box_top < 0.0:
                         clipped_box = True
                         overhang = abs(box_top)
                         box_h_relative -= overhang
                         y_center_relative += (overhang / 2.0)
                     if clipped_box:
                         n_clipped_boxes += 1
                 yolo_box = [yolo_category_id,
-                            x_center_relative, y_center_relative,
+                            x_center_relative, y_center_relative,
                             box_w_relative, box_h_relative]
                 image_bboxes.append(yolo_box)
                 n_total_boxes += 1
-            # ...for each annotation
+            # ...for each annotation
         # ...if this image has annotations
         output_info['bboxes'] = image_bboxes
-        images_to_copy.append(output_info)
+        images_to_copy.append(output_info)
     # ...for each image
     print('\nWriting {} boxes ({} clipped) for {} images'.format(n_total_boxes,
                                                                n_clipped_boxes,len(images_to_copy)))
     print('{} missing images (of {})'.format(len(missing_images),len(data['images'])))
     if images_to_exclude is not None:
         print('{} excluded images (of {})'.format(len(excluded_images),len(data['images'])))
     ## Write output
     print('Generating class list')
     if class_file_name is not None:
         class_list_filename = os.path.join(output_folder,class_file_name)
         with open(class_list_filename, 'w') as f:
@@ -446,12 +454,12 @@ def coco_to_yolo(input_image_folder,
                 # Category IDs should range from 0..N-1
                 assert i_class in yolo_id_to_name
                 f.write(yolo_id_to_name[i_class] + '\n')
     if image_id_to_output_image_json_file is not None:
         print('Writing image ID mapping to {}'.format(image_id_to_output_image_json_file))
         with open(image_id_to_output_image_json_file,'w') as f:
             json.dump(image_id_to_output_image_name,f,indent=1)
     if (output_folder == input_image_folder) and (not create_image_and_label_folders):
         print('Creating annotation files (not copying images, input and output folder are the same)')
@@ -464,12 +472,12 @@ def coco_to_yolo(input_image_folder,
     else:
         dest_image_folder = output_folder
         dest_txt_folder = output_folder
     source_image_to_dest_image = {}
     label_files_written = []
     n_boxes_written = 0
     # TODO: parallelize this loop
     #
     # output_info = images_to_copy[0]
@@ -478,96 +486,107 @@ def coco_to_yolo(input_image_folder,
         source_image = output_info['source_image']
         dest_image_relative = output_info['dest_image_relative']
         dest_txt_relative = output_info['dest_txt_relative']
         dest_image = os.path.join(dest_image_folder,dest_image_relative)
         dest_txt = os.path.join(dest_txt_folder,dest_txt_relative)
         source_image_to_dest_image[source_image] = dest_image
         # Copy the image if necessary
         if write_output:
-            os.makedirs(os.path.dirname(dest_image),exist_ok=True)
+            os.makedirs(os.path.dirname(dest_image),exist_ok=True)
             os.makedirs(os.path.dirname(dest_txt),exist_ok=True)
             if not create_image_and_label_folders:
                 assert os.path.dirname(dest_image) == os.path.dirname(dest_txt)
             if (not os.path.isfile(dest_image)) or (overwrite_images):
                 shutil.copyfile(source_image,dest_image)
-        bboxes = output_info['bboxes']
+        bboxes = output_info['bboxes']
         # Write the annotation file if necessary
         #
-        # Only write an annotation file if there are bounding boxes.  Images with
+        # Only write an annotation file if there are bounding boxes.  Images with
         # no .txt files are treated as hard negatives, at least by YOLOv5:
         #
         # https://github.com/ultralytics/yolov5/issues/3218
         #
-        # I think this is also true for images with empty .txt files, but
-        # I'm using the convention suggested on that issue, i.e. hard
+        # I think this is also true for images with empty .txt files, but
+        # I'm using the convention suggested on that issue, i.e. hard
         # negatives are expressed as images without .txt files.
         if len(bboxes) > 0:
             n_boxes_written += len(bboxes)
             label_files_written.append(dest_txt)
             if write_output:
                 with open(dest_txt,'w') as f:
                     # bbox = bboxes[0]
                     for bbox in bboxes:
                         assert len(bbox) == 5
                         s = '{} {} {} {} {}'.format(bbox[0],bbox[1],bbox[2],bbox[3],bbox[4])
                         f.write(s + '\n')
     # ...for each image
     coco_to_yolo_info = {}
     coco_to_yolo_info['class_list_filename'] = class_list_filename
     coco_to_yolo_info['source_image_to_dest_image'] = source_image_to_dest_image
     coco_to_yolo_info['coco_id_to_yolo_id'] = coco_id_to_yolo_id
     coco_to_yolo_info['label_files_written'] = label_files_written
     coco_to_yolo_info['n_boxes_written'] = n_boxes_written
     return coco_to_yolo_info
 # ...def coco_to_yolo(...)
-def create_yolo_symlinks(source_folder,images_folder,labels_folder,
+def create_yolo_symlinks(source_folder,
+                         images_folder,
+                         labels_folder,
                          class_list_file=None,
                          class_list_output_name='object.data',
                          force_lowercase_image_extension=False):
     """
     Given a YOLO-formatted folder of images and .txt files, creates a folder
-    of symlinks to all the images, and a folder of symlinks to all the labels.
-    Used to support preview/editing tools that assume images and labels are in separate
+    of symlinks to all the images, and a folder of symlinks to all the labels.
+    Used to support preview/editing tools that assume images and labels are in separate
     folders.
+    Args:
+        source_folder (str): input folder
+        images_folder (str): output folder with links to images
+        labels_folder (str): output folder with links to labels
+        class_list_file (str, optional): list to classes.txt file
+        class_list_output_name (str, optional): output file to write with class information
+        force_lowercase_image_extension (bool, False): create symlinks with, e.g., .jpg, even
+            if the input image is, e.g., .JPG
     :meta private:
-    """
+    """
     assert source_folder != images_folder and source_folder != labels_folder
     os.makedirs(images_folder,exist_ok=True)
     os.makedirs(labels_folder,exist_ok=True)
     image_files_relative = find_images(source_folder,recursive=True,return_relative_paths=True)
-    # image_fn_relative = image_files_relative[0]=
+    # image_fn_relative = image_files_relative[0]=
     for image_fn_relative in tqdm(image_files_relative):
         source_file_abs = os.path.join(source_folder,image_fn_relative)
         target_file_abs = os.path.join(images_folder,image_fn_relative)
         if force_lowercase_image_extension:
             tokens = os.path.splitext(target_file_abs)
             target_file_abs = tokens[0] + tokens[1].lower()
         os.makedirs(os.path.dirname(target_file_abs),exist_ok=True)
         safe_create_link(source_file_abs,target_file_abs)
         source_annotation_file_abs = os.path.splitext(source_file_abs)[0] + '.txt'
@@ -577,7 +596,7 @@ def create_yolo_symlinks(source_folder,images_folder,labels_folder,
             os.makedirs(os.path.dirname(target_annotation_file_abs),exist_ok=True)
             safe_create_link(source_annotation_file_abs,target_annotation_file_abs)
-    # ...for each image
+    # ...for each image
     if class_list_file is not None:
         target_class_list_file = os.path.join(labels_folder,class_list_output_name)
@@ -589,14 +608,14 @@ def create_yolo_symlinks(source_folder,images_folder,labels_folder,
 #%% Interactive driver
 if False:
     pass
     #%% Options
     input_file = os.path.expanduser('~/data/md-test-coco.json')
-    image_folder = os.path.expanduser('~/data/md-test')
-    output_folder = os.path.expanduser('~/data/md-test-yolo')
+    image_folder = os.path.expanduser('~/data/md-test')
+    output_folder = os.path.expanduser('~/data/md-test-yolo')
     create_image_and_label_folders=False
     class_file_name='classes.txt'
     allow_empty_annotations=False
@@ -605,18 +624,18 @@ if False:
     images_to_exclude=None
     path_replacement_char='#'
     category_names_to_exclude=None
     #%% Programmatic execution
     coco_to_yolo_results = coco_to_yolo(image_folder,output_folder,input_file,
                      source_format='coco',
                      overwrite_images=False,
                      create_image_and_label_folders=create_image_and_label_folders,
                      class_file_name=class_file_name,
                      allow_empty_annotations=allow_empty_annotations,
-                     clip_boxes=clip_boxes)
+                     clip_boxes=clip_boxes)
     create_yolo_symlinks(source_folder=output_folder,
                          images_folder=output_folder + '/images',
                          labels_folder=output_folder + '/labels',
@@ -630,40 +649,38 @@ if False:
     s = 'python coco_to_yolo.py {} {} {} --create_bounding_box_editor_symlinks'.format(
         image_folder,output_folder,input_file)
     print(s)
-    import clipboard; clipboard.copy(s)
+    import clipboard; clipboard.copy(s)
 #%% Command-line driver
-import sys,argparse
-def main():
+def main(): # noqa
     parser = argparse.ArgumentParser(
         description='Convert COCO-formatted data to YOLO format, flattening the image structure')
     # input_image_folder,output_folder,input_file
     parser.add_argument(
         'input_folder',
         type=str,
         help='Path to input images')
     parser.add_argument(
         'output_folder',
         type=str,
         help='Path to flat, YOLO-formatted dataset')
     parser.add_argument(
         'input_file',
         type=str,
         help='Path to COCO dataset file (.json)')
     parser.add_argument(
         '--create_bounding_box_editor_symlinks',
         action='store_true',
-        help='Prepare symlinks so the whole folder appears to contain "images" and "labels" folderss')
+        help='Prepare symlinks so the whole folder appears to contain "images" and "labels" folderss')
     if len(sys.argv[1:]) == 0:
         parser.print_help()
         parser.exit()
@@ -671,7 +688,7 @@ def main():
     args = parser.parse_args()
     coco_to_yolo_results = coco_to_yolo(args.input_folder,args.output_folder,args.input_file)
     if args.create_bounding_box_editor_symlinks:
         create_yolo_symlinks(source_folder=args.output_folder,
                              images_folder=args.output_folder + '/images',
@@ -679,6 +696,6 @@ def main():
                              class_list_file=coco_to_yolo_results['class_list_filename'],
                              class_list_output_name='object.data',
                              force_lowercase_image_extension=True)
 if __name__ == '__main__':
     main()

megadetector 5.0.28__py3-none-any.whl → 10.0.0__py3-none-any.whl

Potentially problematic release.

megadetector 5.0.28__py3-none-any.whl → 10.0.0__py3-none-any.whl