megadetector-5.0.27-py3-none-any.whl → megadetector-5.0.29-py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of megadetector has been flagged as potentially problematic.
- megadetector/api/batch_processing/api_core/batch_service/score.py +4 -5
- megadetector/api/batch_processing/api_core_support/aggregate_results_manually.py +1 -1
- megadetector/api/batch_processing/api_support/summarize_daily_activity.py +1 -1
- megadetector/api/batch_processing/integration/digiKam/xmp_integration.py +2 -2
- megadetector/api/batch_processing/integration/eMammal/test_scripts/push_annotations_to_emammal.py +1 -1
- megadetector/api/batch_processing/integration/eMammal/test_scripts/select_images_for_testing.py +1 -1
- megadetector/api/synchronous/api_core/tests/load_test.py +2 -3
- megadetector/classification/aggregate_classifier_probs.py +3 -3
- megadetector/classification/analyze_failed_images.py +5 -5
- megadetector/classification/cache_batchapi_outputs.py +5 -5
- megadetector/classification/create_classification_dataset.py +11 -12
- megadetector/classification/crop_detections.py +10 -10
- megadetector/classification/csv_to_json.py +8 -8
- megadetector/classification/detect_and_crop.py +13 -15
- megadetector/classification/evaluate_model.py +7 -7
- megadetector/classification/identify_mislabeled_candidates.py +6 -6
- megadetector/classification/json_to_azcopy_list.py +1 -1
- megadetector/classification/json_validator.py +29 -32
- megadetector/classification/map_classification_categories.py +9 -9
- megadetector/classification/merge_classification_detection_output.py +12 -9
- megadetector/classification/prepare_classification_script.py +19 -19
- megadetector/classification/prepare_classification_script_mc.py +23 -23
- megadetector/classification/run_classifier.py +4 -4
- megadetector/classification/save_mislabeled.py +6 -6
- megadetector/classification/train_classifier.py +1 -1
- megadetector/classification/train_classifier_tf.py +9 -9
- megadetector/classification/train_utils.py +10 -10
- megadetector/data_management/annotations/annotation_constants.py +1 -1
- megadetector/data_management/camtrap_dp_to_coco.py +45 -45
- megadetector/data_management/cct_json_utils.py +101 -101
- megadetector/data_management/cct_to_md.py +49 -49
- megadetector/data_management/cct_to_wi.py +33 -33
- megadetector/data_management/coco_to_labelme.py +75 -75
- megadetector/data_management/coco_to_yolo.py +189 -189
- megadetector/data_management/databases/add_width_and_height_to_db.py +3 -2
- megadetector/data_management/databases/combine_coco_camera_traps_files.py +38 -38
- megadetector/data_management/databases/integrity_check_json_db.py +202 -188
- megadetector/data_management/databases/subset_json_db.py +33 -33
- megadetector/data_management/generate_crops_from_cct.py +38 -38
- megadetector/data_management/get_image_sizes.py +54 -49
- megadetector/data_management/labelme_to_coco.py +130 -124
- megadetector/data_management/labelme_to_yolo.py +78 -72
- megadetector/data_management/lila/create_lila_blank_set.py +81 -83
- megadetector/data_management/lila/create_lila_test_set.py +32 -31
- megadetector/data_management/lila/create_links_to_md_results_files.py +18 -18
- megadetector/data_management/lila/download_lila_subset.py +21 -24
- megadetector/data_management/lila/generate_lila_per_image_labels.py +91 -91
- megadetector/data_management/lila/get_lila_annotation_counts.py +30 -30
- megadetector/data_management/lila/get_lila_image_counts.py +22 -22
- megadetector/data_management/lila/lila_common.py +70 -70
- megadetector/data_management/lila/test_lila_metadata_urls.py +13 -14
- megadetector/data_management/mewc_to_md.py +339 -340
- megadetector/data_management/ocr_tools.py +258 -252
- megadetector/data_management/read_exif.py +232 -223
- megadetector/data_management/remap_coco_categories.py +26 -26
- megadetector/data_management/remove_exif.py +31 -20
- megadetector/data_management/rename_images.py +187 -187
- megadetector/data_management/resize_coco_dataset.py +41 -41
- megadetector/data_management/speciesnet_to_md.py +41 -41
- megadetector/data_management/wi_download_csv_to_coco.py +55 -55
- megadetector/data_management/yolo_output_to_md_output.py +117 -120
- megadetector/data_management/yolo_to_coco.py +195 -188
- megadetector/detection/change_detection.py +831 -0
- megadetector/detection/process_video.py +341 -338
- megadetector/detection/pytorch_detector.py +308 -266
- megadetector/detection/run_detector.py +186 -166
- megadetector/detection/run_detector_batch.py +366 -364
- megadetector/detection/run_inference_with_yolov5_val.py +328 -325
- megadetector/detection/run_tiled_inference.py +312 -253
- megadetector/detection/tf_detector.py +24 -24
- megadetector/detection/video_utils.py +291 -283
- megadetector/postprocessing/add_max_conf.py +15 -11
- megadetector/postprocessing/categorize_detections_by_size.py +44 -44
- megadetector/postprocessing/classification_postprocessing.py +808 -311
- megadetector/postprocessing/combine_batch_outputs.py +20 -21
- megadetector/postprocessing/compare_batch_results.py +528 -517
- megadetector/postprocessing/convert_output_format.py +97 -97
- megadetector/postprocessing/create_crop_folder.py +220 -147
- megadetector/postprocessing/detector_calibration.py +173 -168
- megadetector/postprocessing/generate_csv_report.py +508 -0
- megadetector/postprocessing/load_api_results.py +25 -22
- megadetector/postprocessing/md_to_coco.py +129 -98
- megadetector/postprocessing/md_to_labelme.py +89 -83
- megadetector/postprocessing/md_to_wi.py +40 -40
- megadetector/postprocessing/merge_detections.py +87 -114
- megadetector/postprocessing/postprocess_batch_results.py +319 -302
- megadetector/postprocessing/remap_detection_categories.py +36 -36
- megadetector/postprocessing/render_detection_confusion_matrix.py +205 -199
- megadetector/postprocessing/repeat_detection_elimination/find_repeat_detections.py +57 -57
- megadetector/postprocessing/repeat_detection_elimination/remove_repeat_detections.py +27 -28
- megadetector/postprocessing/repeat_detection_elimination/repeat_detections_core.py +702 -677
- megadetector/postprocessing/separate_detections_into_folders.py +226 -211
- megadetector/postprocessing/subset_json_detector_output.py +265 -262
- megadetector/postprocessing/top_folders_to_bottom.py +45 -45
- megadetector/postprocessing/validate_batch_results.py +70 -70
- megadetector/taxonomy_mapping/map_lila_taxonomy_to_wi_taxonomy.py +52 -52
- megadetector/taxonomy_mapping/map_new_lila_datasets.py +15 -15
- megadetector/taxonomy_mapping/prepare_lila_taxonomy_release.py +14 -14
- megadetector/taxonomy_mapping/preview_lila_taxonomy.py +66 -69
- megadetector/taxonomy_mapping/retrieve_sample_image.py +16 -16
- megadetector/taxonomy_mapping/simple_image_download.py +8 -8
- megadetector/taxonomy_mapping/species_lookup.py +33 -33
- megadetector/taxonomy_mapping/taxonomy_csv_checker.py +14 -14
- megadetector/taxonomy_mapping/taxonomy_graph.py +11 -11
- megadetector/taxonomy_mapping/validate_lila_category_mappings.py +13 -13
- megadetector/utils/azure_utils.py +22 -22
- megadetector/utils/ct_utils.py +1019 -200
- megadetector/utils/directory_listing.py +21 -77
- megadetector/utils/gpu_test.py +22 -22
- megadetector/utils/md_tests.py +541 -518
- megadetector/utils/path_utils.py +1511 -406
- megadetector/utils/process_utils.py +41 -41
- megadetector/utils/sas_blob_utils.py +53 -49
- megadetector/utils/split_locations_into_train_val.py +73 -60
- megadetector/utils/string_utils.py +147 -26
- megadetector/utils/url_utils.py +463 -173
- megadetector/utils/wi_utils.py +2629 -2868
- megadetector/utils/write_html_image_list.py +137 -137
- megadetector/visualization/plot_utils.py +21 -21
- megadetector/visualization/render_images_with_thumbnails.py +37 -73
- megadetector/visualization/visualization_utils.py +424 -404
- megadetector/visualization/visualize_db.py +197 -190
- megadetector/visualization/visualize_detector_output.py +126 -98
- {megadetector-5.0.27.dist-info → megadetector-5.0.29.dist-info}/METADATA +6 -3
- megadetector-5.0.29.dist-info/RECORD +163 -0
- {megadetector-5.0.27.dist-info → megadetector-5.0.29.dist-info}/WHEEL +1 -1
- megadetector/data_management/importers/add_nacti_sizes.py +0 -52
- megadetector/data_management/importers/add_timestamps_to_icct.py +0 -79
- megadetector/data_management/importers/animl_results_to_md_results.py +0 -158
- megadetector/data_management/importers/auckland_doc_test_to_json.py +0 -373
- megadetector/data_management/importers/auckland_doc_to_json.py +0 -201
- megadetector/data_management/importers/awc_to_json.py +0 -191
- megadetector/data_management/importers/bellevue_to_json.py +0 -272
- megadetector/data_management/importers/cacophony-thermal-importer.py +0 -793
- megadetector/data_management/importers/carrizo_shrubfree_2018.py +0 -269
- megadetector/data_management/importers/carrizo_trail_cam_2017.py +0 -289
- megadetector/data_management/importers/cct_field_adjustments.py +0 -58
- megadetector/data_management/importers/channel_islands_to_cct.py +0 -913
- megadetector/data_management/importers/eMammal/copy_and_unzip_emammal.py +0 -180
- megadetector/data_management/importers/eMammal/eMammal_helpers.py +0 -249
- megadetector/data_management/importers/eMammal/make_eMammal_json.py +0 -223
- megadetector/data_management/importers/ena24_to_json.py +0 -276
- megadetector/data_management/importers/filenames_to_json.py +0 -386
- megadetector/data_management/importers/helena_to_cct.py +0 -283
- megadetector/data_management/importers/idaho-camera-traps.py +0 -1407
- megadetector/data_management/importers/idfg_iwildcam_lila_prep.py +0 -294
- megadetector/data_management/importers/import_desert_lion_conservation_camera_traps.py +0 -387
- megadetector/data_management/importers/jb_csv_to_json.py +0 -150
- megadetector/data_management/importers/mcgill_to_json.py +0 -250
- megadetector/data_management/importers/missouri_to_json.py +0 -490
- megadetector/data_management/importers/nacti_fieldname_adjustments.py +0 -79
- megadetector/data_management/importers/noaa_seals_2019.py +0 -181
- megadetector/data_management/importers/osu-small-animals-to-json.py +0 -364
- megadetector/data_management/importers/pc_to_json.py +0 -365
- megadetector/data_management/importers/plot_wni_giraffes.py +0 -123
- megadetector/data_management/importers/prepare_zsl_imerit.py +0 -131
- megadetector/data_management/importers/raic_csv_to_md_results.py +0 -416
- megadetector/data_management/importers/rspb_to_json.py +0 -356
- megadetector/data_management/importers/save_the_elephants_survey_A.py +0 -320
- megadetector/data_management/importers/save_the_elephants_survey_B.py +0 -329
- megadetector/data_management/importers/snapshot_safari_importer.py +0 -758
- megadetector/data_management/importers/snapshot_serengeti_lila.py +0 -1067
- megadetector/data_management/importers/snapshotserengeti/make_full_SS_json.py +0 -150
- megadetector/data_management/importers/snapshotserengeti/make_per_season_SS_json.py +0 -153
- megadetector/data_management/importers/sulross_get_exif.py +0 -65
- megadetector/data_management/importers/timelapse_csv_set_to_json.py +0 -490
- megadetector/data_management/importers/ubc_to_json.py +0 -399
- megadetector/data_management/importers/umn_to_json.py +0 -507
- megadetector/data_management/importers/wellington_to_json.py +0 -263
- megadetector/data_management/importers/wi_to_json.py +0 -442
- megadetector/data_management/importers/zamba_results_to_md_results.py +0 -180
- megadetector/data_management/lila/add_locations_to_island_camera_traps.py +0 -101
- megadetector/data_management/lila/add_locations_to_nacti.py +0 -151
- megadetector-5.0.27.dist-info/RECORD +0 -208
- {megadetector-5.0.27.dist-info → megadetector-5.0.29.dist-info}/licenses/LICENSE +0 -0
- {megadetector-5.0.27.dist-info → megadetector-5.0.29.dist-info}/top_level.txt +0 -0
(Only a subset of the changed files is rendered below; blank "-"/"+" line pairs are whitespace-only changes, e.g. trailing whitespace removed.)

megadetector/classification/identify_mislabeled_candidates.py

@@ -5,7 +5,7 @@ identify_mislabeled_candidates.py
 Identify images that may have been mislabeled.

 A "mislabeled candidate" is defined as an image meeting both criteria:
-
+
 * according to the ground-truth label, the model made an incorrect prediction

 * the model's prediction confidence exceeds its confidence for the ground-truth
@@ -13,12 +13,12 @@ A "mislabeled candidate" is defined as an image meeting both criteria:

 This script outputs for each dataset a text file containing the filenames of
 mislabeled candidates, one per line. The text files are saved to:
-
+
     <logdir>/mislabeled_candidates_{split}_{dataset}.txt

 To this list of files can then be passed to AzCopy to be downloaded:

-""
+""
 azcopy cp "http://<url_of_container>?<sas_token>" "/save/files/here" \
     --list-of-files "/path/to/mislabeled_candidates_{split}_{dataset}.txt"
 ""
@@ -68,7 +68,7 @@ from tqdm import tqdm

 def main(logdir: str, splits: Iterable[str], margin: float,
          include_dataset_in_filename: bool) -> None:
-
+
     # load files
     logdir = os.path.normpath(logdir)  # removes any trailing slash
     base_logdir = os.path.dirname(logdir)
@@ -112,7 +112,7 @@ def get_candidates_df(outputs_csv_path: str, label_names: Sequence[str],
     Returns a DataFrame containing crops only from mislabeled candidate
     images.
     """
-
+
     df = pd.read_csv(outputs_csv_path, float_precision='high')
     all_rows = range(len(df))
     df['pred'] = df[label_names].idxmax(axis=1)
@@ -146,7 +146,7 @@ def _parse_args() -> argparse.Namespace:


 if __name__ == '__main__':
-
+
     args = _parse_args()
     main(logdir=args.logdir, splits=args.splits, margin=args.margin,
          include_dataset_in_filename=args.include_dataset_in_filename)
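The hunks above are whitespace-only, but the docstring they quote pins down the selection rule exactly. As a minimal sketch of that rule, assuming a DataFrame with one probability column per class plus a ground-truth 'label' column (illustrative column names, not necessarily the script's actual schema):

    import numpy as np
    import pandas as pd

    def candidate_mask(df: pd.DataFrame, label_names: list, margin: float) -> pd.Series:
        # Per-class confidences as a matrix, one row per crop
        probs = df[label_names].to_numpy()
        # Index of the ground-truth class for each row (assumes every value
        # in df['label'] appears in label_names)
        true_idx = df['label'].map({n: i for i, n in enumerate(label_names)}).to_numpy()
        pred_idx = probs.argmax(axis=1)                  # model's prediction
        pred_conf = probs.max(axis=1)                    # its confidence
        true_conf = probs[np.arange(len(df)), true_idx]  # confidence in the true label
        # Mislabeled candidate: the prediction is wrong, and the model is more
        # confident in it than in the ground-truth label by at least `margin`
        return pd.Series((pred_idx != true_idx) & (pred_conf > true_conf + margin),
                         index=df.index)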
megadetector/classification/json_validator.py

@@ -10,12 +10,12 @@ See README.md for an example of a classification label specification JSON file.
 The validation step takes the classification label specification JSON file and
 finds the dataset labels that belong to each classification label. It checks
 that the following conditions hold:
-
+
 1) Each classification label specification matches at least 1 dataset label.

 2) If the classification label includes a taxonomical specification, then the
    taxa is actually a part of our master taxonomy.
-
+
 3) If the 'prioritize' key is found for a given label, then the label must
    also have a 'max_count' key.

@@ -44,7 +44,7 @@ exist in Azure Blob Storage. In total, we output the following files:

 - queried_images.json
     main output file, ex:
-
+
     {
         "caltech/cct_images/59f5fe2b-23d2-11e8-a6a3-ec086b02610b.jpg": {
             "dataset": "caltech",
@@ -86,6 +86,7 @@ from typing import Any

 from megadetector.utils import path_utils
 from megadetector.utils import sas_blob_utils
+from megadetector.utils import ct_utils

 from megadetector.data_management.megadb import megadb_utils
 from megadetector.taxonomy_mapping.taxonomy_graph import (
@@ -113,7 +114,7 @@ def main(label_spec_json_path: str,
          json_indent: int | None = None,
          seed: int = 123,
          mislabeled_images_dir: str | None = None) -> None:
-
+
     # input validation
     assert os.path.exists(label_spec_json_path)
     assert os.path.exists(taxonomy_csv_path)
@@ -166,36 +167,32 @@ def main(label_spec_json_path: str,
     date = datetime.now().strftime('%Y%m%d_%H%M%S')  # ex: '20200722_110816'
     log_path = os.path.join(output_dir, f'json_validator_log_{date}.json')
     print(f'Saving log of bad images to {log_path}')
-
-        json.dump(log, f, indent=1)
+    ct_utils.write_json(log_path, log)

     # save label counts, pre-subsampling
     print('Saving pre-sampling label counts')
     save_path = os.path.join(output_dir, 'image_counts_by_label_presample.json')
-
-
-
-
-
-        json.dump(image_counts_by_label, f, indent=1)
+    image_counts_by_label_presample = {
+        label: len(filter_images(output_js, label))
+        for label in sorted(input_js.keys())
+    }
+    ct_utils.write_json(save_path, image_counts_by_label_presample)

     print('Sampling with priority (if needed)')
     output_js = sample_with_priority(input_js, output_js)

     print('Saving queried_images.json')
     output_json_path = os.path.join(output_dir, 'queried_images.json')
-
-        json.dump(output_js, f, indent=json_indent)
+    ct_utils.write_json(output_json_path, output_js, indent=json_indent)

     # save label counts, post-subsampling
     print('Saving post-sampling label counts')
     save_path = os.path.join(output_dir, 'image_counts_by_label_sampled.json')
-
-
-
-
-
-        json.dump(image_counts_by_label, f, indent=1)
+    image_counts_by_label_sampled = {
+        label: len(filter_images(output_js, label))
+        for label in sorted(input_js.keys())
+    }
+    ct_utils.write_json(save_path, image_counts_by_label_sampled)


 #%% Support functions
@@ -215,7 +212,7 @@ def parse_spec(spec_dict: Mapping[str, Any],

     Raises: ValueError, if specification does not match any dataset labels
     """
-
+
     results = set()
     if 'taxa' in spec_dict:
         # spec_dict['taxa']: list of dict
@@ -262,7 +259,7 @@ def validate_json(input_js: dict[str, dict[str, Any]],
     dataset labels, or if allow_multilabel=False but a dataset label is
     included in two or more classification labels
     """
-
+
     # maps output label name to set of (dataset, dataset_label) tuples
     label_to_inclusions: dict[str, set[tuple[str, str]]] = {}
     for label, spec_dict in input_js.items():
@@ -301,7 +298,7 @@ def get_output_json(label_to_inclusions: dict[str, set[tuple[str, str]]],
     - 'label': list of str, assigned output label
     - 'bbox': list of dicts, optional
     """
-
+
     # Because MegaDB is organized by dataset, we do the same...
     #
     # ds_to_labels = {
@@ -360,9 +357,9 @@
     '''

     output_json = {}  # maps full image path to json object
-
+
     for ds in tqdm(sorted(ds_to_labels.keys())):  # sort for determinism
-
+
         mislabeled_images: Mapping[str, Any] = {}
         if mislabeled_images_dir is not None:
             csv_path = os.path.join(mislabeled_images_dir, f'{ds}.csv')
@@ -428,7 +425,7 @@ def get_image_sas_uris(img_paths: Iterable[str]) -> list[str]:
     image_sas_uris: list of str, image blob URIs with SAS tokens, ready to
         pass to the batch detection API
     """
-
+
     # we need the datasets table for getting SAS keys
     datasets_table = megadb_utils.MegadbUtils().get_datasets_table()

@@ -483,7 +480,7 @@ def remove_nonexistent_images(js: MutableMapping[str, dict[str, Any]],
     check_local: optional str, path to local dir
     num_threads: int, number of threads to use for checking blob existence
     """
-
+
     def check_local_then_azure(local_path: str, blob_url: str) -> bool:
         return (os.path.exists(local_path)
                 or sas_blob_utils.check_blob_exists(blob_url))
@@ -538,7 +535,7 @@ def remove_images_insufficient_locs(js: MutableMapping[str, dict[str, Any]],
     min_locs: optional int, minimum # of locations that each label must
         have in order to be included
     """
-
+
     # 1st pass: populate label_to_locs
     # label (tuple of str) => set of (dataset, location)
     label_to_locs = defaultdict(set)
@@ -574,7 +571,7 @@ def filter_images(output_js: Mapping[str, Mapping[str, Any]], label: str,

     Returns: set of str, image files that match the filtering criteria
     """
-
+
     img_files: set[str] = set()
     for img_file, img_dict in output_js.items():
         cond1 = (label in img_dict['label'])
@@ -594,7 +591,7 @@ def sample_with_priority(input_js: Mapping[str, Mapping[str, Any]],

     Returns: dict, keys are image file names, sorted alphabetically
     """
-
+
     filtered_imgs: set[str] = set()
     for label, spec_dict in input_js.items():
         if 'prioritize' in spec_dict and 'max_count' not in spec_dict:
@@ -635,7 +632,7 @@
 #%% Command-line driver

 def _parse_args() -> argparse.Namespace:
-
+
     parser = argparse.ArgumentParser(
         formatter_class=argparse.ArgumentDefaultsHelpFormatter,
         description='Validates JSON.')
@@ -685,7 +682,7 @@ def _parse_args() -> argparse.Namespace:


 if __name__ == '__main__':
-
+
     args = _parse_args()
     main(label_spec_json_path=args.label_spec_json,
          taxonomy_csv_path=args.taxonomy_csv,
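The substantive change in this file (and in the next two) is mechanical: each open()/json.dump() pair is replaced by a call to the new ct_utils.write_json helper. The helper's implementation is not shown in this diff; a plausible minimal equivalent, inferred only from the call sites above, is:

    import json

    def write_json(output_path, obj, indent=1):
        # Hypothetical stand-in for megadetector.utils.ct_utils.write_json;
        # the real helper may accept additional options. Call sites in this
        # diff pass (path, object), optionally with indent=...
        with open(output_path, 'w', encoding='utf-8') as f:
            json.dump(obj, f, indent=indent)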
megadetector/classification/map_classification_categories.py

@@ -12,11 +12,11 @@ Takes as input 2 label specification JSON files:

 1) desired label specification JSON file
    this should not have a target named "other"
-
+
 2) label specification JSON file of trained classifier

 The mapping is accomplished as follows:
-
+
 1. For each category in the classifier label spec, find all taxon nodes that
    belong to that category.

@@ -54,6 +54,7 @@ from tqdm import tqdm

 from megadetector.taxonomy_mapping.taxonomy_graph import (
     build_taxonomy_graph, dag_to_tree, TaxonNode)
+from megadetector.utils import ct_utils


 #%% Example usage
@@ -105,8 +106,7 @@ def main(desired_label_spec_json_path: str,
     target_to_classifier_labels = map_target_to_classifier(
         target_label_to_nodes, classifier_label_to_nodes)
     os.makedirs(os.path.dirname(output_json_path), exist_ok=True)
-
-        json.dump(target_to_classifier_labels, f, indent=1)
+    ct_utils.write_json(output_json_path, target_to_classifier_labels)


 #%% Support functions
@@ -129,7 +129,7 @@ def map_target_to_classifier(

     Returns: dict, maps target label to set of classifier labels
     """
-
+
     remaining_classifier_labels = set(classifier_label_to_nodes.keys())
     target_to_classifier_labels: defaultdict[str, set[str]] = defaultdict(set)
     for target, target_nodes in tqdm(target_label_to_nodes.items()):
@@ -172,7 +172,7 @@ def parse_spec(spec_dict: Mapping[str, Any],

     Raises: ValueError, if specification does not match any dataset labels
     """
-
+
     result = set()
     if 'taxa' in spec_dict:
         for taxon in spec_dict['taxa']:
@@ -217,7 +217,7 @@ def label_spec_to_nodes(label_spec_js: dict[str, dict[str, Any]],
     Raises: ValueError, if a classification label specification matches no
     TaxonNode, or if a node is included in two or more classification labels
     """
-
+
     # maps output label name to set of (dataset, dataset_label) tuples
     seen_nodes: set[TaxonNode] = set()
     label_to_nodes: dict[str, set[TaxonNode]] = {}
@@ -239,7 +239,7 @@
 #%% Command-line driver

 def _parse_args() -> argparse.Namespace:
-
+
     parser = argparse.ArgumentParser(
         formatter_class=argparse.ArgumentDefaultsHelpFormatter,
         description='Create mapping from target categories to classifier '
@@ -267,7 +267,7 @@ def _parse_args() -> argparse.Namespace:


 if __name__ == '__main__':
-
+
     args = _parse_args()
     main(desired_label_spec_json_path=args.desired_label_spec_json,
          classifier_label_spec_json_path=args.classifier_label_spec_json,
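The docstring above describes the mapping as an overlap test on taxonomy nodes: a classifier label maps to a target label when the two share at least one TaxonNode. A sketch of that step, assuming both inputs are dicts of label -> set of nodes as the hunks suggest (the real map_target_to_classifier also tracks the remaining_classifier_labels set visible above):

    def map_target_to_classifier_sketch(target_label_to_nodes,
                                        classifier_label_to_nodes):
        # Illustrative only; see map_classification_categories.py for the
        # actual logic.
        target_to_classifier_labels = {}
        for target, target_nodes in target_label_to_nodes.items():
            target_to_classifier_labels[target] = {
                clf_label
                for clf_label, clf_nodes in classifier_label_to_nodes.items()
                if clf_nodes & target_nodes  # share at least one taxon node
            }
        return target_to_classifier_labels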
megadetector/classification/merge_classification_detection_output.py

@@ -71,6 +71,7 @@ import pandas as pd
 from tqdm import tqdm

 from megadetector.utils.ct_utils import round_float
+from megadetector.utils import ct_utils


 #%% Example usage
@@ -109,7 +110,7 @@ def row_to_classification_list(row: Mapping[str, Any],
     (label_id + 1_000_000, 1.) to the list. If label_pos='first', we put this at
     the front of the list. Otherwise, we put it at the end.
     """
-
+
     contains_label = ('label' in row)
     assert contains_label or contains_preds
     if relative_conf:
@@ -176,7 +177,7 @@ def process_queried_images(
     Returns: dict, detections JSON file, except that the 'images' field is a
     dict (img_path => dict) instead of a list
     """
-
+
     # input validation
     assert os.path.exists(queried_images_json_path)
     detection_cache_dir = os.path.join(
@@ -274,7 +275,7 @@ def combine_classification_with_detection(
         label_pos: str | None = None,
         relative_conf: bool = False,
         typical_confidence_threshold: float = None
-        ) -> dict[str, Any]:
+        ) -> dict[str, Any]:
     """
     Adds classification information to a detection JSON. Classification
     information may include the true label and/or the predicted confidences
@@ -302,7 +303,7 @@

     Returns: dict, detections JSON file updated with classification results
     """
-
+
     classification_metadata = {
         'classifier': classifier_name,
         'classification_completion_time': classifier_timestamp
@@ -354,7 +355,7 @@ def main(classification_csv_path: str,
          label_pos: str | None,
          relative_conf: bool,
          typical_confidence_threshold: float) -> None:
-
+
     # input validation
     assert os.path.exists(classification_csv_path)
     assert os.path.exists(label_names_json_path)
@@ -409,8 +410,10 @@
         typical_confidence_threshold=typical_confidence_threshold)

     os.makedirs(os.path.dirname(output_json_path), exist_ok=True)
-
-
+    # The following line was removed as per the previous refactoring:
+    # with open(output_json_path, 'w') as f:
+    #     json.dump(classification_js, f, indent=1)
+    ct_utils.write_json(output_json_path, classification_js)

     print('Wrote merged classification/detection results to {}'.format(output_json_path))

@@ -418,7 +421,7 @@
 #%% Command-line driver

 def _parse_args() -> argparse.Namespace:
-
+
     parser = argparse.ArgumentParser(
         formatter_class=argparse.ArgumentDefaultsHelpFormatter,
         description='Merges classification results with Batch Detection API '
@@ -487,7 +490,7 @@ def _parse_args() -> argparse.Namespace:


 if __name__ == '__main__':
-
+
     args = _parse_args()
     main(classification_csv_path=args.classification_csv,
          label_names_json_path=args.label_names_json,
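The row_to_classification_list docstring above fully specifies how the ground-truth label is injected into a crop's classification list. As a worked example (the entry format is assumed to match the (category_id, confidence) pairs used in MD output files; this is not the script's actual helper):

    def add_true_label(classifications, label_id, label_pos):
        # Ground-truth marker per the docstring: category id offset by
        # 1,000,000, confidence pinned to 1.0
        entry = (label_id + 1_000_000, 1.0)
        if label_pos == 'first':
            return [entry] + list(classifications)
        return list(classifications) + [entry]

    # e.g. label_id=3, label_pos='first' -> (1000003, 1.0) goes at the front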
megadetector/classification/prepare_classification_script.py

@@ -13,7 +13,7 @@ Differs from prepare_classification_script_mc.py only in the final class mapping

 import os

-def main():
+def main():  # noqa
     organization_name = 'idfg'
     job_name = 'idfg-2022-01-27-EOE2021S_Group6'
     input_filename = 'idfg-2022-01-27-EOE2021S_Group6_detections.filtered_rde_0.60_0.85_30_0.20.json'
@@ -44,7 +44,7 @@ def main():

     for fn in input_files:
         assert os.path.isfile(fn)
-
+

     #%% Constants

@@ -76,7 +76,7 @@ def main():
     typical_classification_threshold_str = '0.75'

     classifier_name = 'idfg4'
-
+

     #%% Set up environment

@@ -88,18 +88,18 @@ def main():
     #%% Crop images

     if include_cropping:
-
+
         commands.append('\n### Cropping ###\n')
-
+
         # fn = input_files[0]
         for fn in input_files:
-
+
             input_file_path = fn
             crop_cmd = ''
-
+
             crop_comment = '\n# Cropping {}\n'.format(fn)
             crop_cmd += crop_comment
-
+
             crop_cmd += "python crop_detections.py \\\n" + \
                 input_file_path + ' \\\n' + \
                 crop_path + ' \\\n' + \
@@ -122,12 +122,12 @@ def main():

         input_file_path = fn
         classifier_output_path = crop_path + classifier_output_suffix
-
+
         classify_cmd = ''
-
+
         classify_comment = '\n# Classifying {}\n'.format(fn)
         classify_cmd += classify_comment
-
+
         classify_cmd += "python run_classifier.py \\\n" + \
             checkpoint_path + ' \\\n' + \
             crop_path + ' \\\n' + \
@@ -137,14 +137,14 @@ def main():
             '--image-size "' + image_size_str + '"' + ' \\\n' + \
             '--batch-size "' + batch_size_str + '"' + ' \\\n' + \
             '--num-workers "' + num_workers_str + '"' + ' \\\n'
-
+
         if device_id is not None:
             classify_cmd += '--device {}'.format(device_id)
-
-        classify_cmd += '\n\n'
+
+        classify_cmd += '\n\n'
         classify_cmd = '{}'.format(classify_cmd)
         commands.append(classify_cmd)
-
+

     #%% Merge classification and detection outputs

@@ -161,12 +161,12 @@ def main():
             final_output_suffix)
         final_output_path = final_output_path.replace('_detections','')
         final_output_path = final_output_path.replace('_crops','')
-
+
         merge_cmd = ''
-
+
         merge_comment = '\n# Merging {}\n'.format(fn)
         merge_cmd += merge_comment
-
+
         merge_cmd += "python merge_classification_detection_output.py \\\n" + \
             classifier_output_path + ' \\\n' + \
             classifier_categories_path + ' \\\n' + \
@@ -189,6 +189,6 @@ def main():
     import stat
     st = os.stat(output_file)
     os.chmod(output_file, st.st_mode | stat.S_IEXEC)
-
+
 if __name__ == '__main__':
     main()
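Both prepare_* scripts end the same way: the generated shell script is marked executable in place. The idiom, taken from the hunk above (output_file shown here with an illustrative value), is equivalent to chmod u+x:

    import os
    import stat

    output_file = 'run_classification_pipeline.sh'  # illustrative path

    # Add the owner-execute bit to whatever permission bits the file
    # already has
    st = os.stat(output_file)
    os.chmod(output_file, st.st_mode | stat.S_IEXEC)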
megadetector/classification/prepare_classification_script_mc.py

@@ -43,7 +43,7 @@ input_files = [

 for fn in input_files:
     assert os.path.isfile(fn)
-
+

 #%% Constants

@@ -76,7 +76,7 @@ classification_threshold_str = '0.05'
 typical_classification_threshold_str = '0.75'

 classifier_name = 'megaclassifier_v0.1_efficientnet-b3'
-
+

 #%% Set up environment

@@ -94,10 +94,10 @@ for fn in input_files:

     input_file_path = fn
     crop_cmd = ''
-
+
     crop_comment = '\n# Cropping {}\n'.format(fn)
     crop_cmd += crop_comment
-
+
     crop_cmd += "python crop_detections.py \\\n" + \
         input_file_path + ' \\\n' + \
         crop_path + ' \\\n' + \
@@ -120,12 +120,12 @@ for fn in input_files:

     input_file_path = fn
     classifier_output_path = crop_path + classifier_output_suffix
-
+
     classify_cmd = ''
-
+
     classify_comment = '\n# Classifying {}\n'.format(fn)
     classify_cmd += classify_comment
-
+
     classify_cmd += "python run_classifier.py \\\n" + \
         checkpoint_path + ' \\\n' + \
         crop_path + ' \\\n' + \
@@ -135,14 +135,14 @@ for fn in input_files:
         '--image-size "' + image_size_str + '"' + ' \\\n' + \
         '--batch-size "' + batch_size_str + '"' + ' \\\n' + \
         '--num-workers "' + num_workers_str + '"' + ' \\\n'
-
+
     if device_id is not None:
         classify_cmd += '--device {}'.format(device_id)
-
-    classify_cmd += '\n\n'
+
+    classify_cmd += '\n\n'
     classify_cmd = '{}'.format(classify_cmd)
     commands.append(classify_cmd)
-
+

 #%% Remap classifier outputs

@@ -156,25 +156,25 @@ for fn in input_files:
     classifier_output_path_remapped = \
         classifier_output_path.replace(".csv.gz","_remapped.csv.gz")
     assert not (classifier_output_path == classifier_output_path_remapped)
-
+
     output_label_index = classifier_output_path_remapped.replace(
         "_remapped.csv.gz","_label_index_remapped.json")
-
+
     remap_cmd = ''
-
+
     remap_comment = '\n# Remapping {}\n'.format(fn)
     remap_cmd += remap_comment
-
+
     remap_cmd += "python aggregate_classifier_probs.py \\\n" + \
         classifier_output_path + ' \\\n' + \
         '--target-mapping "' + target_mapping_path + '"' + ' \\\n' + \
         '--output-csv "' + classifier_output_path_remapped + '"' + ' \\\n' + \
         '--output-label-index "' + output_label_index + '"' + ' \\\n' + \
         '\n'
-
+
     remap_cmd = '{}'.format(remap_cmd)
     commands.append(remap_cmd)
-
+

 #%% Merge classification and detection outputs

@@ -185,25 +185,25 @@ for fn in input_files:

     input_file_path = fn
     classifier_output_path = crop_path + classifier_output_suffix
-
+
     classifier_output_path_remapped = \
         classifier_output_path.replace(".csv.gz","_remapped.csv.gz")
-
+
     output_label_index = classifier_output_path_remapped.replace(
         "_remapped.csv.gz","_label_index_remapped.json")
-
+
     final_output_path = os.path.join(output_base,
         os.path.basename(classifier_output_path)).\
         replace(classifier_output_suffix,
                 final_output_suffix)
     final_output_path = final_output_path.replace('_detections','')
     final_output_path = final_output_path.replace('_crops','')
-
+
     merge_cmd = ''
-
+
     merge_comment = '\n# Merging {}\n'.format(fn)
     merge_cmd += merge_comment
-
+
     merge_cmd += "python merge_classification_detection_output.py \\\n" + \
         classifier_output_path_remapped + ' \\\n' + \
         output_label_index + ' \\\n' + \
megadetector/classification/run_classifier.py

@@ -103,7 +103,7 @@ def create_loader(cropped_images_dir: str,
     batch_size: int, batch size in dataloader
     num_workers: int, # of workers in dataloader
     """
-
+
     crop_files = []

     if detections_json_path is None:
@@ -160,7 +160,7 @@ def main(model_path: str,
          batch_size: int,
          num_workers: int,
          device_id: int | None = None) -> None:
-
+
     # Evaluating with accimage is much faster than Pillow or Pillow-SIMD, but accimage
     # is Linux-only.
     try:
@@ -207,7 +207,7 @@ def test_epoch(model: torch.nn.Module,
     label_names: optional list of str, label names
     output_csv_path: str
     """
-
+
     # set dropout and BN layers to eval mode
     model.eval()

@@ -274,7 +274,7 @@ def _parse_args() -> argparse.Namespace:


 if __name__ == '__main__':
-
+
     args = _parse_args()
     main(model_path=args.model,
          cropped_images_dir=args.crops_dir,