PyPI - megadetector - Versions diffs - 10.0.15__py3-none-any.whl - Mend

megadetector 10.0.15__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (147) hide show

megadetector/__init__.py +0 -0
megadetector/api/__init__.py +0 -0
megadetector/api/batch_processing/integration/digiKam/setup.py +6 -0
megadetector/api/batch_processing/integration/digiKam/xmp_integration.py +465 -0
megadetector/api/batch_processing/integration/eMammal/test_scripts/config_template.py +5 -0
megadetector/api/batch_processing/integration/eMammal/test_scripts/push_annotations_to_emammal.py +125 -0
megadetector/api/batch_processing/integration/eMammal/test_scripts/select_images_for_testing.py +55 -0
megadetector/classification/__init__.py +0 -0
megadetector/classification/aggregate_classifier_probs.py +108 -0
megadetector/classification/analyze_failed_images.py +227 -0
megadetector/classification/cache_batchapi_outputs.py +198 -0
megadetector/classification/create_classification_dataset.py +626 -0
megadetector/classification/crop_detections.py +516 -0
megadetector/classification/csv_to_json.py +226 -0
megadetector/classification/detect_and_crop.py +853 -0
megadetector/classification/efficientnet/__init__.py +9 -0
megadetector/classification/efficientnet/model.py +415 -0
megadetector/classification/efficientnet/utils.py +608 -0
megadetector/classification/evaluate_model.py +520 -0
megadetector/classification/identify_mislabeled_candidates.py +152 -0
megadetector/classification/json_to_azcopy_list.py +63 -0
megadetector/classification/json_validator.py +696 -0
megadetector/classification/map_classification_categories.py +276 -0
megadetector/classification/merge_classification_detection_output.py +509 -0
megadetector/classification/prepare_classification_script.py +194 -0
megadetector/classification/prepare_classification_script_mc.py +228 -0
megadetector/classification/run_classifier.py +287 -0
megadetector/classification/save_mislabeled.py +110 -0
megadetector/classification/train_classifier.py +827 -0
megadetector/classification/train_classifier_tf.py +725 -0
megadetector/classification/train_utils.py +323 -0
megadetector/data_management/__init__.py +0 -0
megadetector/data_management/animl_to_md.py +161 -0
megadetector/data_management/annotations/__init__.py +0 -0
megadetector/data_management/annotations/annotation_constants.py +33 -0
megadetector/data_management/camtrap_dp_to_coco.py +270 -0
megadetector/data_management/cct_json_utils.py +566 -0
megadetector/data_management/cct_to_md.py +184 -0
megadetector/data_management/cct_to_wi.py +293 -0
megadetector/data_management/coco_to_labelme.py +284 -0
megadetector/data_management/coco_to_yolo.py +701 -0
megadetector/data_management/databases/__init__.py +0 -0
megadetector/data_management/databases/add_width_and_height_to_db.py +107 -0
megadetector/data_management/databases/combine_coco_camera_traps_files.py +210 -0
megadetector/data_management/databases/integrity_check_json_db.py +563 -0
megadetector/data_management/databases/subset_json_db.py +195 -0
megadetector/data_management/generate_crops_from_cct.py +200 -0
megadetector/data_management/get_image_sizes.py +164 -0
megadetector/data_management/labelme_to_coco.py +559 -0
megadetector/data_management/labelme_to_yolo.py +349 -0
megadetector/data_management/lila/__init__.py +0 -0
megadetector/data_management/lila/create_lila_blank_set.py +556 -0
megadetector/data_management/lila/create_lila_test_set.py +192 -0
megadetector/data_management/lila/create_links_to_md_results_files.py +106 -0
megadetector/data_management/lila/download_lila_subset.py +182 -0
megadetector/data_management/lila/generate_lila_per_image_labels.py +777 -0
megadetector/data_management/lila/get_lila_annotation_counts.py +174 -0
megadetector/data_management/lila/get_lila_image_counts.py +112 -0
megadetector/data_management/lila/lila_common.py +319 -0
megadetector/data_management/lila/test_lila_metadata_urls.py +164 -0
megadetector/data_management/mewc_to_md.py +344 -0
megadetector/data_management/ocr_tools.py +873 -0
megadetector/data_management/read_exif.py +964 -0
megadetector/data_management/remap_coco_categories.py +195 -0
megadetector/data_management/remove_exif.py +156 -0
megadetector/data_management/rename_images.py +194 -0
megadetector/data_management/resize_coco_dataset.py +665 -0
megadetector/data_management/speciesnet_to_md.py +41 -0
megadetector/data_management/wi_download_csv_to_coco.py +247 -0
megadetector/data_management/yolo_output_to_md_output.py +594 -0
megadetector/data_management/yolo_to_coco.py +984 -0
megadetector/data_management/zamba_to_md.py +188 -0
megadetector/detection/__init__.py +0 -0
megadetector/detection/change_detection.py +840 -0
megadetector/detection/process_video.py +479 -0
megadetector/detection/pytorch_detector.py +1451 -0
megadetector/detection/run_detector.py +1267 -0
megadetector/detection/run_detector_batch.py +2172 -0
megadetector/detection/run_inference_with_yolov5_val.py +1314 -0
megadetector/detection/run_md_and_speciesnet.py +1604 -0
megadetector/detection/run_tiled_inference.py +1044 -0
megadetector/detection/tf_detector.py +209 -0
megadetector/detection/video_utils.py +1379 -0
megadetector/postprocessing/__init__.py +0 -0
megadetector/postprocessing/add_max_conf.py +72 -0
megadetector/postprocessing/categorize_detections_by_size.py +166 -0
megadetector/postprocessing/classification_postprocessing.py +1943 -0
megadetector/postprocessing/combine_batch_outputs.py +249 -0
megadetector/postprocessing/compare_batch_results.py +2110 -0
megadetector/postprocessing/convert_output_format.py +403 -0
megadetector/postprocessing/create_crop_folder.py +629 -0
megadetector/postprocessing/detector_calibration.py +570 -0
megadetector/postprocessing/generate_csv_report.py +522 -0
megadetector/postprocessing/load_api_results.py +223 -0
megadetector/postprocessing/md_to_coco.py +428 -0
megadetector/postprocessing/md_to_labelme.py +351 -0
megadetector/postprocessing/md_to_wi.py +41 -0
megadetector/postprocessing/merge_detections.py +392 -0
megadetector/postprocessing/postprocess_batch_results.py +2140 -0
megadetector/postprocessing/remap_detection_categories.py +226 -0
megadetector/postprocessing/render_detection_confusion_matrix.py +677 -0
megadetector/postprocessing/repeat_detection_elimination/find_repeat_detections.py +206 -0
megadetector/postprocessing/repeat_detection_elimination/remove_repeat_detections.py +82 -0
megadetector/postprocessing/repeat_detection_elimination/repeat_detections_core.py +1665 -0
megadetector/postprocessing/separate_detections_into_folders.py +795 -0
megadetector/postprocessing/subset_json_detector_output.py +964 -0
megadetector/postprocessing/top_folders_to_bottom.py +238 -0
megadetector/postprocessing/validate_batch_results.py +332 -0
megadetector/taxonomy_mapping/__init__.py +0 -0
megadetector/taxonomy_mapping/map_lila_taxonomy_to_wi_taxonomy.py +491 -0
megadetector/taxonomy_mapping/map_new_lila_datasets.py +211 -0
megadetector/taxonomy_mapping/prepare_lila_taxonomy_release.py +165 -0
megadetector/taxonomy_mapping/preview_lila_taxonomy.py +543 -0
megadetector/taxonomy_mapping/retrieve_sample_image.py +71 -0
megadetector/taxonomy_mapping/simple_image_download.py +231 -0
megadetector/taxonomy_mapping/species_lookup.py +1008 -0
megadetector/taxonomy_mapping/taxonomy_csv_checker.py +159 -0
megadetector/taxonomy_mapping/taxonomy_graph.py +346 -0
megadetector/taxonomy_mapping/validate_lila_category_mappings.py +83 -0
megadetector/tests/__init__.py +0 -0
megadetector/tests/test_nms_synthetic.py +335 -0
megadetector/utils/__init__.py +0 -0
megadetector/utils/ct_utils.py +1857 -0
megadetector/utils/directory_listing.py +199 -0
megadetector/utils/extract_frames_from_video.py +307 -0
megadetector/utils/gpu_test.py +125 -0
megadetector/utils/md_tests.py +2072 -0
megadetector/utils/path_utils.py +2872 -0
megadetector/utils/process_utils.py +172 -0
megadetector/utils/split_locations_into_train_val.py +237 -0
megadetector/utils/string_utils.py +234 -0
megadetector/utils/url_utils.py +825 -0
megadetector/utils/wi_platform_utils.py +968 -0
megadetector/utils/wi_taxonomy_utils.py +1766 -0
megadetector/utils/write_html_image_list.py +239 -0
megadetector/visualization/__init__.py +0 -0
megadetector/visualization/plot_utils.py +309 -0
megadetector/visualization/render_images_with_thumbnails.py +243 -0
megadetector/visualization/visualization_utils.py +1973 -0
megadetector/visualization/visualize_db.py +630 -0
megadetector/visualization/visualize_detector_output.py +498 -0
megadetector/visualization/visualize_video_output.py +705 -0
megadetector-10.0.15.dist-info/METADATA +115 -0
megadetector-10.0.15.dist-info/RECORD +147 -0
megadetector-10.0.15.dist-info/WHEEL +5 -0
megadetector-10.0.15.dist-info/licenses/LICENSE +19 -0
megadetector-10.0.15.dist-info/top_level.txt +1 -0

megadetector/classification/map_classification_categories.py ADDED Viewed

@@ -0,0 +1,276 @@
+"""
+map_classification_categories.py
+Maps a classifier's output categories to desired target categories.
+In this file, we use the following terminology:
+* "category": a category output by the classifier
+* "target": name of a desired group, comprising >= 1 classifier categories
+Takes as input 2 label specification JSON files:
+1) desired label specification JSON file
+   this should not have a target named "other"
+2) label specification JSON file of trained classifier
+The mapping is accomplished as follows:
+1. For each category in the classifier label spec, find all taxon nodes that
+    belong to that category.
+2. Given a target in the desired label spec, find all taxon nodes that belong
+    to that target. If there is any classifier category whose nodes are a
+    subset of the target nodes, then map the classifier category to that target.
+    Any partial intersection between a target's nodes and a category's nodes
+    is considered an error.
+3. If there are any classifier categories that have not yet been assigned a
+    target, group them into the "other" target.
+This script outputs a JSON file that maps each target to a list of classifier
+categories.
+The taxonomy mapping parts of this script are very similar to json_validator.py.
+"""
+#%% Imports
+from __future__ import annotations
+import argparse
+import json
+import os
+from collections import defaultdict
+from collections.abc import Mapping
+from typing import Any, Optional
+import networkx as nx
+import pandas as pd
+from tqdm import tqdm
+from megadetector.taxonomy_mapping.taxonomy_graph import (
+    build_taxonomy_graph, dag_to_tree, TaxonNode)
+from megadetector.utils import ct_utils
+#%% Example usage
+"""
+    python map_classification_categories.py \
+        desired_label_spec.json \
+        /path/to/classifier/label_spec.json \
+        $HOME/camera-traps-private/camera_trap_taxonomy_mapping.csv \
+        --output /path/to/output/target_to_classifier_labels.json
+"""
+#%% Main function
+def main(desired_label_spec_json_path: str,
+         classifier_label_spec_json_path: str,
+         taxonomy_csv_path: str,
+         output_json_path: str,
+         classifier_label_index_path: Optional[str]) -> None:
+    """
+    Builds the mapping from each target to its classifier categories and
+    writes it to a JSON file.
+    Args:
+        desired_label_spec_json_path: str, path to the desired (target) label
+            specification JSON file
+        classifier_label_spec_json_path: str, path to the label specification
+            JSON file of the trained classifier
+        taxonomy_csv_path: str, path to the taxonomy CSV file
+        output_json_path: str, path to the output JSON file; its parent
+            folder is created if the path has one and it does not exist yet
+        classifier_label_index_path: optional str, path to a JSON dict whose
+            values are the labels actually used by the classifier; entries of
+            the classifier label spec that are not listed there are dropped
+    Raises: ValueError, if the label index contains a label that is not a key
+        of the classifier label spec
+    """
+    print('Reading label spec JSON files')
+    with open(desired_label_spec_json_path, 'r') as f:
+        target_spec = json.load(f)
+    with open(classifier_label_spec_json_path, 'r') as f:
+        classifier_spec = json.load(f)
+    if classifier_label_index_path is not None:
+        with open(classifier_label_index_path, 'r') as f:
+            classifier_labels = set(json.load(f).values())
+        # explicit check rather than assert, which "python -O" strips out
+        unknown_labels = classifier_labels - set(classifier_spec.keys())
+        if unknown_labels:
+            raise ValueError(
+                'Labels in classifier label index are missing from the '
+                f'classifier label spec: {sorted(unknown_labels, key=str)}')
+        if len(classifier_labels) < len(classifier_spec):
+            classifier_spec = {
+                k: v for k, v in classifier_spec.items()
+                if k in classifier_labels
+            }
+    print('Building taxonomy hierarchy')
+    taxonomy_df = pd.read_csv(taxonomy_csv_path)
+    graph, taxon_to_node, label_to_node = build_taxonomy_graph(taxonomy_df)
+    # return value is unused; presumably this modifies the graph in place
+    dag_to_tree(graph, taxon_to_node)
+    print('Mapping label spec to nodes')
+    classifier_label_to_nodes = label_spec_to_nodes(
+        classifier_spec, taxon_to_node, label_to_node)
+    target_label_to_nodes = label_spec_to_nodes(
+        target_spec, taxon_to_node, label_to_node)
+    print('Creating mapping from target to classifier categories')
+    target_to_classifier_labels = map_target_to_classifier(
+        target_label_to_nodes, classifier_label_to_nodes)
+    # os.path.dirname() is '' for a bare file name and os.makedirs('') raises
+    # FileNotFoundError, so only create the folder when the path has one
+    output_dir = os.path.dirname(output_json_path)
+    if output_dir:
+        os.makedirs(output_dir, exist_ok=True)
+    ct_utils.write_json(output_json_path, target_to_classifier_labels)
+#%% Support functions
+def map_target_to_classifier(
+        target_label_to_nodes: Mapping[str, set[TaxonNode]],
+        classifier_label_to_nodes: Mapping[str, set[TaxonNode]]
+        ) -> dict[str, list[str]]:
+    """
+    For each target, if there is any classifier category whose nodes are a
+    subset of the target nodes, then assign the classifier category to that
+    target. Any partial intersection between a target's nodes and a category's
+    nodes is considered an error. Classifier categories that are not assigned
+    to any target are grouped under the "other" target.
+    Args:
+        target_label_to_nodes: dict, maps target to set of nodes,
+            all of the sets of nodes should be disjoint
+        classifier_label_to_nodes: dict, maps classifier label to set of nodes,
+            all of the sets of nodes should be disjoint
+    Returns: dict, maps target label to sorted list of classifier labels
+    Raises: ValueError, if a classifier label only partially overlaps a
+        target, or if a classifier label is a subset of more than one target
+    """
+    remaining_classifier_labels = set(classifier_label_to_nodes)
+    # remembers the target each label was assigned to, so that a second match
+    # is reported clearly instead of failing inside set.remove()
+    label_to_target: dict[str, str] = {}
+    target_to_classifier_labels: defaultdict[str, set[str]] = defaultdict(set)
+    for target, target_nodes in tqdm(target_label_to_nodes.items()):
+        for label, classifier_nodes in classifier_label_to_nodes.items():
+            if classifier_nodes <= target_nodes:
+                if label in label_to_target:
+                    raise ValueError(
+                        f'Classifier label {label} matches both target '
+                        f'{label_to_target[label]} and target {target}')
+                label_to_target[label] = target
+                target_to_classifier_labels[target].add(label)
+                remaining_classifier_labels.discard(label)
+            elif not classifier_nodes.isdisjoint(target_nodes):
+                # some, but not all, of the category's nodes are in the target
+                raise ValueError('Only partial overlap between target '
+                                 f'{target} and classifier label {label}')
+    if remaining_classifier_labels:
+        # merge rather than assign, so labels already mapped to a target that
+        # happens to be named "other" are not silently discarded
+        target_to_classifier_labels['other'] |= remaining_classifier_labels
+    return {
+        target: sorted(labels_set)
+        for target, labels_set in target_to_classifier_labels.items()
+    }
+def parse_spec(spec_dict: Mapping[str, Any],
+               taxon_to_node: dict[tuple[str, str], TaxonNode],
+               label_to_node: dict[tuple[str, str], TaxonNode]
+               ) -> set[TaxonNode]:
+    """
+    Resolves one label specification to the set of taxonomy nodes it selects.
+    Each matched node is included together with all of its descendants in the
+    node's graph; nodes selected by the optional "exclude" sub-specification
+    are then removed.
+    Args:
+        spec_dict: dict, contains keys ['taxa', 'dataset_labels', 'exclude']
+            {
+              "taxa": [
+                {'level': 'family', 'name': 'cervidae', 'datasets': ['idfg']},
+                {'level': 'genus',  'name': 'meleagris'} ],
+              "dataset_labels": { "idfg_swwlf_2019": ["bird"] },
+              "exclude": {...}
+            }
+        taxon_to_node: dict, maps (taxon_level, taxon_name) to a TaxonNode
+        label_to_node: dict, maps (dataset_name, dataset_label) to the lowest
+            TaxonNode node in the tree that contains the label
+    Returns: set of TaxonNode, nodes selected by the taxa spec
+    Raises:
+        KeyError, if a (dataset_name, dataset_label) pair from
+            "dataset_labels" is not in label_to_node
+        ValueError, if the specification (or its "exclude" sub-specification)
+            matches no TaxonNode
+    """
+    result: set[TaxonNode] = set()
+    for taxon in spec_dict.get('taxa', ()):
+        # taxonomy keys are matched case-insensitively
+        key = (taxon['level'].lower(), taxon['name'].lower())
+        node = taxon_to_node.get(key)
+        if node is None:
+            # unknown taxa are reported and skipped, not treated as fatal
+            print(f'Taxon {key} not found in taxonomy graph. Ignoring.')
+            continue
+        result.add(node)
+        result |= nx.descendants(node.graph, node)
+    for ds, ds_labels in spec_dict.get('dataset_labels', {}).items():
+        ds = ds.lower()
+        for ds_label in ds_labels:
+            key = (ds, ds_label.lower())
+            try:
+                node = label_to_node[key]
+            except KeyError:
+                # same exception type as a plain lookup, but say what failed
+                raise KeyError(
+                    f'Dataset label {key} not found in taxonomy graph'
+                ) from None
+            result.add(node)
+            result |= nx.descendants(node.graph, node)
+    if 'exclude' in spec_dict:
+        result -= parse_spec(spec_dict['exclude'], taxon_to_node, label_to_node)
+    if not result:
+        raise ValueError(f'specification matched no TaxonNode: {spec_dict}')
+    return result
+def label_spec_to_nodes(label_spec_js: dict[str, dict[str, Any]],
+                        taxon_to_node: dict[tuple[str, str], TaxonNode],
+                        label_to_node: dict[tuple[str, str], TaxonNode]
+                        ) -> dict[str, set[TaxonNode]]:
+    """
+    Resolves every label of a label specification to its set of taxonomy
+    nodes, checking that no node is claimed by more than one label.
+    Args:
+        label_spec_js: dict, Python dict representation of JSON file
+            see classification/README.md
+        taxon_to_node: dict, maps (taxon_level, taxon_name) to a TaxonNode
+        label_to_node: dict, maps (dataset_name, dataset_label) to the lowest
+            TaxonNode node in the tree that contains the label
+    Returns: dict, maps label name to set of TaxonNode
+    Raises: ValueError, if a classification label specification matches no
+        TaxonNode, or if a node is included in two or more classification labels
+    """
+    # union of all nodes claimed by the labels accepted so far
+    claimed_nodes: set[TaxonNode] = set()
+    nodes_by_label: dict[str, set[TaxonNode]] = {}
+    for label, spec_dict in label_spec_js.items():
+        label_nodes = parse_spec(spec_dict, taxon_to_node, label_to_node)
+        if label_nodes.isdisjoint(claimed_nodes):
+            nodes_by_label[label] = label_nodes
+            claimed_nodes.update(label_nodes)
+            continue
+        # conflict: report the first earlier label that shares nodes
+        for label_b, set_b in nodes_by_label.items():
+            shared = label_nodes & set_b
+            if shared:
+                print(f'Labels {label} and {label_b} share images:', shared)
+                raise ValueError('Intersection between sets!')
+    return nodes_by_label
+#%% Command-line driver
+def _parse_args() -> argparse.Namespace:
+    """
+    Parses the command-line arguments of this script.
+    Returns: argparse.Namespace with attributes desired_label_spec_json,
+        classifier_label_spec_json, taxonomy_csv, output and
+        classifier_label_index (None unless -i is given)
+    """
+    cli = argparse.ArgumentParser(
+        description='Create mapping from target categories to classifier '
+                    'labels.',
+        formatter_class=argparse.ArgumentDefaultsHelpFormatter)
+    add = cli.add_argument
+    # positional arguments, in the order they are expected
+    add('desired_label_spec_json',
+        help='path to JSON file containing desired label specification')
+    add('classifier_label_spec_json',
+        help='path to JSON file containing label specification of a trained '
+             'classifier')
+    add('taxonomy_csv',
+        help='path to taxonomy CSV file')
+    # options
+    add('-o', '--output', required=True,
+        help='path to output JSON')
+    add('-i', '--classifier-label-index',
+        help='(optional) path to label index JSON file for trained classifier, '
+             'needed if not all labels from <classifier_label_spec_json> were '
+             'actually used (e.g., if some labels were filtered out by the '
+             '--min-locs argument for create_classification_dataset.py)')
+    parsed = cli.parse_args()
+    return parsed
+if __name__ == '__main__':
+    # Script entry point: forward the parsed options to main() by keyword.
+    cli_args = _parse_args()
+    main(
+        desired_label_spec_json_path=cli_args.desired_label_spec_json,
+        classifier_label_spec_json_path=cli_args.classifier_label_spec_json,
+        taxonomy_csv_path=cli_args.taxonomy_csv,
+        output_json_path=cli_args.output,
+        classifier_label_index_path=cli_args.classifier_label_index,
+    )