megadetector 5.0.9__py3-none-any.whl → 5.0.11__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of megadetector might be problematic. Click here for more details.

Files changed (226) hide show
  1. {megadetector-5.0.9.dist-info → megadetector-5.0.11.dist-info}/LICENSE +0 -0
  2. {megadetector-5.0.9.dist-info → megadetector-5.0.11.dist-info}/METADATA +12 -11
  3. megadetector-5.0.11.dist-info/RECORD +5 -0
  4. megadetector-5.0.11.dist-info/top_level.txt +1 -0
  5. api/__init__.py +0 -0
  6. api/batch_processing/__init__.py +0 -0
  7. api/batch_processing/api_core/__init__.py +0 -0
  8. api/batch_processing/api_core/batch_service/__init__.py +0 -0
  9. api/batch_processing/api_core/batch_service/score.py +0 -439
  10. api/batch_processing/api_core/server.py +0 -294
  11. api/batch_processing/api_core/server_api_config.py +0 -98
  12. api/batch_processing/api_core/server_app_config.py +0 -55
  13. api/batch_processing/api_core/server_batch_job_manager.py +0 -220
  14. api/batch_processing/api_core/server_job_status_table.py +0 -152
  15. api/batch_processing/api_core/server_orchestration.py +0 -360
  16. api/batch_processing/api_core/server_utils.py +0 -92
  17. api/batch_processing/api_core_support/__init__.py +0 -0
  18. api/batch_processing/api_core_support/aggregate_results_manually.py +0 -46
  19. api/batch_processing/api_support/__init__.py +0 -0
  20. api/batch_processing/api_support/summarize_daily_activity.py +0 -152
  21. api/batch_processing/data_preparation/__init__.py +0 -0
  22. api/batch_processing/data_preparation/manage_local_batch.py +0 -2391
  23. api/batch_processing/data_preparation/manage_video_batch.py +0 -327
  24. api/batch_processing/integration/digiKam/setup.py +0 -6
  25. api/batch_processing/integration/digiKam/xmp_integration.py +0 -465
  26. api/batch_processing/integration/eMammal/test_scripts/config_template.py +0 -5
  27. api/batch_processing/integration/eMammal/test_scripts/push_annotations_to_emammal.py +0 -126
  28. api/batch_processing/integration/eMammal/test_scripts/select_images_for_testing.py +0 -55
  29. api/batch_processing/postprocessing/__init__.py +0 -0
  30. api/batch_processing/postprocessing/add_max_conf.py +0 -64
  31. api/batch_processing/postprocessing/categorize_detections_by_size.py +0 -163
  32. api/batch_processing/postprocessing/combine_api_outputs.py +0 -249
  33. api/batch_processing/postprocessing/compare_batch_results.py +0 -958
  34. api/batch_processing/postprocessing/convert_output_format.py +0 -397
  35. api/batch_processing/postprocessing/load_api_results.py +0 -195
  36. api/batch_processing/postprocessing/md_to_coco.py +0 -310
  37. api/batch_processing/postprocessing/md_to_labelme.py +0 -330
  38. api/batch_processing/postprocessing/merge_detections.py +0 -401
  39. api/batch_processing/postprocessing/postprocess_batch_results.py +0 -1904
  40. api/batch_processing/postprocessing/remap_detection_categories.py +0 -170
  41. api/batch_processing/postprocessing/render_detection_confusion_matrix.py +0 -661
  42. api/batch_processing/postprocessing/repeat_detection_elimination/find_repeat_detections.py +0 -211
  43. api/batch_processing/postprocessing/repeat_detection_elimination/remove_repeat_detections.py +0 -82
  44. api/batch_processing/postprocessing/repeat_detection_elimination/repeat_detections_core.py +0 -1631
  45. api/batch_processing/postprocessing/separate_detections_into_folders.py +0 -731
  46. api/batch_processing/postprocessing/subset_json_detector_output.py +0 -696
  47. api/batch_processing/postprocessing/top_folders_to_bottom.py +0 -223
  48. api/synchronous/__init__.py +0 -0
  49. api/synchronous/api_core/animal_detection_api/__init__.py +0 -0
  50. api/synchronous/api_core/animal_detection_api/api_backend.py +0 -152
  51. api/synchronous/api_core/animal_detection_api/api_frontend.py +0 -266
  52. api/synchronous/api_core/animal_detection_api/config.py +0 -35
  53. api/synchronous/api_core/animal_detection_api/data_management/annotations/annotation_constants.py +0 -47
  54. api/synchronous/api_core/animal_detection_api/detection/detector_training/copy_checkpoints.py +0 -43
  55. api/synchronous/api_core/animal_detection_api/detection/detector_training/model_main_tf2.py +0 -114
  56. api/synchronous/api_core/animal_detection_api/detection/process_video.py +0 -543
  57. api/synchronous/api_core/animal_detection_api/detection/pytorch_detector.py +0 -304
  58. api/synchronous/api_core/animal_detection_api/detection/run_detector.py +0 -627
  59. api/synchronous/api_core/animal_detection_api/detection/run_detector_batch.py +0 -1029
  60. api/synchronous/api_core/animal_detection_api/detection/run_inference_with_yolov5_val.py +0 -581
  61. api/synchronous/api_core/animal_detection_api/detection/run_tiled_inference.py +0 -754
  62. api/synchronous/api_core/animal_detection_api/detection/tf_detector.py +0 -165
  63. api/synchronous/api_core/animal_detection_api/detection/video_utils.py +0 -495
  64. api/synchronous/api_core/animal_detection_api/md_utils/azure_utils.py +0 -174
  65. api/synchronous/api_core/animal_detection_api/md_utils/ct_utils.py +0 -262
  66. api/synchronous/api_core/animal_detection_api/md_utils/directory_listing.py +0 -251
  67. api/synchronous/api_core/animal_detection_api/md_utils/matlab_porting_tools.py +0 -97
  68. api/synchronous/api_core/animal_detection_api/md_utils/path_utils.py +0 -416
  69. api/synchronous/api_core/animal_detection_api/md_utils/process_utils.py +0 -110
  70. api/synchronous/api_core/animal_detection_api/md_utils/sas_blob_utils.py +0 -509
  71. api/synchronous/api_core/animal_detection_api/md_utils/string_utils.py +0 -59
  72. api/synchronous/api_core/animal_detection_api/md_utils/url_utils.py +0 -144
  73. api/synchronous/api_core/animal_detection_api/md_utils/write_html_image_list.py +0 -226
  74. api/synchronous/api_core/animal_detection_api/md_visualization/visualization_utils.py +0 -841
  75. api/synchronous/api_core/tests/__init__.py +0 -0
  76. api/synchronous/api_core/tests/load_test.py +0 -110
  77. classification/__init__.py +0 -0
  78. classification/aggregate_classifier_probs.py +0 -108
  79. classification/analyze_failed_images.py +0 -227
  80. classification/cache_batchapi_outputs.py +0 -198
  81. classification/create_classification_dataset.py +0 -627
  82. classification/crop_detections.py +0 -516
  83. classification/csv_to_json.py +0 -226
  84. classification/detect_and_crop.py +0 -855
  85. classification/efficientnet/__init__.py +0 -9
  86. classification/efficientnet/model.py +0 -415
  87. classification/efficientnet/utils.py +0 -610
  88. classification/evaluate_model.py +0 -520
  89. classification/identify_mislabeled_candidates.py +0 -152
  90. classification/json_to_azcopy_list.py +0 -63
  91. classification/json_validator.py +0 -695
  92. classification/map_classification_categories.py +0 -276
  93. classification/merge_classification_detection_output.py +0 -506
  94. classification/prepare_classification_script.py +0 -194
  95. classification/prepare_classification_script_mc.py +0 -228
  96. classification/run_classifier.py +0 -286
  97. classification/save_mislabeled.py +0 -110
  98. classification/train_classifier.py +0 -825
  99. classification/train_classifier_tf.py +0 -724
  100. classification/train_utils.py +0 -322
  101. data_management/__init__.py +0 -0
  102. data_management/annotations/__init__.py +0 -0
  103. data_management/annotations/annotation_constants.py +0 -34
  104. data_management/camtrap_dp_to_coco.py +0 -238
  105. data_management/cct_json_utils.py +0 -395
  106. data_management/cct_to_md.py +0 -176
  107. data_management/cct_to_wi.py +0 -289
  108. data_management/coco_to_labelme.py +0 -272
  109. data_management/coco_to_yolo.py +0 -662
  110. data_management/databases/__init__.py +0 -0
  111. data_management/databases/add_width_and_height_to_db.py +0 -33
  112. data_management/databases/combine_coco_camera_traps_files.py +0 -206
  113. data_management/databases/integrity_check_json_db.py +0 -477
  114. data_management/databases/subset_json_db.py +0 -115
  115. data_management/generate_crops_from_cct.py +0 -149
  116. data_management/get_image_sizes.py +0 -188
  117. data_management/importers/add_nacti_sizes.py +0 -52
  118. data_management/importers/add_timestamps_to_icct.py +0 -79
  119. data_management/importers/animl_results_to_md_results.py +0 -158
  120. data_management/importers/auckland_doc_test_to_json.py +0 -372
  121. data_management/importers/auckland_doc_to_json.py +0 -200
  122. data_management/importers/awc_to_json.py +0 -189
  123. data_management/importers/bellevue_to_json.py +0 -273
  124. data_management/importers/cacophony-thermal-importer.py +0 -796
  125. data_management/importers/carrizo_shrubfree_2018.py +0 -268
  126. data_management/importers/carrizo_trail_cam_2017.py +0 -287
  127. data_management/importers/cct_field_adjustments.py +0 -57
  128. data_management/importers/channel_islands_to_cct.py +0 -913
  129. data_management/importers/eMammal/copy_and_unzip_emammal.py +0 -180
  130. data_management/importers/eMammal/eMammal_helpers.py +0 -249
  131. data_management/importers/eMammal/make_eMammal_json.py +0 -223
  132. data_management/importers/ena24_to_json.py +0 -275
  133. data_management/importers/filenames_to_json.py +0 -385
  134. data_management/importers/helena_to_cct.py +0 -282
  135. data_management/importers/idaho-camera-traps.py +0 -1407
  136. data_management/importers/idfg_iwildcam_lila_prep.py +0 -294
  137. data_management/importers/jb_csv_to_json.py +0 -150
  138. data_management/importers/mcgill_to_json.py +0 -250
  139. data_management/importers/missouri_to_json.py +0 -489
  140. data_management/importers/nacti_fieldname_adjustments.py +0 -79
  141. data_management/importers/noaa_seals_2019.py +0 -181
  142. data_management/importers/pc_to_json.py +0 -365
  143. data_management/importers/plot_wni_giraffes.py +0 -123
  144. data_management/importers/prepare-noaa-fish-data-for-lila.py +0 -359
  145. data_management/importers/prepare_zsl_imerit.py +0 -131
  146. data_management/importers/rspb_to_json.py +0 -356
  147. data_management/importers/save_the_elephants_survey_A.py +0 -320
  148. data_management/importers/save_the_elephants_survey_B.py +0 -332
  149. data_management/importers/snapshot_safari_importer.py +0 -758
  150. data_management/importers/snapshot_safari_importer_reprise.py +0 -665
  151. data_management/importers/snapshot_serengeti_lila.py +0 -1067
  152. data_management/importers/snapshotserengeti/make_full_SS_json.py +0 -150
  153. data_management/importers/snapshotserengeti/make_per_season_SS_json.py +0 -153
  154. data_management/importers/sulross_get_exif.py +0 -65
  155. data_management/importers/timelapse_csv_set_to_json.py +0 -490
  156. data_management/importers/ubc_to_json.py +0 -399
  157. data_management/importers/umn_to_json.py +0 -507
  158. data_management/importers/wellington_to_json.py +0 -263
  159. data_management/importers/wi_to_json.py +0 -441
  160. data_management/importers/zamba_results_to_md_results.py +0 -181
  161. data_management/labelme_to_coco.py +0 -548
  162. data_management/labelme_to_yolo.py +0 -272
  163. data_management/lila/__init__.py +0 -0
  164. data_management/lila/add_locations_to_island_camera_traps.py +0 -97
  165. data_management/lila/add_locations_to_nacti.py +0 -147
  166. data_management/lila/create_lila_blank_set.py +0 -557
  167. data_management/lila/create_lila_test_set.py +0 -151
  168. data_management/lila/create_links_to_md_results_files.py +0 -106
  169. data_management/lila/download_lila_subset.py +0 -177
  170. data_management/lila/generate_lila_per_image_labels.py +0 -515
  171. data_management/lila/get_lila_annotation_counts.py +0 -170
  172. data_management/lila/get_lila_image_counts.py +0 -111
  173. data_management/lila/lila_common.py +0 -300
  174. data_management/lila/test_lila_metadata_urls.py +0 -132
  175. data_management/ocr_tools.py +0 -874
  176. data_management/read_exif.py +0 -681
  177. data_management/remap_coco_categories.py +0 -84
  178. data_management/remove_exif.py +0 -66
  179. data_management/resize_coco_dataset.py +0 -189
  180. data_management/wi_download_csv_to_coco.py +0 -246
  181. data_management/yolo_output_to_md_output.py +0 -441
  182. data_management/yolo_to_coco.py +0 -676
  183. detection/__init__.py +0 -0
  184. detection/detector_training/__init__.py +0 -0
  185. detection/detector_training/model_main_tf2.py +0 -114
  186. detection/process_video.py +0 -703
  187. detection/pytorch_detector.py +0 -337
  188. detection/run_detector.py +0 -779
  189. detection/run_detector_batch.py +0 -1219
  190. detection/run_inference_with_yolov5_val.py +0 -917
  191. detection/run_tiled_inference.py +0 -935
  192. detection/tf_detector.py +0 -188
  193. detection/video_utils.py +0 -606
  194. docs/source/conf.py +0 -43
  195. md_utils/__init__.py +0 -0
  196. md_utils/azure_utils.py +0 -174
  197. md_utils/ct_utils.py +0 -612
  198. md_utils/directory_listing.py +0 -246
  199. md_utils/md_tests.py +0 -968
  200. md_utils/path_utils.py +0 -1044
  201. md_utils/process_utils.py +0 -157
  202. md_utils/sas_blob_utils.py +0 -509
  203. md_utils/split_locations_into_train_val.py +0 -228
  204. md_utils/string_utils.py +0 -92
  205. md_utils/url_utils.py +0 -323
  206. md_utils/write_html_image_list.py +0 -225
  207. md_visualization/__init__.py +0 -0
  208. md_visualization/plot_utils.py +0 -293
  209. md_visualization/render_images_with_thumbnails.py +0 -275
  210. md_visualization/visualization_utils.py +0 -1537
  211. md_visualization/visualize_db.py +0 -551
  212. md_visualization/visualize_detector_output.py +0 -406
  213. megadetector-5.0.9.dist-info/RECORD +0 -224
  214. megadetector-5.0.9.dist-info/top_level.txt +0 -8
  215. taxonomy_mapping/__init__.py +0 -0
  216. taxonomy_mapping/map_lila_taxonomy_to_wi_taxonomy.py +0 -491
  217. taxonomy_mapping/map_new_lila_datasets.py +0 -154
  218. taxonomy_mapping/prepare_lila_taxonomy_release.py +0 -142
  219. taxonomy_mapping/preview_lila_taxonomy.py +0 -591
  220. taxonomy_mapping/retrieve_sample_image.py +0 -71
  221. taxonomy_mapping/simple_image_download.py +0 -218
  222. taxonomy_mapping/species_lookup.py +0 -834
  223. taxonomy_mapping/taxonomy_csv_checker.py +0 -159
  224. taxonomy_mapping/taxonomy_graph.py +0 -346
  225. taxonomy_mapping/validate_lila_category_mappings.py +0 -83
  226. {megadetector-5.0.9.dist-info → megadetector-5.0.11.dist-info}/WHEEL +0 -0
@@ -1,276 +0,0 @@
1
- """
2
-
3
- map_classification_categories.py
4
-
5
- Maps a classifier's output categories to desired target categories.
6
-
7
- In this file, we use the following terminology:
8
- * "category": a category output by the classifier
9
- * "target": name of a desired group, comprising >= 1 classifier categories
10
-
11
- Takes as input 2 label specification JSON files:
12
-
13
- 1) desired label specification JSON file
14
- this should not have a target named "other"
15
-
16
- 2) label specification JSON file of trained classifier
17
-
18
- The mapping is accomplished as follows:
19
-
20
- 1. For each category in the classifier label spec, find all taxon nodes that
21
- belong to that category.
22
-
23
- 2. Given a target in the desired label spec, find all taxon nodes that belong
24
- to that target. If there is any classifier category whose nodes are a
25
- subset of the target nodes, then map the classifier category to that target.
26
- Any partial intersection between a target's nodes and a category's nodes
27
- is considered an error.
28
-
29
- 3. If there are any classifier categories that have not yet been assigned a
30
- target, group them into the "other" target.
31
-
32
- This script outputs a JSON file that maps each target to a list of classifier
33
- categories.
34
-
35
- The taxonomy mapping parts of this script are very similar to json_validator.py.
36
-
37
- """
38
-
39
- #%% Imports
40
-
41
- from __future__ import annotations
42
-
43
- import argparse
44
- import json
45
- import os
46
-
47
- from collections import defaultdict
48
- from collections.abc import Mapping
49
- from typing import Any, Optional
50
-
51
- import networkx as nx
52
- import pandas as pd
53
- from tqdm import tqdm
54
-
55
- from taxonomy_mapping.taxonomy_graph import (
56
- build_taxonomy_graph, dag_to_tree, TaxonNode)
57
-
58
-
59
- #%% Example usage
60
-
61
- """
62
- python map_classification_categories.py \
63
- desired_label_spec.json \
64
- /path/to/classifier/label_spec.json \
65
- $HOME/camera-traps-private/camera_trap_taxonomy_mapping.csv
66
- """
67
-
68
-
69
- #%% Main function
70
-
71
def main(desired_label_spec_json_path: str,
         classifier_label_spec_json_path: str,
         taxonomy_csv_path: str,
         output_json_path: str,
         classifier_label_index_path: Optional[str]) -> None:
    """
    Build the mapping from target categories to classifier categories and
    write it to a JSON file.

    Args:
        desired_label_spec_json_path: str, path to the desired (target) label
            specification JSON file
        classifier_label_spec_json_path: str, path to the label specification
            JSON file of the trained classifier
        taxonomy_csv_path: str, path to the taxonomy CSV file
        output_json_path: str, path of the JSON file to write; a missing
            parent folder is created
        classifier_label_index_path: optional str, path to a label index JSON
            file; when given, only the classifier labels found among its
            values are kept from the classifier label spec

    Raises: AssertionError, if the label index contains a label that is not
        present in the classifier label spec
    """

    print('Reading label spec JSON files')
    with open(desired_label_spec_json_path, 'r') as f:
        target_spec = json.load(f)
    with open(classifier_label_spec_json_path, 'r') as f:
        classifier_spec = json.load(f)

    if classifier_label_index_path is not None:
        with open(classifier_label_index_path, 'r') as f:
            classifier_labels = set(json.load(f).values())
        assert classifier_labels <= set(classifier_spec.keys()), (
            'label index contains labels missing from the classifier label '
            f'spec: {sorted(classifier_labels - set(classifier_spec.keys()))}')
        # only restrict the spec if the index actually dropped some labels
        if len(classifier_labels) < len(classifier_spec):
            classifier_spec = {
                k: v for k, v in classifier_spec.items()
                if k in classifier_labels
            }

    print('Building taxonomy hierarchy')
    taxonomy_df = pd.read_csv(taxonomy_csv_path)
    graph, taxon_to_node, label_to_node = build_taxonomy_graph(taxonomy_df)
    dag_to_tree(graph, taxon_to_node)

    print('Mapping label spec to nodes')
    classifier_label_to_nodes = label_spec_to_nodes(
        classifier_spec, taxon_to_node, label_to_node)
    target_label_to_nodes = label_spec_to_nodes(
        target_spec, taxon_to_node, label_to_node)

    print('Creating mapping from target to classifier categories')
    target_to_classifier_labels = map_target_to_classifier(
        target_label_to_nodes, classifier_label_to_nodes)

    # os.path.dirname() returns '' for a bare filename, and os.makedirs('')
    # raises FileNotFoundError, so only create the folder when there is one
    output_dir = os.path.dirname(output_json_path)
    if output_dir:
        os.makedirs(output_dir, exist_ok=True)
    with open(output_json_path, 'w') as f:
        json.dump(target_to_classifier_labels, f, indent=1)
110
-
111
-
112
- #%% Support functions
113
-
114
def map_target_to_classifier(
        target_label_to_nodes: Mapping[str, set[TaxonNode]],
        classifier_label_to_nodes: Mapping[str, set[TaxonNode]]
        ) -> dict[str, list[str]]:
    """
    For each target, if there is any classifier category whose nodes are a
    subset of the target nodes, then assign the classifier category to that
    target. Any partial intersection between a target's nodes and a category's
    nodes is considered an error.

    Classifier categories that were not assigned to any target are collected
    under the "other" target. If the targets already contain one named
    "other", the leftover categories are added to it rather than replacing
    the categories it matched.

    Args:
        target_label_to_nodes: dict, maps target to set of nodes,
            all of the sets of nodes should be disjoint
        classifier_label_to_nodes: dict, maps classifier label to set of nodes,
            all of the sets of nodes should be disjoint

    Returns: dict, maps target label to a sorted list of classifier labels

    Raises: ValueError, if a classifier label only partially overlaps a
        target, or if a classifier label fits more than one target
    """

    # classifier label -> the single target it has been assigned to
    label_to_target: dict[str, str] = {}
    target_to_classifier_labels: defaultdict[str, set[str]] = defaultdict(set)
    for target, target_nodes in tqdm(target_label_to_nodes.items()):
        for label, classifier_nodes in classifier_label_to_nodes.items():
            overlap = classifier_nodes & target_nodes
            if len(overlap) == len(classifier_nodes):
                # A label can only fit two targets if the targets overlap or
                # the label has no nodes; report that instead of failing with
                # a bare KeyError from set.remove().
                if label in label_to_target:
                    raise ValueError(
                        f'Classifier label {label} matches more than one '
                        f'target: {label_to_target[label]} and {target}')
                label_to_target[label] = target
                target_to_classifier_labels[target].add(label)
            elif overlap:  # non-empty, but smaller than classifier_nodes
                raise ValueError('Only partial overlap between target '
                                 f'{target} and classifier label {label}')

    remaining_classifier_labels = (
        set(classifier_label_to_nodes.keys()) - set(label_to_target))
    if remaining_classifier_labels:
        # merge instead of assign, so labels already matched to a target
        # named "other" are not silently dropped
        target_to_classifier_labels['other'] |= remaining_classifier_labels

    return {
        target: sorted(labels_set)
        for target, labels_set in target_to_classifier_labels.items()
    }
151
-
152
-
153
def parse_spec(spec_dict: Mapping[str, Any],
               taxon_to_node: dict[tuple[str, str], TaxonNode],
               label_to_node: dict[tuple[str, str], TaxonNode]
               ) -> set[TaxonNode]:
    """
    Resolve a single label specification into the set of taxonomy nodes that
    it selects.

    Every taxon and dataset label named in the spec contributes its node plus
    all descendants of that node. Nodes selected by the optional "exclude"
    sub-spec (parsed recursively with this same function) are then removed.

    Args:
        spec_dict: dict, contains keys ['taxa', 'dataset_labels', 'exclude']
            {
                "taxa": [
                    {'level': 'family', 'name': 'cervidae', 'datasets': ['idfg']},
                    {'level': 'genus', 'name': 'meleagris'} ],
                "dataset_labels": { "idfg_swwlf_2019": ["bird"] },
                "exclude": {...}
            }
        taxon_to_node: dict, maps (taxon_level, taxon_name) to a TaxonNode
        label_to_node: dict, maps (dataset_name, dataset_label) to the lowest
            TaxonNode node in the tree that contains the label

    Returns: set of TaxonNode, nodes selected by the spec

    Raises:
        ValueError, if the spec (after exclusions) selects no node at all
        KeyError, if a (dataset, label) pair is missing from label_to_node;
            unknown taxa, in contrast, are only reported and skipped
    """

    def _subtree(root):
        # the node itself together with everything below it in its graph
        return {root} | nx.descendants(root.graph, root)

    selected = set()

    for taxon in spec_dict.get('taxa', ()):
        key = (taxon['level'].lower(), taxon['name'].lower())
        if key not in taxon_to_node:
            print(f'Taxon {key} not found in taxonomy graph. Ignoring.')
            continue
        selected |= _subtree(taxon_to_node[key])

    for ds, ds_labels in spec_dict.get('dataset_labels', {}).items():
        ds = ds.lower()
        for ds_label in ds_labels:
            selected |= _subtree(label_to_node[(ds, ds_label.lower())])

    if 'exclude' in spec_dict:
        excluded = parse_spec(
            spec_dict['exclude'], taxon_to_node, label_to_node)
        selected -= excluded

    if not selected:
        raise ValueError(f'specification matched no TaxonNode: {spec_dict}')
    return selected
198
-
199
-
200
def label_spec_to_nodes(label_spec_js: dict[str, dict[str, Any]],
                        taxon_to_node: dict[tuple[str, str], TaxonNode],
                        label_to_node: dict[tuple[str, str], TaxonNode]
                        ) -> dict[str, set[TaxonNode]]:
    """
    Turn a label specification into a dict from each classification label to
    the set of taxonomy nodes selected by that label's spec.

    Labels are processed in the order they appear in the spec. The first
    label whose nodes overlap the nodes of any earlier label aborts the
    conversion, after every earlier label it overlaps has been printed.

    Args:
        label_spec_js: dict, Python dict representation of JSON file
            see classification/README.md
        taxon_to_node: dict, maps (taxon_level, taxon_name) to a TaxonNode
        label_to_node: dict, maps (dataset_name, dataset_label) to the lowest
            TaxonNode node in the tree that contains the label

    Returns: dict, maps label name to set of TaxonNode

    Raises: ValueError, if a classification label specification matches no
        TaxonNode, or if a node is included in two or more classification labels
    """

    # every node already claimed by one of the labels accepted so far
    seen_nodes: set[TaxonNode] = set()
    label_to_nodes: dict[str, set[TaxonNode]] = {}

    for label, spec_dict in label_spec_js.items():
        include_set = parse_spec(spec_dict, taxon_to_node, label_to_node)

        if not include_set.isdisjoint(seen_nodes):
            # report each earlier label (label_b) that this one collides with
            for label_b, set_b in label_to_nodes.items():
                shared = include_set & set_b
                if shared:
                    print(f'Labels {label} and {label_b} share images:', shared)
            raise ValueError('Intersection between sets!')

        label_to_nodes[label] = include_set
        seen_nodes.update(include_set)

    return label_to_nodes
237
-
238
-
239
- #%% Command-line driver
240
-
241
- def _parse_args() -> argparse.Namespace:
242
-
243
- parser = argparse.ArgumentParser(
244
- formatter_class=argparse.ArgumentDefaultsHelpFormatter,
245
- description='Create mapping from target categories to classifier '
246
- 'labels.')
247
- parser.add_argument(
248
- 'desired_label_spec_json',
249
- help='path to JSON file containing desired label specification')
250
- parser.add_argument(
251
- 'classifier_label_spec_json',
252
- help='path to JSON file containing label specification of a trained '
253
- 'classifier')
254
- parser.add_argument(
255
- 'taxonomy_csv',
256
- help='path to taxonomy CSV file')
257
- parser.add_argument(
258
- '-o', '--output', required=True,
259
- help='path to output JSON')
260
- parser.add_argument(
261
- '-i', '--classifier-label-index',
262
- help='(optional) path to label index JSON file for trained classifier, '
263
- 'needed if not all labels from <classifier_label_spec_json> were '
264
- 'actually used (e.g., if some labels were filtered out by the '
265
- '--min-locs argument for create_classification_dataset.py)')
266
- return parser.parse_args()
267
-
268
-
269
if __name__ == '__main__':

    # Script entry point: forward the parsed command-line options to main()
    cli_args = _parse_args()
    main(
        desired_label_spec_json_path=cli_args.desired_label_spec_json,
        classifier_label_spec_json_path=cli_args.classifier_label_spec_json,
        taxonomy_csv_path=cli_args.taxonomy_csv,
        output_json_path=cli_args.output,
        classifier_label_index_path=cli_args.classifier_label_index,
    )