megadetector 5.0.10__py3-none-any.whl → 5.0.11__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of megadetector might be problematic; see the advisory page on the package registry for more details.

Files changed (226)
  1. {megadetector-5.0.10.dist-info → megadetector-5.0.11.dist-info}/LICENSE +0 -0
  2. {megadetector-5.0.10.dist-info → megadetector-5.0.11.dist-info}/METADATA +12 -11
  3. megadetector-5.0.11.dist-info/RECORD +5 -0
  4. megadetector-5.0.11.dist-info/top_level.txt +1 -0
  5. api/__init__.py +0 -0
  6. api/batch_processing/__init__.py +0 -0
  7. api/batch_processing/api_core/__init__.py +0 -0
  8. api/batch_processing/api_core/batch_service/__init__.py +0 -0
  9. api/batch_processing/api_core/batch_service/score.py +0 -439
  10. api/batch_processing/api_core/server.py +0 -294
  11. api/batch_processing/api_core/server_api_config.py +0 -98
  12. api/batch_processing/api_core/server_app_config.py +0 -55
  13. api/batch_processing/api_core/server_batch_job_manager.py +0 -220
  14. api/batch_processing/api_core/server_job_status_table.py +0 -152
  15. api/batch_processing/api_core/server_orchestration.py +0 -360
  16. api/batch_processing/api_core/server_utils.py +0 -92
  17. api/batch_processing/api_core_support/__init__.py +0 -0
  18. api/batch_processing/api_core_support/aggregate_results_manually.py +0 -46
  19. api/batch_processing/api_support/__init__.py +0 -0
  20. api/batch_processing/api_support/summarize_daily_activity.py +0 -152
  21. api/batch_processing/data_preparation/__init__.py +0 -0
  22. api/batch_processing/data_preparation/manage_local_batch.py +0 -2391
  23. api/batch_processing/data_preparation/manage_video_batch.py +0 -327
  24. api/batch_processing/integration/digiKam/setup.py +0 -6
  25. api/batch_processing/integration/digiKam/xmp_integration.py +0 -465
  26. api/batch_processing/integration/eMammal/test_scripts/config_template.py +0 -5
  27. api/batch_processing/integration/eMammal/test_scripts/push_annotations_to_emammal.py +0 -126
  28. api/batch_processing/integration/eMammal/test_scripts/select_images_for_testing.py +0 -55
  29. api/batch_processing/postprocessing/__init__.py +0 -0
  30. api/batch_processing/postprocessing/add_max_conf.py +0 -64
  31. api/batch_processing/postprocessing/categorize_detections_by_size.py +0 -163
  32. api/batch_processing/postprocessing/combine_api_outputs.py +0 -249
  33. api/batch_processing/postprocessing/compare_batch_results.py +0 -958
  34. api/batch_processing/postprocessing/convert_output_format.py +0 -397
  35. api/batch_processing/postprocessing/load_api_results.py +0 -195
  36. api/batch_processing/postprocessing/md_to_coco.py +0 -310
  37. api/batch_processing/postprocessing/md_to_labelme.py +0 -330
  38. api/batch_processing/postprocessing/merge_detections.py +0 -401
  39. api/batch_processing/postprocessing/postprocess_batch_results.py +0 -1904
  40. api/batch_processing/postprocessing/remap_detection_categories.py +0 -170
  41. api/batch_processing/postprocessing/render_detection_confusion_matrix.py +0 -661
  42. api/batch_processing/postprocessing/repeat_detection_elimination/find_repeat_detections.py +0 -211
  43. api/batch_processing/postprocessing/repeat_detection_elimination/remove_repeat_detections.py +0 -82
  44. api/batch_processing/postprocessing/repeat_detection_elimination/repeat_detections_core.py +0 -1631
  45. api/batch_processing/postprocessing/separate_detections_into_folders.py +0 -731
  46. api/batch_processing/postprocessing/subset_json_detector_output.py +0 -696
  47. api/batch_processing/postprocessing/top_folders_to_bottom.py +0 -223
  48. api/synchronous/__init__.py +0 -0
  49. api/synchronous/api_core/animal_detection_api/__init__.py +0 -0
  50. api/synchronous/api_core/animal_detection_api/api_backend.py +0 -152
  51. api/synchronous/api_core/animal_detection_api/api_frontend.py +0 -266
  52. api/synchronous/api_core/animal_detection_api/config.py +0 -35
  53. api/synchronous/api_core/animal_detection_api/data_management/annotations/annotation_constants.py +0 -47
  54. api/synchronous/api_core/animal_detection_api/detection/detector_training/copy_checkpoints.py +0 -43
  55. api/synchronous/api_core/animal_detection_api/detection/detector_training/model_main_tf2.py +0 -114
  56. api/synchronous/api_core/animal_detection_api/detection/process_video.py +0 -543
  57. api/synchronous/api_core/animal_detection_api/detection/pytorch_detector.py +0 -304
  58. api/synchronous/api_core/animal_detection_api/detection/run_detector.py +0 -627
  59. api/synchronous/api_core/animal_detection_api/detection/run_detector_batch.py +0 -1029
  60. api/synchronous/api_core/animal_detection_api/detection/run_inference_with_yolov5_val.py +0 -581
  61. api/synchronous/api_core/animal_detection_api/detection/run_tiled_inference.py +0 -754
  62. api/synchronous/api_core/animal_detection_api/detection/tf_detector.py +0 -165
  63. api/synchronous/api_core/animal_detection_api/detection/video_utils.py +0 -495
  64. api/synchronous/api_core/animal_detection_api/md_utils/azure_utils.py +0 -174
  65. api/synchronous/api_core/animal_detection_api/md_utils/ct_utils.py +0 -262
  66. api/synchronous/api_core/animal_detection_api/md_utils/directory_listing.py +0 -251
  67. api/synchronous/api_core/animal_detection_api/md_utils/matlab_porting_tools.py +0 -97
  68. api/synchronous/api_core/animal_detection_api/md_utils/path_utils.py +0 -416
  69. api/synchronous/api_core/animal_detection_api/md_utils/process_utils.py +0 -110
  70. api/synchronous/api_core/animal_detection_api/md_utils/sas_blob_utils.py +0 -509
  71. api/synchronous/api_core/animal_detection_api/md_utils/string_utils.py +0 -59
  72. api/synchronous/api_core/animal_detection_api/md_utils/url_utils.py +0 -144
  73. api/synchronous/api_core/animal_detection_api/md_utils/write_html_image_list.py +0 -226
  74. api/synchronous/api_core/animal_detection_api/md_visualization/visualization_utils.py +0 -841
  75. api/synchronous/api_core/tests/__init__.py +0 -0
  76. api/synchronous/api_core/tests/load_test.py +0 -110
  77. classification/__init__.py +0 -0
  78. classification/aggregate_classifier_probs.py +0 -108
  79. classification/analyze_failed_images.py +0 -227
  80. classification/cache_batchapi_outputs.py +0 -198
  81. classification/create_classification_dataset.py +0 -627
  82. classification/crop_detections.py +0 -516
  83. classification/csv_to_json.py +0 -226
  84. classification/detect_and_crop.py +0 -855
  85. classification/efficientnet/__init__.py +0 -9
  86. classification/efficientnet/model.py +0 -415
  87. classification/efficientnet/utils.py +0 -610
  88. classification/evaluate_model.py +0 -520
  89. classification/identify_mislabeled_candidates.py +0 -152
  90. classification/json_to_azcopy_list.py +0 -63
  91. classification/json_validator.py +0 -695
  92. classification/map_classification_categories.py +0 -276
  93. classification/merge_classification_detection_output.py +0 -506
  94. classification/prepare_classification_script.py +0 -194
  95. classification/prepare_classification_script_mc.py +0 -228
  96. classification/run_classifier.py +0 -286
  97. classification/save_mislabeled.py +0 -110
  98. classification/train_classifier.py +0 -825
  99. classification/train_classifier_tf.py +0 -724
  100. classification/train_utils.py +0 -322
  101. data_management/__init__.py +0 -0
  102. data_management/annotations/__init__.py +0 -0
  103. data_management/annotations/annotation_constants.py +0 -34
  104. data_management/camtrap_dp_to_coco.py +0 -238
  105. data_management/cct_json_utils.py +0 -395
  106. data_management/cct_to_md.py +0 -176
  107. data_management/cct_to_wi.py +0 -289
  108. data_management/coco_to_labelme.py +0 -272
  109. data_management/coco_to_yolo.py +0 -662
  110. data_management/databases/__init__.py +0 -0
  111. data_management/databases/add_width_and_height_to_db.py +0 -33
  112. data_management/databases/combine_coco_camera_traps_files.py +0 -206
  113. data_management/databases/integrity_check_json_db.py +0 -477
  114. data_management/databases/subset_json_db.py +0 -115
  115. data_management/generate_crops_from_cct.py +0 -149
  116. data_management/get_image_sizes.py +0 -188
  117. data_management/importers/add_nacti_sizes.py +0 -52
  118. data_management/importers/add_timestamps_to_icct.py +0 -79
  119. data_management/importers/animl_results_to_md_results.py +0 -158
  120. data_management/importers/auckland_doc_test_to_json.py +0 -372
  121. data_management/importers/auckland_doc_to_json.py +0 -200
  122. data_management/importers/awc_to_json.py +0 -189
  123. data_management/importers/bellevue_to_json.py +0 -273
  124. data_management/importers/cacophony-thermal-importer.py +0 -796
  125. data_management/importers/carrizo_shrubfree_2018.py +0 -268
  126. data_management/importers/carrizo_trail_cam_2017.py +0 -287
  127. data_management/importers/cct_field_adjustments.py +0 -57
  128. data_management/importers/channel_islands_to_cct.py +0 -913
  129. data_management/importers/eMammal/copy_and_unzip_emammal.py +0 -180
  130. data_management/importers/eMammal/eMammal_helpers.py +0 -249
  131. data_management/importers/eMammal/make_eMammal_json.py +0 -223
  132. data_management/importers/ena24_to_json.py +0 -275
  133. data_management/importers/filenames_to_json.py +0 -385
  134. data_management/importers/helena_to_cct.py +0 -282
  135. data_management/importers/idaho-camera-traps.py +0 -1407
  136. data_management/importers/idfg_iwildcam_lila_prep.py +0 -294
  137. data_management/importers/jb_csv_to_json.py +0 -150
  138. data_management/importers/mcgill_to_json.py +0 -250
  139. data_management/importers/missouri_to_json.py +0 -489
  140. data_management/importers/nacti_fieldname_adjustments.py +0 -79
  141. data_management/importers/noaa_seals_2019.py +0 -181
  142. data_management/importers/pc_to_json.py +0 -365
  143. data_management/importers/plot_wni_giraffes.py +0 -123
  144. data_management/importers/prepare-noaa-fish-data-for-lila.py +0 -359
  145. data_management/importers/prepare_zsl_imerit.py +0 -131
  146. data_management/importers/rspb_to_json.py +0 -356
  147. data_management/importers/save_the_elephants_survey_A.py +0 -320
  148. data_management/importers/save_the_elephants_survey_B.py +0 -332
  149. data_management/importers/snapshot_safari_importer.py +0 -758
  150. data_management/importers/snapshot_safari_importer_reprise.py +0 -665
  151. data_management/importers/snapshot_serengeti_lila.py +0 -1067
  152. data_management/importers/snapshotserengeti/make_full_SS_json.py +0 -150
  153. data_management/importers/snapshotserengeti/make_per_season_SS_json.py +0 -153
  154. data_management/importers/sulross_get_exif.py +0 -65
  155. data_management/importers/timelapse_csv_set_to_json.py +0 -490
  156. data_management/importers/ubc_to_json.py +0 -399
  157. data_management/importers/umn_to_json.py +0 -507
  158. data_management/importers/wellington_to_json.py +0 -263
  159. data_management/importers/wi_to_json.py +0 -441
  160. data_management/importers/zamba_results_to_md_results.py +0 -181
  161. data_management/labelme_to_coco.py +0 -548
  162. data_management/labelme_to_yolo.py +0 -272
  163. data_management/lila/__init__.py +0 -0
  164. data_management/lila/add_locations_to_island_camera_traps.py +0 -97
  165. data_management/lila/add_locations_to_nacti.py +0 -147
  166. data_management/lila/create_lila_blank_set.py +0 -557
  167. data_management/lila/create_lila_test_set.py +0 -151
  168. data_management/lila/create_links_to_md_results_files.py +0 -106
  169. data_management/lila/download_lila_subset.py +0 -177
  170. data_management/lila/generate_lila_per_image_labels.py +0 -515
  171. data_management/lila/get_lila_annotation_counts.py +0 -170
  172. data_management/lila/get_lila_image_counts.py +0 -111
  173. data_management/lila/lila_common.py +0 -300
  174. data_management/lila/test_lila_metadata_urls.py +0 -132
  175. data_management/ocr_tools.py +0 -874
  176. data_management/read_exif.py +0 -681
  177. data_management/remap_coco_categories.py +0 -84
  178. data_management/remove_exif.py +0 -66
  179. data_management/resize_coco_dataset.py +0 -189
  180. data_management/wi_download_csv_to_coco.py +0 -246
  181. data_management/yolo_output_to_md_output.py +0 -441
  182. data_management/yolo_to_coco.py +0 -676
  183. detection/__init__.py +0 -0
  184. detection/detector_training/__init__.py +0 -0
  185. detection/detector_training/model_main_tf2.py +0 -114
  186. detection/process_video.py +0 -703
  187. detection/pytorch_detector.py +0 -337
  188. detection/run_detector.py +0 -779
  189. detection/run_detector_batch.py +0 -1219
  190. detection/run_inference_with_yolov5_val.py +0 -917
  191. detection/run_tiled_inference.py +0 -935
  192. detection/tf_detector.py +0 -188
  193. detection/video_utils.py +0 -606
  194. docs/source/conf.py +0 -43
  195. md_utils/__init__.py +0 -0
  196. md_utils/azure_utils.py +0 -174
  197. md_utils/ct_utils.py +0 -612
  198. md_utils/directory_listing.py +0 -246
  199. md_utils/md_tests.py +0 -968
  200. md_utils/path_utils.py +0 -1044
  201. md_utils/process_utils.py +0 -157
  202. md_utils/sas_blob_utils.py +0 -509
  203. md_utils/split_locations_into_train_val.py +0 -228
  204. md_utils/string_utils.py +0 -92
  205. md_utils/url_utils.py +0 -323
  206. md_utils/write_html_image_list.py +0 -225
  207. md_visualization/__init__.py +0 -0
  208. md_visualization/plot_utils.py +0 -293
  209. md_visualization/render_images_with_thumbnails.py +0 -275
  210. md_visualization/visualization_utils.py +0 -1537
  211. md_visualization/visualize_db.py +0 -551
  212. md_visualization/visualize_detector_output.py +0 -406
  213. megadetector-5.0.10.dist-info/RECORD +0 -224
  214. megadetector-5.0.10.dist-info/top_level.txt +0 -8
  215. taxonomy_mapping/__init__.py +0 -0
  216. taxonomy_mapping/map_lila_taxonomy_to_wi_taxonomy.py +0 -491
  217. taxonomy_mapping/map_new_lila_datasets.py +0 -154
  218. taxonomy_mapping/prepare_lila_taxonomy_release.py +0 -142
  219. taxonomy_mapping/preview_lila_taxonomy.py +0 -591
  220. taxonomy_mapping/retrieve_sample_image.py +0 -71
  221. taxonomy_mapping/simple_image_download.py +0 -218
  222. taxonomy_mapping/species_lookup.py +0 -834
  223. taxonomy_mapping/taxonomy_csv_checker.py +0 -159
  224. taxonomy_mapping/taxonomy_graph.py +0 -346
  225. taxonomy_mapping/validate_lila_category_mappings.py +0 -83
  226. {megadetector-5.0.10.dist-info → megadetector-5.0.11.dist-info}/WHEEL +0 -0
@@ -1,294 +0,0 @@
1
- """
2
-
3
- idfg_iwildcam_lila_prep.py
4
-
5
- Adding class labels (from the private test .csv) to the iWildCam 2019 IDFG
6
- test set, in preparation for release on LILA.
7
-
8
- This version works with the public iWildCam release images.
9
-
10
- """
11
-
12
- #%% ############ Take one, from iWildCam .json files ############
13
-
14
- #%% Imports and constants
15
-
16
- import uuid
17
- import json
18
- import os
19
- from tqdm import tqdm
20
-
21
- base_folder = r'h:\iWildCam_2019_IDFG'
22
- input_json = os.path.join(base_folder,'iWildCam_2019_IDFG_info.json')
23
- input_csv = os.path.join(base_folder,'IDFG_eval_public_v_private.csv')
24
- output_json = os.path.join(base_folder,'idaho_camera_traps.json')
25
-
26
- assert os.path.isfile(input_json)
27
- assert os.path.isfile(input_csv)
28
-
29
-
30
- #%% Read input files
31
-
32
- with open(input_json,'r') as f:
33
- input_data = json.load(f)
34
-
35
- with open(input_csv,'r') as f:
36
- private_csv_lines = f.readlines()
37
-
38
- private_csv_lines = [s.strip() for s in private_csv_lines]
39
-
40
- # Remove the header line
41
- assert private_csv_lines[0] == 'Id,Category,Usage'
42
- private_csv_lines = private_csv_lines[1:]
43
-
44
- print('Read {} annotations for {} images'.format(len(private_csv_lines),len(input_data['images'])))
45
-
46
- assert len(private_csv_lines) == len(input_data['images'])
47
- n_images = len(input_data['images'])
48
-
49
-
50
- #%% Parse annotations
51
-
52
- image_id_to_category_ids = {}
53
- for line in tqdm(private_csv_lines):
54
-
55
- # Lines look like:
56
- #
57
- # b005e5b2-2c0b-11e9-bcad-06f1011196c4,1,Private
58
-
59
- tokens = line.split(',')
60
- assert len(tokens) == 3
61
- assert tokens[2] in ['Private','Public']
62
- image_id_to_category_ids[tokens[0]] = int(tokens[1])
63
-
64
- assert len(image_id_to_category_ids) == n_images
65
-
66
-
67
- #%% Minor cleanup re: images
68
-
69
- for im in tqdm(input_data['images']):
70
- image_id = im['id']
71
- im['file_name'] = im['file_name'].replace('iWildCam_IDFG_images/','')
72
- assert isinstance(im['location'],int)
73
- im['location'] = str(im['location'])
74
-
75
-
76
- #%% Create annotations
77
-
78
- annotations = []
79
-
80
- for image_id in tqdm(image_id_to_category_ids):
81
- category_id = image_id_to_category_ids[image_id]
82
- ann = {}
83
- ann['id'] = str(uuid.uuid1())
84
- ann['image_id'] = image_id
85
- ann['category_id'] = category_id
86
- annotations.append(ann)
87
-
88
-
89
- #%% Prepare info
90
-
91
- info = input_data['info']
92
- info['contributor'] = 'Images acquired by the Idaho Department of Fish and Game, dataset curated by Sara Beery'
93
- info['description'] = 'Idaho Camera traps'
94
- info['version'] = '2021.07.19'
95
-
96
-
97
- #%% Minor adjustments to categories
98
-
99
- input_categories = input_data['categories']
100
-
101
- category_id_to_name = {cat['id']:cat['name'] for cat in input_categories}
102
- category_name_to_id = {cat['name']:cat['id'] for cat in input_categories}
103
- assert category_id_to_name[0] == 'empty'
104
-
105
- category_names_to_counts = {}
106
- for category in input_categories:
107
- category_names_to_counts[category['name']] = 0
108
-
109
- for ann in annotations:
110
- category_id = ann['category_id']
111
- category_name = category_id_to_name[category_id]
112
- category_names_to_counts[category_name] = category_names_to_counts[category_name] + 1
113
-
114
- categories = []
115
-
116
- for category_name in category_names_to_counts:
117
- count = category_names_to_counts[category_name]
118
-
119
- # Remove unused categories
120
- if count == 0:
121
- continue
122
-
123
- category_id = category_name_to_id[category_name]
124
-
125
- # Name adjustments
126
- if category_name == 'prongs':
127
- category_name = 'pronghorn'
128
-
129
- categories.append({'id':category_id,'name':category_name})
130
-
131
-
132
- #%% Create output
133
-
134
- output_data = {}
135
- output_data['images'] = input_data['images']
136
- output_data['annotations'] = annotations
137
- output_data['categories'] = categories
138
- output_data['info'] = info
139
-
140
-
141
- #%% Write output
142
-
143
- with open(output_json,'w') as f:
144
- json.dump(output_data,f,indent=2)
145
-
146
-
147
- #%% Validate .json file
148
-
149
- from data_management.databases import integrity_check_json_db
150
-
151
- options = integrity_check_json_db.IntegrityCheckOptions()
152
- options.baseDir = os.path.join(base_folder,'images'); assert os.path.isdir(options.baseDir)
153
- options.bCheckImageSizes = False
154
- options.bCheckImageExistence = False
155
- options.bFindUnusedImages = False
156
-
157
- _, _, _ = integrity_check_json_db.integrity_check_json_db(output_json, options)
158
-
159
-
160
- #%% Preview labels
161
-
162
- from md_visualization import visualize_db
163
-
164
- viz_options = visualize_db.DbVizOptions()
165
- viz_options.num_to_visualize = 100
166
- viz_options.trim_to_images_with_bboxes = False
167
- viz_options.add_search_links = False
168
- viz_options.sort_by_filename = False
169
- viz_options.parallelize_rendering = True
170
- viz_options.include_filename_links = True
171
-
172
- # viz_options.classes_to_exclude = ['test']
173
- html_output_file, _ = visualize_db.visualize_db(db_path=output_json,
174
- output_dir=os.path.join(
175
- base_folder,'preview'),
176
- image_base_dir=os.path.join(base_folder,'images'),
177
- options=viz_options)
178
- os.startfile(html_output_file)
179
-
180
-
181
- #%% ############ Take two, from pre-iWildCam .json files created from IDFG .csv files ############
182
-
183
- #%% Imports and constants
184
-
185
- import json
186
- import os
187
-
188
- base_folder = r'h:\idaho-camera-traps'
189
- input_json_sl = os.path.join(base_folder,'iWildCam_IDFG.json')
190
- input_json = os.path.join(base_folder,'iWildCam_IDFG_ml.json')
191
- output_json = os.path.join(base_folder,'idaho_camera_traps.json')
192
- remote_image_base_dir = r'z:\idfg'
193
-
194
- assert os.path.isfile(input_json)
195
-
196
-
197
- #%% One-time line break addition
198
-
199
- if not os.path.isfile(input_json):
200
-
201
- sl_json = input_json_sl
202
- ml_json = input_json
203
-
204
- with open(sl_json,'r') as f:
205
- d = json.load(f)
206
- with open(ml_json,'w') as f:
207
- json.dump(d,f,indent=2)
208
-
209
-
210
- #%% Read input files
211
-
212
- with open(input_json,'r') as f:
213
- input_data = json.load(f)
214
-
215
- print('Read {} annotations for {} images'.format(len(input_data['annotations']),len(input_data['images'])))
216
-
217
- n_images = len(input_data['images'])
218
-
219
-
220
- #%% Prepare info
221
-
222
- info = {}
223
- info['contributor'] = 'Images acquired by the Idaho Department of Fish and Game, dataset curated by Sara Beery'
224
- info['description'] = 'Idaho Camera traps'
225
- info['version'] = '2021.07.19'
226
-
227
-
228
- #%% Minor adjustments to categories
229
-
230
- input_categories = input_data['categories']
231
- output_categories = []
232
-
233
- for c in input_categories:
234
- category_name = c['name']
235
- category_id = c['id']
236
- if category_name == 'prong':
237
- category_name = 'pronghorn'
238
- category_name = category_name.lower()
239
- output_categories.append({'name':category_name,'id':category_id})
240
-
241
-
242
- #%% Minor adjustments to annotations
243
-
244
- for ann in input_data['annotations']:
245
- ann['id'] = str(ann['id'])
246
-
247
-
248
- #%% Create output
249
-
250
- output_data = {}
251
- output_data['images'] = input_data['images']
252
- output_data['annotations'] = input_data['annotations']
253
- output_data['categories'] = output_categories
254
- output_data['info'] = info
255
-
256
-
257
- #%% Write output
258
-
259
- with open(output_json,'w') as f:
260
- json.dump(output_data,f,indent=2)
261
-
262
-
263
- #%% Validate .json file
264
-
265
- from data_management.databases import integrity_check_json_db
266
-
267
- options = integrity_check_json_db.IntegrityCheckOptions()
268
- options.baseDir = remote_image_base_dir
269
- options.bCheckImageSizes = False
270
- options.bCheckImageExistence = False
271
- options.bFindUnusedImages = False
272
-
273
- _, _, _ = integrity_check_json_db.integrity_check_json_db(output_json, options)
274
-
275
-
276
- #%% Preview labels
277
-
278
- from md_visualization import visualize_db
279
-
280
- viz_options = visualize_db.DbVizOptions()
281
- viz_options.num_to_visualize = 100
282
- viz_options.trim_to_images_with_bboxes = False
283
- viz_options.add_search_links = False
284
- viz_options.sort_by_filename = False
285
- viz_options.parallelize_rendering = True
286
- viz_options.include_filename_links = True
287
-
288
- # viz_options.classes_to_exclude = ['test']
289
- html_output_file, _ = visualize_db.visualize_db(db_path=output_json,
290
- output_dir=os.path.join(
291
- base_folder,'preview'),
292
- image_base_dir=remote_image_base_dir,
293
- options=viz_options)
294
- os.startfile(html_output_file)
@@ -1,150 +0,0 @@
1
- """
2
-
3
- jb_csv_to_json.py
4
-
5
- Convert a particular .csv file to CCT format. Images were not available at
6
- the time I wrote this script, so this is much shorter than other scripts
7
- in this folder.
8
-
9
- """
10
-
11
- #%% Constants and environment
12
-
13
- import pandas as pd
14
- import uuid
15
- import json
16
-
17
- input_metadata_file = r'd:\temp\pre_bounding_box.csv'
18
- output_file = r'd:\temp\pre_bounding_box.json'
19
- filename_col = 'filename'
20
- label_col = 'category'
21
-
22
-
23
- #%% Read source data
24
-
25
- input_metadata = pd.read_csv(input_metadata_file)
26
-
27
- print('Read {} columns and {} rows from metadata file'.format(len(input_metadata.columns),
28
- len(input_metadata)))
29
-
30
-
31
- #%% Confirm filename uniqueness (this data set has one label per image)
32
-
33
- imageFilenames = input_metadata[filename_col]
34
-
35
- duplicateRows = []
36
- filenamesToRows = {}
37
-
38
- # Build up a map from filenames to a list of rows, checking image existence as we go
39
- for iFile,fn in enumerate(imageFilenames):
40
-
41
- if (fn in filenamesToRows):
42
- duplicateRows.append(iFile)
43
- filenamesToRows[fn].append(iFile)
44
- else:
45
- filenamesToRows[fn] = [iFile]
46
-
47
- assert(len(duplicateRows) == 0)
48
-
49
-
50
- #%% Create CCT dictionaries
51
-
52
- images = []
53
- annotations = []
54
-
55
- # Map categories to integer IDs (that's what COCO likes)
56
- nextCategoryID = 1
57
- categories = []
58
- categoryNamesToCategories = {}
59
-
60
- cat = {}
61
- cat['name'] = 'empty'
62
- cat['id'] = 0
63
- categories.append(cat)
64
- categoryNamesToCategories['empty'] = cat
65
-
66
- # For each image
67
- #
68
- # Because in practice images are 1:1 with annotations in this data set,
69
- # this is also a loop over annotations.
70
-
71
- # imageName = imageFilenames[0]
72
- for imageName in imageFilenames:
73
-
74
- rows = filenamesToRows[imageName]
75
-
76
- # As per above, this is convenient and appears to be true; asserting to be safe
77
- assert(len(rows) == 1)
78
- iRow = rows[0]
79
-
80
- row = input_metadata.iloc[iRow]
81
-
82
- im = {}
83
- # Filenames look like "290716114012001a1116.jpg"
84
- im['id'] = imageName.split('.')[0]
85
- im['file_name'] = imageName
86
- im['seq_id'] = '-1'
87
-
88
- images.append(im)
89
-
90
- categoryName = row[label_col].lower()
91
-
92
- # Have we seen this category before?
93
- if categoryName in categoryNamesToCategories:
94
- categoryID = categoryNamesToCategories[categoryName]['id']
95
- else:
96
- cat = {}
97
- categoryID = nextCategoryID
98
- cat['name'] = categoryName
99
- cat['id'] = nextCategoryID
100
- categories.append(cat)
101
- categoryNamesToCategories[categoryName] = cat
102
- nextCategoryID += 1
103
-
104
- # Create an annotation
105
- ann = {}
106
-
107
- # The Internet tells me this guarantees uniqueness to a reasonable extent, even
108
- # beyond the sheer improbability of collisions.
109
- ann['id'] = str(uuid.uuid1())
110
- ann['image_id'] = im['id']
111
- ann['category_id'] = categoryID
112
-
113
- annotations.append(ann)
114
-
115
- # ...for each image
116
-
117
- print('Finished creating dictionaries')
118
-
119
-
120
- #%% Create info struct
121
-
122
- info = {}
123
- info['year'] = 2019
124
- info['version'] = 1
125
- info['description'] = 'COCO style database'
126
- info['secondary_contributor'] = 'Converted to COCO .json by Dan Morris'
127
- info['contributor'] = ''
128
-
129
-
130
- #%% Write output
131
-
132
- json_data = {}
133
- json_data['images'] = images
134
- json_data['annotations'] = annotations
135
- json_data['categories'] = categories
136
- json_data['info'] = info
137
- json.dump(json_data, open(output_file,'w'), indent=4)
138
-
139
- print('Finished writing .json file with {} images, {} annotations, and {} categories'.format(
140
- len(images),len(annotations),len(categories)))
141
-
142
-
143
- #%% Validate
144
-
145
- from data_management.databases import integrity_check_json_db
146
-
147
- options = integrity_check_json_db.IntegrityCheckOptions()
148
- sortedCategories,data = integrity_check_json_db.integrity_check_json_db(output_file, options)
149
-
150
-
@@ -1,250 +0,0 @@
1
- """
2
-
3
- mcgill_to_json.py
4
-
5
- Convert the .csv file provided for the McGill test data set to a
6
- COCO-camera-traps .json file
7
-
8
- """
9
-
10
- #%% Constants and environment
11
-
12
- import pandas as pd
13
- import os
14
- import glob
15
- import json
16
- import uuid
17
- import time
18
- import ntpath
19
- import humanfriendly
20
- import PIL
21
- import math
22
-
23
- baseDir = r'D:\wildlife_data\mcgill_test'
24
- input_metadata_file = os.path.join(baseDir, 'dan_500_photos_metadata.csv')
25
- output_file = os.path.join(baseDir, 'mcgill_test.json')
26
- image_directory = baseDir
27
-
28
- assert(os.path.isdir(image_directory))
29
- assert(os.path.isfile(input_metadata_file))
30
-
31
-
32
- #%% Read source data
33
-
34
- input_metadata = pd.read_csv(input_metadata_file)
35
-
36
- print('Read {} columns and {} rows from metadata file'.format(len(input_metadata.columns),
37
- len(input_metadata)))
38
-
39
-
40
- #%% Map filenames to rows, verify image existence
41
-
42
- # Create an additional column for concatenated filenames
43
- input_metadata['relative_path'] = ''
44
- input_metadata['full_path'] = ''
45
-
46
- startTime = time.time()
47
-
48
- # Maps relative filenames to rows
49
- filenamesToRows = {}
50
-
51
- duplicateRows = []
52
-
53
- # Build up a map from filenames to a list of rows, checking image existence as we go
54
- # row = input_metadata.iloc[0]
55
- for iFile,row in input_metadata.iterrows():
56
-
57
- relativePath = os.path.join(row['site'],row['date_range'],str(row['camera']),
58
- str(row['folder']),row['filename'])
59
- fullPath = os.path.join(baseDir,relativePath)
60
-
61
- if (relativePath in filenamesToRows):
62
- duplicateRows.append(iFile)
63
- filenamesToRows[relativePath].append(iFile)
64
- else:
65
- filenamesToRows[relativePath] = [iFile]
66
- assert(os.path.isfile(fullPath))
67
-
68
- row['relative_path'] = relativePath
69
- row['full_path'] = fullPath
70
-
71
- input_metadata.iloc[iFile] = row
72
-
73
- elapsed = time.time() - startTime
74
- print('Finished verifying image existence in {}, found {} filenames with multiple labels'.format(
75
- humanfriendly.format_timespan(elapsed),len(duplicateRows)))
76
-
77
- # I didn't expect this to be true a priori, but it appears to be true, and
78
- # it saves us the trouble of checking consistency across multiple occurrences
79
- # of an image.
80
- assert(len(duplicateRows) == 0)
81
-
82
-
83
- #%% Check for images that aren't included in the metadata file
84
-
85
- # Enumerate all images
86
- imageFullPaths = glob.glob(os.path.join(image_directory,'**/*.JPG'), recursive=True)
87
-
88
- for iImage,imagePath in enumerate(imageFullPaths):
89
-
90
- imageRelPath = ntpath.relpath(imagePath, image_directory)
91
- assert(imageRelPath in filenamesToRows)
92
-
93
- print('Finished checking {} images to make sure they\'re in the metadata'.format(
94
- len(imageFullPaths)))
95
-
96
-
97
- #%% Create CCT dictionaries
98
-
99
- # Also gets image sizes, so this takes ~6 minutes
100
- #
101
- # Implicitly checks images for overt corruptness, i.e. by not crashing.
102
-
103
- images = []
104
- annotations = []
105
- categories = []
106
-
107
- emptyCategory = {}
108
- emptyCategory['id'] = 0
109
- emptyCategory['name'] = 'empty'
110
- emptyCategory['latin'] = 'empty'
111
- emptyCategory['count'] = 0
112
- categories.append(emptyCategory)
113
-
114
- # Map categories to integer IDs (that's what COCO likes)
115
- nextCategoryID = 1
116
- labelToCategory = {'empty':emptyCategory}
117
-
118
- # For each image
119
- #
120
- # Because in practice images are 1:1 with annotations in this data set,
121
- # this is also a loop over annotations.
122
-
123
- startTime = time.time()
124
-
125
- # row = input_metadata.iloc[0]
126
- for iFile,row in input_metadata.iterrows():
127
-
128
- relPath = row['relative_path'].replace('\\','/')
129
- im = {}
130
- # Filenames look like "290716114012001a1116.jpg"
131
- im['id'] = relPath.replace('/','_').replace(' ','_')
132
-
133
- im['file_name'] = relPath
134
-
135
- im['seq_id'] = -1
136
- im['frame_num'] = -1
137
-
138
- # In the form "001a"
139
- im['site']= row['site']
140
-
141
- # Can be in the form '111' or 's46'
142
- im['camera'] = row['camera']
143
-
144
- # In the form "7/29/2016 11:40"
145
- im['datetime'] = row['timestamp']
146
-
147
- otherFields = ['motion','temp_F','n_present','n_waterhole','n_contact','notes']
148
-
149
- for s in otherFields:
150
- im[s] = row[s]
151
-
152
- # Check image height and width
153
- fullPath = row['full_path']
154
- assert(os.path.isfile(fullPath))
155
- pilImage = PIL.Image.open(fullPath)
156
- width, height = pilImage.size
157
- im['width'] = width
158
- im['height'] = height
159
-
160
- images.append(im)
161
-
162
- label = row['species']
163
- if not isinstance(label,str):
164
- # NaN is the only thing we should see that's not a string
165
- assert math.isnan(label)
166
- label = 'empty'
167
- else:
168
- label = label.lower()
169
-
170
- latin = row['binomial']
171
- if not isinstance(latin,str):
172
- # NaN is the only thing we should see that's not a string
173
- assert math.isnan(latin)
174
- latin = 'empty'
175
- else:
176
- latin = latin.lower()
177
-
178
- if label == 'empty':
179
- if latin != 'empty':
180
- latin = 'empty'
181
-
182
- if label == 'unknown':
183
- if latin != 'unknown':
184
- latin = 'unknown'
185
-
186
- if label not in labelToCategory:
187
- print('Adding category {} ({})'.format(label,latin))
188
- category = {}
189
- categoryID = nextCategoryID
190
- category['id'] = categoryID
191
- nextCategoryID += 1
192
- category['name'] = label
193
- category['latin'] = latin
194
- category['count'] = 1
195
- labelToCategory[label] = category
196
- categories.append(category)
197
- else:
198
- category = labelToCategory[label]
199
- category['count'] = category['count'] + 1
200
- categoryID = category['id']
201
-
202
- # Create an annotation
203
- ann = {}
204
-
205
- # The Internet tells me this guarantees uniqueness to a reasonable extent, even
206
- # beyond the sheer improbability of collisions.
207
- ann['id'] = str(uuid.uuid1())
208
- ann['image_id'] = im['id']
209
- ann['category_id'] = categoryID
210
-
211
- annotations.append(ann)
212
-
213
- # ...for each image
214
-
215
- # Convert categories to a CCT-style dictionary
216
-
217
-
218
- for category in categories:
219
- print('Category {}, count {}'.format(category['name'],category['count']))
220
-
221
- elapsed = time.time() - startTime
222
- print('Finished creating CCT dictionaries in {}'.format(
223
- humanfriendly.format_timespan(elapsed)))
224
-
225
-
226
- #%% Create info struct
227
-
228
- info = {}
229
- info['year'] = 2019
230
- info['version'] = 1
231
- info['description'] = 'COCO style database'
232
- info['secondary_contributor'] = 'Converted to COCO .json by Dan Morris'
233
- info['contributor'] = 'McGill University'
234
-
235
-
236
- #%% Write output
237
-
238
- json_data = {}
239
- json_data['images'] = images
240
- json_data['annotations'] = annotations
241
- json_data['categories'] = categories
242
- json_data['info'] = info
243
- json.dump(json_data, open(output_file,'w'), indent=4)
244
-
245
- print('Finished writing .json file with {} images, {} annotations, and {} categories'.format(
246
- len(images),len(annotations),len(categories)))
247
-
248
-
249
-
250
-