PyPI - megadetector - Versions diffs - 5.0.9__py3-none-any.whl → 5.0.11__py3-none-any.whl - Mend

megadetector 5.0.9-py3-none-any.whl → 5.0.11-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of megadetector might be problematic. Click here for more details.

Files changed (226) hide show

{megadetector-5.0.9.dist-info → megadetector-5.0.11.dist-info}/LICENSE +0 -0
{megadetector-5.0.9.dist-info → megadetector-5.0.11.dist-info}/METADATA +12 -11
megadetector-5.0.11.dist-info/RECORD +5 -0
megadetector-5.0.11.dist-info/top_level.txt +1 -0
api/__init__.py +0 -0
api/batch_processing/__init__.py +0 -0
api/batch_processing/api_core/__init__.py +0 -0
api/batch_processing/api_core/batch_service/__init__.py +0 -0
api/batch_processing/api_core/batch_service/score.py +0 -439
api/batch_processing/api_core/server.py +0 -294
api/batch_processing/api_core/server_api_config.py +0 -98
api/batch_processing/api_core/server_app_config.py +0 -55
api/batch_processing/api_core/server_batch_job_manager.py +0 -220
api/batch_processing/api_core/server_job_status_table.py +0 -152
api/batch_processing/api_core/server_orchestration.py +0 -360
api/batch_processing/api_core/server_utils.py +0 -92
api/batch_processing/api_core_support/__init__.py +0 -0
api/batch_processing/api_core_support/aggregate_results_manually.py +0 -46
api/batch_processing/api_support/__init__.py +0 -0
api/batch_processing/api_support/summarize_daily_activity.py +0 -152
api/batch_processing/data_preparation/__init__.py +0 -0
api/batch_processing/data_preparation/manage_local_batch.py +0 -2391
api/batch_processing/data_preparation/manage_video_batch.py +0 -327
api/batch_processing/integration/digiKam/setup.py +0 -6
api/batch_processing/integration/digiKam/xmp_integration.py +0 -465
api/batch_processing/integration/eMammal/test_scripts/config_template.py +0 -5
api/batch_processing/integration/eMammal/test_scripts/push_annotations_to_emammal.py +0 -126
api/batch_processing/integration/eMammal/test_scripts/select_images_for_testing.py +0 -55
api/batch_processing/postprocessing/__init__.py +0 -0
api/batch_processing/postprocessing/add_max_conf.py +0 -64
api/batch_processing/postprocessing/categorize_detections_by_size.py +0 -163
api/batch_processing/postprocessing/combine_api_outputs.py +0 -249
api/batch_processing/postprocessing/compare_batch_results.py +0 -958
api/batch_processing/postprocessing/convert_output_format.py +0 -397
api/batch_processing/postprocessing/load_api_results.py +0 -195
api/batch_processing/postprocessing/md_to_coco.py +0 -310
api/batch_processing/postprocessing/md_to_labelme.py +0 -330
api/batch_processing/postprocessing/merge_detections.py +0 -401
api/batch_processing/postprocessing/postprocess_batch_results.py +0 -1904
api/batch_processing/postprocessing/remap_detection_categories.py +0 -170
api/batch_processing/postprocessing/render_detection_confusion_matrix.py +0 -661
api/batch_processing/postprocessing/repeat_detection_elimination/find_repeat_detections.py +0 -211
api/batch_processing/postprocessing/repeat_detection_elimination/remove_repeat_detections.py +0 -82
api/batch_processing/postprocessing/repeat_detection_elimination/repeat_detections_core.py +0 -1631
api/batch_processing/postprocessing/separate_detections_into_folders.py +0 -731
api/batch_processing/postprocessing/subset_json_detector_output.py +0 -696
api/batch_processing/postprocessing/top_folders_to_bottom.py +0 -223
api/synchronous/__init__.py +0 -0
api/synchronous/api_core/animal_detection_api/__init__.py +0 -0
api/synchronous/api_core/animal_detection_api/api_backend.py +0 -152
api/synchronous/api_core/animal_detection_api/api_frontend.py +0 -266
api/synchronous/api_core/animal_detection_api/config.py +0 -35
api/synchronous/api_core/animal_detection_api/data_management/annotations/annotation_constants.py +0 -47
api/synchronous/api_core/animal_detection_api/detection/detector_training/copy_checkpoints.py +0 -43
api/synchronous/api_core/animal_detection_api/detection/detector_training/model_main_tf2.py +0 -114
api/synchronous/api_core/animal_detection_api/detection/process_video.py +0 -543
api/synchronous/api_core/animal_detection_api/detection/pytorch_detector.py +0 -304
api/synchronous/api_core/animal_detection_api/detection/run_detector.py +0 -627
api/synchronous/api_core/animal_detection_api/detection/run_detector_batch.py +0 -1029
api/synchronous/api_core/animal_detection_api/detection/run_inference_with_yolov5_val.py +0 -581
api/synchronous/api_core/animal_detection_api/detection/run_tiled_inference.py +0 -754
api/synchronous/api_core/animal_detection_api/detection/tf_detector.py +0 -165
api/synchronous/api_core/animal_detection_api/detection/video_utils.py +0 -495
api/synchronous/api_core/animal_detection_api/md_utils/azure_utils.py +0 -174
api/synchronous/api_core/animal_detection_api/md_utils/ct_utils.py +0 -262
api/synchronous/api_core/animal_detection_api/md_utils/directory_listing.py +0 -251
api/synchronous/api_core/animal_detection_api/md_utils/matlab_porting_tools.py +0 -97
api/synchronous/api_core/animal_detection_api/md_utils/path_utils.py +0 -416
api/synchronous/api_core/animal_detection_api/md_utils/process_utils.py +0 -110
api/synchronous/api_core/animal_detection_api/md_utils/sas_blob_utils.py +0 -509
api/synchronous/api_core/animal_detection_api/md_utils/string_utils.py +0 -59
api/synchronous/api_core/animal_detection_api/md_utils/url_utils.py +0 -144
api/synchronous/api_core/animal_detection_api/md_utils/write_html_image_list.py +0 -226
api/synchronous/api_core/animal_detection_api/md_visualization/visualization_utils.py +0 -841
api/synchronous/api_core/tests/__init__.py +0 -0
api/synchronous/api_core/tests/load_test.py +0 -110
classification/__init__.py +0 -0
classification/aggregate_classifier_probs.py +0 -108
classification/analyze_failed_images.py +0 -227
classification/cache_batchapi_outputs.py +0 -198
classification/create_classification_dataset.py +0 -627
classification/crop_detections.py +0 -516
classification/csv_to_json.py +0 -226
classification/detect_and_crop.py +0 -855
classification/efficientnet/__init__.py +0 -9
classification/efficientnet/model.py +0 -415
classification/efficientnet/utils.py +0 -610
classification/evaluate_model.py +0 -520
classification/identify_mislabeled_candidates.py +0 -152
classification/json_to_azcopy_list.py +0 -63
classification/json_validator.py +0 -695
classification/map_classification_categories.py +0 -276
classification/merge_classification_detection_output.py +0 -506
classification/prepare_classification_script.py +0 -194
classification/prepare_classification_script_mc.py +0 -228
classification/run_classifier.py +0 -286
classification/save_mislabeled.py +0 -110
classification/train_classifier.py +0 -825
classification/train_classifier_tf.py +0 -724
classification/train_utils.py +0 -322
data_management/__init__.py +0 -0
data_management/annotations/__init__.py +0 -0
data_management/annotations/annotation_constants.py +0 -34
data_management/camtrap_dp_to_coco.py +0 -238
data_management/cct_json_utils.py +0 -395
data_management/cct_to_md.py +0 -176
data_management/cct_to_wi.py +0 -289
data_management/coco_to_labelme.py +0 -272
data_management/coco_to_yolo.py +0 -662
data_management/databases/__init__.py +0 -0
data_management/databases/add_width_and_height_to_db.py +0 -33
data_management/databases/combine_coco_camera_traps_files.py +0 -206
data_management/databases/integrity_check_json_db.py +0 -477
data_management/databases/subset_json_db.py +0 -115
data_management/generate_crops_from_cct.py +0 -149
data_management/get_image_sizes.py +0 -188
data_management/importers/add_nacti_sizes.py +0 -52
data_management/importers/add_timestamps_to_icct.py +0 -79
data_management/importers/animl_results_to_md_results.py +0 -158
data_management/importers/auckland_doc_test_to_json.py +0 -372
data_management/importers/auckland_doc_to_json.py +0 -200
data_management/importers/awc_to_json.py +0 -189
data_management/importers/bellevue_to_json.py +0 -273
data_management/importers/cacophony-thermal-importer.py +0 -796
data_management/importers/carrizo_shrubfree_2018.py +0 -268
data_management/importers/carrizo_trail_cam_2017.py +0 -287
data_management/importers/cct_field_adjustments.py +0 -57
data_management/importers/channel_islands_to_cct.py +0 -913
data_management/importers/eMammal/copy_and_unzip_emammal.py +0 -180
data_management/importers/eMammal/eMammal_helpers.py +0 -249
data_management/importers/eMammal/make_eMammal_json.py +0 -223
data_management/importers/ena24_to_json.py +0 -275
data_management/importers/filenames_to_json.py +0 -385
data_management/importers/helena_to_cct.py +0 -282
data_management/importers/idaho-camera-traps.py +0 -1407
data_management/importers/idfg_iwildcam_lila_prep.py +0 -294
data_management/importers/jb_csv_to_json.py +0 -150
data_management/importers/mcgill_to_json.py +0 -250
data_management/importers/missouri_to_json.py +0 -489
data_management/importers/nacti_fieldname_adjustments.py +0 -79
data_management/importers/noaa_seals_2019.py +0 -181
data_management/importers/pc_to_json.py +0 -365
data_management/importers/plot_wni_giraffes.py +0 -123
data_management/importers/prepare-noaa-fish-data-for-lila.py +0 -359
data_management/importers/prepare_zsl_imerit.py +0 -131
data_management/importers/rspb_to_json.py +0 -356
data_management/importers/save_the_elephants_survey_A.py +0 -320
data_management/importers/save_the_elephants_survey_B.py +0 -332
data_management/importers/snapshot_safari_importer.py +0 -758
data_management/importers/snapshot_safari_importer_reprise.py +0 -665
data_management/importers/snapshot_serengeti_lila.py +0 -1067
data_management/importers/snapshotserengeti/make_full_SS_json.py +0 -150
data_management/importers/snapshotserengeti/make_per_season_SS_json.py +0 -153
data_management/importers/sulross_get_exif.py +0 -65
data_management/importers/timelapse_csv_set_to_json.py +0 -490
data_management/importers/ubc_to_json.py +0 -399
data_management/importers/umn_to_json.py +0 -507
data_management/importers/wellington_to_json.py +0 -263
data_management/importers/wi_to_json.py +0 -441
data_management/importers/zamba_results_to_md_results.py +0 -181
data_management/labelme_to_coco.py +0 -548
data_management/labelme_to_yolo.py +0 -272
data_management/lila/__init__.py +0 -0
data_management/lila/add_locations_to_island_camera_traps.py +0 -97
data_management/lila/add_locations_to_nacti.py +0 -147
data_management/lila/create_lila_blank_set.py +0 -557
data_management/lila/create_lila_test_set.py +0 -151
data_management/lila/create_links_to_md_results_files.py +0 -106
data_management/lila/download_lila_subset.py +0 -177
data_management/lila/generate_lila_per_image_labels.py +0 -515
data_management/lila/get_lila_annotation_counts.py +0 -170
data_management/lila/get_lila_image_counts.py +0 -111
data_management/lila/lila_common.py +0 -300
data_management/lila/test_lila_metadata_urls.py +0 -132
data_management/ocr_tools.py +0 -874
data_management/read_exif.py +0 -681
data_management/remap_coco_categories.py +0 -84
data_management/remove_exif.py +0 -66
data_management/resize_coco_dataset.py +0 -189
data_management/wi_download_csv_to_coco.py +0 -246
data_management/yolo_output_to_md_output.py +0 -441
data_management/yolo_to_coco.py +0 -676
detection/__init__.py +0 -0
detection/detector_training/__init__.py +0 -0
detection/detector_training/model_main_tf2.py +0 -114
detection/process_video.py +0 -703
detection/pytorch_detector.py +0 -337
detection/run_detector.py +0 -779
detection/run_detector_batch.py +0 -1219
detection/run_inference_with_yolov5_val.py +0 -917
detection/run_tiled_inference.py +0 -935
detection/tf_detector.py +0 -188
detection/video_utils.py +0 -606
docs/source/conf.py +0 -43
md_utils/__init__.py +0 -0
md_utils/azure_utils.py +0 -174
md_utils/ct_utils.py +0 -612
md_utils/directory_listing.py +0 -246
md_utils/md_tests.py +0 -968
md_utils/path_utils.py +0 -1044
md_utils/process_utils.py +0 -157
md_utils/sas_blob_utils.py +0 -509
md_utils/split_locations_into_train_val.py +0 -228
md_utils/string_utils.py +0 -92
md_utils/url_utils.py +0 -323
md_utils/write_html_image_list.py +0 -225
md_visualization/__init__.py +0 -0
md_visualization/plot_utils.py +0 -293
md_visualization/render_images_with_thumbnails.py +0 -275
md_visualization/visualization_utils.py +0 -1537
md_visualization/visualize_db.py +0 -551
md_visualization/visualize_detector_output.py +0 -406
megadetector-5.0.9.dist-info/RECORD +0 -224
megadetector-5.0.9.dist-info/top_level.txt +0 -8
taxonomy_mapping/__init__.py +0 -0
taxonomy_mapping/map_lila_taxonomy_to_wi_taxonomy.py +0 -491
taxonomy_mapping/map_new_lila_datasets.py +0 -154
taxonomy_mapping/prepare_lila_taxonomy_release.py +0 -142
taxonomy_mapping/preview_lila_taxonomy.py +0 -591
taxonomy_mapping/retrieve_sample_image.py +0 -71
taxonomy_mapping/simple_image_download.py +0 -218
taxonomy_mapping/species_lookup.py +0 -834
taxonomy_mapping/taxonomy_csv_checker.py +0 -159
taxonomy_mapping/taxonomy_graph.py +0 -346
taxonomy_mapping/validate_lila_category_mappings.py +0 -83
{megadetector-5.0.9.dist-info → megadetector-5.0.11.dist-info}/WHEEL +0 -0

data_management/importers/cacophony-thermal-importer.py DELETED Viewed

@@ -1,796 +0,0 @@
-"""
- cacophony-thermal-importer.py
- Create data and metadata for LILA from the Cacophony thermal dataset.  Takes a folder
- of HDF files, and produces .json metadata, along with compressed/normalized videos for
- each HDF file.
- Source format notes for this dataset:
- https://docs.google.com/document/d/12sw5JtwdMf9MiXuNCBcvhvZ04Jwa1TH2Lf6LnJmF8Bk/edit
-"""
-#%% Imports and constants
-import os
-import h5py
-import numpy as np
-import json
-from tqdm import tqdm
-from copy import deepcopy
-from collections import defaultdict
-from multiprocessing.pool import Pool
-import zipfile
-from zipfile import ZipFile
-import cv2
-from md_utils.ct_utils import truncate_float
-from md_utils import path_utils
## Input and output locations

# Folder containing the source HDF files
base_dir = '/bigdata/home/sftp/cacophony-ferraro_/data/cacophony-thermal/'

# Everything this script writes goes under output_base
output_base = os.path.expanduser('~/tmp/new-zealand-wildlife-thermal-imaging')
main_metadata_filename = 'new-zealand-wildlife-thermal-imaging.json'

video_output_folder = os.path.join(output_base,'videos')
os.makedirs(video_output_folder,exist_ok=True)

individual_metadata_output_folder = os.path.join(output_base,'individual-metadata')
os.makedirs(individual_metadata_output_folder,exist_ok=True)


## Expected structure of each HDF file

# Every HDF file specifies a crop rectangle within which the pixels are trustworthy;
# in practice this is the same across all files.
expected_crop_rectangle = [1,1,159,119]

# Required attributes for each video
expected_clip_attributes = [
    'clip_id', 'crop_rectangle', 'ffc_frames', 'frame_temp_max',
    'frame_temp_mean', 'frame_temp_median', 'frame_temp_min', 'max_temp',
    'mean_temp', 'min_temp', 'num_frames', 'res_x', 'res_y', 'start_time',
    'station_id'
]

# Attributes that may or may not be present for each video
optional_clip_attributes = ['temp_thresh','model']

# Required attributes for each track
expected_track_attributes = ['end_frame', 'id', 'start_frame']

# Attributes that may or may not be present for each track
optional_track_attributes = [
    'human_tag', 'human_tag_confidence', 'human_tags',
    'human_tags_confidence', 'ai_tag', 'ai_tag_confidence'
]


## Label handling

labels_to_ignore_when_another_label_is_present = [
    'false-positive','unidentified','part','poor tracking'
]

# Standardize a few tag names
tag_mappings = {
    'bird/kiwi':'bird',
    'allbirds':'bird',
    'not identifiable':'unidentified',
    'part':'unidentified',
    'pest':'unidentified'
}

# Number of decimal digits kept when writing tag confidence values
confidence_digits = 3

# Discard tracks and labels that are below this confidence threshold.
confidence_threshold = 0.001


## Video encoding

frame_rate = 9
use_default_filtering = False
write_as_color = False

# Alternatives that have been tried: 'ffv1', 'hfyu'
codec = 'h264'
codec_to_extension = {'mp4v':'.mp4','ffv1':'.avi','hfyu':'.avi','h264':'.mp4'}
overwrite_video = True


## Execution options

# Set to >0 to process only a subset of clips
debug_n = -1
n_workers = 16
-#%% Support functions
def remove_tracking_points(clip_metadata):
    """
    As a debugging convenience, take the metadata for a clip (after conversion to
    the output format) and remove the only field that makes it hard to read in a
    console (the track coordinates).

    Args:
        clip_metadata: dict of clip metadata; if it has a 'tracks' key, that value
            is a list of per-track dicts.

    Returns:
        A deep copy of [clip_metadata] in which no track has a 'points' key.  The
        input is not modified.
    """

    slim_metadata = deepcopy(clip_metadata)

    # Clips that failed to load have no 'tracks' key at all
    for track in slim_metadata.get('tracks',[]):
        # pop() rather than del, so tracks that never had points (or metadata that
        # has already been slimmed) don't raise a KeyError
        track.pop('points',None)

    return slim_metadata
def norm_image(image,vmin=None,vmax=None,do_normalization=True,stack_channels=True):
    """
    Normalize an MxN 2D numpy ndarray (uint16 or float32) into the range 0,255.

    Args:
        image: 2D ndarray of dtype uint16 or float32
        vmin: input value that maps to 0; must be given together with [vmax].  If
            both are None, the image's own min and max are used.
        vmax: input value that maps to 255; must be greater than [vmin]
        do_normalization: if False, skip rescaling and just convert to uint8
        stack_channels: if True, return an MxNx3 array (content is replicated across
            all three channels); otherwise return MxNx1

    Returns:
        uint8 ndarray of shape MxNx3 or MxNx1.  Values that fall outside 0,255 after
        scaling are clipped rather than wrapped.  An image with no dynamic range
        (max == min) maps to all zeros.
    """

    # vmin and vmax only make sense as a pair
    if vmin is not None:
        assert vmax is not None
        assert vmax > vmin
    if vmax is not None:
        assert vmin is not None

    assert isinstance(image,np.ndarray)
    assert len(image.shape) == 2

    # Check the array dtype directly, so this doesn't depend on indexing the first pixel
    assert image.dtype.type in (np.uint16,np.float32), \
        'First pixel is of type {}'.format(image.dtype.type)

    norm = np.float32(image)

    if do_normalization:

        if vmin is None:
            vmin = np.amin(image)
            vmax = np.amax(image)

        value_range = vmax - vmin

        if value_range > 0:
            norm = 255 * (norm - vmin) / value_range
        else:
            # Constant image: avoid dividing by zero
            norm = np.zeros_like(norm)

    # Casting out-of-range floats to uint8 wraps around (or is undefined), so clip first
    norm = np.clip(norm,0,255).astype(np.uint8)

    norm = norm[:, :, np.newaxis]
    if stack_channels:
        norm = np.repeat(norm, 3, axis=2)

    return norm
-#%% Enumerate files
# List everything under base_dir, then keep just the HDF5 files, as paths relative
# to base_dir
all_files = path_utils.recursive_file_list(base_dir)

all_hdf_files_relative = [
    os.path.relpath(file_path,base_dir)
    for file_path in all_files
    if file_path.lower().endswith('.hdf5')
]

n_hdf_files = len(all_hdf_files_relative)
n_total_files = len(all_files)
print('Found {} HDF files (of {} total files)'.format(n_hdf_files,n_total_files))
-#%% Process one file
def _parse_track(track,res_x,res_y):
    """
    Validate one human-tagged HDF track group and convert it to the output format.

    Args:
        track: HDF group for a single track.  Must have a 'regions' dataset, every
            attribute in expected_track_attributes, and the 'human_tags' and
            'human_tags_confidence' attributes.
        res_x: clip width in pixels, used to sanity-check box coordinates
        res_y: clip height in pixels, used to sanity-check box coordinates

    Returns:
        (track_info,human_tags), where track_info is a dict with the keys
        'start_frame', 'end_frame', 'tags', and 'points', and human_tags is the list
        of raw tag strings attached to this track.
    """

    attrs = track.attrs

    for s in expected_track_attributes:
        assert s in attrs

    # 'human_tags' is all the tags that were assigned to this track by humans
    # 'human_tags_confidence' is the confidence for each of those assignments
    #
    # If there is a clear "winner", 'human_tag' and 'human_tag_confidence' will
    # identify the clear winner.
    if 'human_tag' in attrs:
        assert 'human_tags' in attrs
        assert 'human_tag_confidence' in attrs
    assert 'human_tags_confidence' in attrs

    human_tags = list(attrs.get('human_tags'))
    human_tag_confidences = list(attrs.get('human_tags_confidence'))
    assert len(human_tag_confidences) == len(human_tags)

    track_tags = []
    for tag,conf in zip(human_tags,human_tag_confidences):
        assert isinstance(tag,str)
        tag_info = {}
        tag_info['label'] = tag
        tag_info['confidence'] = truncate_float(float(conf),confidence_digits)
        track_tags.append(tag_info)

    # These are not always integers in the source data
    start_frame = attrs.get('start_frame')
    end_frame = attrs.get('end_frame')

    track_info = {}
    track_info['start_frame'] = int(round(start_frame))
    track_info['end_frame'] = int(round(end_frame))
    track_info['tags'] = track_tags

    # A list of x/y/frame tuples
    track_info['points'] = []

    # Positions is an N x 7 matrix in which each row looks like:
    #
    # [left,top,right,bottom,frame_number,mass,blank_frame]
    #
    # The origin appears to be in the upper-left.
    #
    # "blank_frame" indicates that the tracked object is not visible in this frame,
    # but was predicted from previous frames.
    #
    # Read the whole dataset once, rather than going back to the file for every row.
    positions = np.array(track['regions'])
    assert positions.shape[1] == 7

    # The number of items in the positions array should be equal to the length of the
    # track, but this can be off by a little when 'start_frame' and/or 'end_frame' are
    # not integers.  Make sure this is approximately true.
    track_length_error = abs(positions.shape[0] - (1 + (end_frame - start_frame)))
    assert track_length_error < 2

    for i_position,position in enumerate(positions):

        left = float(position[0])
        top = float(position[1])
        right = float(position[2])
        bottom = float(position[3])
        frame_number = int(position[4])

        # TODO: these coordinates don't reflect the pixels cropped out of the border.
        # This is OK for this dataset, because this is just an approximate set of
        # coordinates used to disambiguate simultaneous areas of movement when
        # multiple different labels are present in the same video.
        position_info = [left+float((right-left)/2),
                         top+float((bottom-top)/2),
                         int(frame_number)]
        track_info['points'].append(position_info)

        # In a small number of tracks, boxes are turned upside-down or left-over-right,
        # we don't bother checking for coordinate validity in those tracks.
        if left <= right:
            assert left >= 0 and left < res_x
            assert right >= 0 and right < res_x
        if top <= bottom:
            assert top >= 0 and top < res_y
            assert bottom >= 0 and bottom < res_y

        # frame_number should be approximately equal to i_position + start_frame, but
        # this can be off by a little when 'start_frame' and/or 'end_frame' are not
        # integers.  Make sure this is approximately true.
        frame_number_error = abs(frame_number - (i_position + start_frame))
        assert frame_number_error <= 2

    # ...for each position in this track

    return track_info,human_tags


def _write_video(video_fn,video_frames,video_w,video_h):
    """
    Encode a list of uint8 frames to [video_fn], using the module-level codec, frame
    rate, and color setting.
    """

    video_out = cv2.VideoWriter(video_fn, cv2.VideoWriter_fourcc(*codec), frame_rate,
                                (video_w, video_h), isColor=write_as_color)
    try:
        for video_frame in video_frames:
            video_out.write(video_frame)
    finally:
        # Release the writer even if a frame fails to encode
        video_out.release()


def process_file(fn_relative,verbose=False):
    """
    Read the HDF file, convert to video files with/without filtering, and return
    a metadata dict for this file.

    Args:
        fn_relative: path of the HDF file, relative to base_dir.  The part of the
            basename before the first '.' must be the integer clip ID.
        verbose: if True, print additional diagnostic messages

    Returns:
        Metadata dict for this clip, which is also written as .json to
        individual_metadata_output_folder.  If the HDF file can't be opened, the dict
        contains only 'hdf_filename', 'id', and a non-None 'error'.

    Raises:
        AssertionError: if the file's structure doesn't match what this script
            expects, including a clip with no human-tagged tracks.
    """

    fn_abs = os.path.join(base_dir,fn_relative)
    clip_id = int(os.path.basename(fn_relative).split('.')[0])
    metadata_fn = os.path.join(individual_metadata_output_folder,str(clip_id) + '_metadata.json')

    clip_metadata = {}
    clip_metadata['hdf_filename'] = os.path.basename(fn_relative)
    clip_metadata['id'] = clip_id
    clip_metadata['error'] = None

    try:
        h5f = h5py.File(fn_abs, 'r')
    except Exception as e:
        # An unreadable file is recorded rather than raised, so one bad file doesn't
        # stop the whole batch
        print('Could not open file {}: {}'.format(
            fn_relative,str(e)))
        clip_metadata['error'] = str(e)
        with open(metadata_fn,'w') as f:
            json.dump(clip_metadata,f,indent=1)
        return clip_metadata


    ## Read and validate everything we need, then close the HDF file

    with h5f:

        clip_attrs = h5f.attrs

        for s in expected_clip_attributes:
            assert s in clip_attrs

        assert clip_id == int(clip_attrs.get('clip_id'))
        assert os.path.basename(fn_relative).startswith(str(clip_id))

        station_id = clip_attrs.get('station_id')
        assert isinstance(station_id,np.int64)
        station_id = int(station_id)

        crop_rectangle = clip_attrs.get('crop_rectangle')
        assert len(crop_rectangle) == 4
        for coord,expected_coord in zip(crop_rectangle,expected_crop_rectangle):
            assert coord == expected_coord
        crop_left,crop_top,crop_right,crop_bottom = [int(c) for c in crop_rectangle]

        frames = h5f['frames']
        assert 'thermals' in frames

        # This is an HDF dataset of size n_frames,y,x
        thermal_frames = frames['thermals']
        assert len(thermal_frames.shape) == 3
        n_frames = thermal_frames.shape[0]

        # If present, this is an HDF dataset of size y,x
        background_frame_present = ('background' in frames)
        if background_frame_present:
            background_frame = frames['background']
            assert len(background_frame.shape) == 2
            assert background_frame.shape[0] == thermal_frames.shape[1]
            assert background_frame.shape[1] == thermal_frames.shape[2]

        ffc_frames = clip_attrs.get('ffc_frames').tolist()
        if len(ffc_frames) > 0:
            assert max(ffc_frames) < n_frames

        res_x = clip_attrs.get('res_x')
        res_y = clip_attrs.get('res_y')
        assert clip_attrs.get('num_frames') == n_frames
        assert res_x == thermal_frames.shape[2]
        assert res_y == thermal_frames.shape[1]
        assert clip_attrs.get('model') in [None,'lepton3.5','lepton3']

        tracks = h5f['tracks']

        # List of dicts
        tracks_this_clip = []

        # Every human tag on every track in this clip.  This is initialized before
        # the loop so that a clip with no tagged tracks fails the assertion below,
        # rather than raising a NameError.
        human_tags_this_clip = []

        for track_id in tracks.keys():

            track = tracks[track_id]

            # Only tracks that were tagged by a human are kept
            if 'human_tags' not in track.attrs:
                continue

            track_info,human_tags_this_track = _parse_track(track,res_x,res_y)
            human_tags_this_clip.extend(human_tags_this_track)
            tracks_this_clip.append(track_info)

        # ...for each track ID

        assert len(human_tags_this_clip) > 0, \
            'No human tags in {}'.format(fn_relative)

        # Pull the pixel data into memory once, cropped to the trustworthy region
        frames_array = np.array(thermal_frames)
        frames_array = frames_array[:,crop_top:crop_bottom,crop_left:crop_right]

        if background_frame_present:
            background = background_frame[crop_top:crop_bottom,crop_left:crop_right]
        else:
            # No background frame in the file: fall back to the first frame
            background = frames_array[0]

    # ...with the HDF file open

    clip_metadata['tracks'] = tracks_this_clip

    if verbose and (len(ffc_frames) > 0):
        n_ffc_frames = len(ffc_frames)
        if (n_ffc_frames / n_frames) > 0.2:
            print('Warning: in video {}, {} of {} frames are FFC frames (tags: {})'.format(
                fn_relative,n_ffc_frames,n_frames,str(human_tags_this_clip)))


    ## Choose a background for filtering

    if (background_frame_present or use_default_filtering):
        background_for_filtering = background
    else:
        if verbose:
            print('No background present: using median values for background')
        # Per-pixel median over all frames; only computed when it's actually needed
        background_for_filtering = np.float32(np.median(frames_array,0))

    # Find the largest value by which any pixel in this video exceeds the background
    #
    # (...which we may use for normalization)
    max_pixel_diff = 0
    for cropped_frame in frames_array:
        max_pixel_diff_this_frame = \
            np.amax(np.float32(cropped_frame) - background_for_filtering)
        if max_pixel_diff_this_frame > max_pixel_diff:
            max_pixel_diff = max_pixel_diff_this_frame

    # If nothing ever exceeds the background, every filtered frame is all zeros; use
    # a nominal range so normalization is still well-defined (norm_image requires
    # vmax > vmin).
    if max_pixel_diff <= 0:
        max_pixel_diff = 1


    ## Filter and normalize each frame

    filtered_frames = []
    original_frames = []

    for cropped_frame in frames_array:

        # Subtract the background frame
        filtered_frame = np.float32(cropped_frame) - background_for_filtering

        # Assume that nothing can be cooler than the background
        filtered_frame[filtered_frame < 0] = 0

        # Normalize filtered frame (and convert to three channels if requested)
        if use_default_filtering:
            filtered_frame = norm_image(filtered_frame,stack_channels=write_as_color)
        else:
            filtered_frame = norm_image(filtered_frame,vmin=0,vmax=max_pixel_diff,stack_channels=write_as_color)

        # Normalize original frame (and convert to three channels if requested)
        original_frame = norm_image(cropped_frame,stack_channels=write_as_color)

        filtered_frames.append(filtered_frame)
        original_frames.append(original_frame)

    # ...for each frame

    # filtered_frames[0].shape[1] is 158, clip_attrs.get('res_x') is 160, ergo shape is h,w
    video_w = filtered_frames[0].shape[1]
    video_h = filtered_frames[0].shape[0]

    clip_metadata['width'] = video_w
    clip_metadata['height'] = video_h
    clip_metadata['frame_rate'] = frame_rate


    ## Write videos

    filtered_video_fn = os.path.join(video_output_folder,str(clip_id) + '_filtered' + codec_to_extension[codec])
    unfiltered_video_fn = os.path.join(video_output_folder,str(clip_id) + codec_to_extension[codec])

    if overwrite_video or (not os.path.isfile(filtered_video_fn)):
        _write_video(filtered_video_fn,filtered_frames,video_w,video_h)

    if overwrite_video or (not os.path.isfile(unfiltered_video_fn)):
        _write_video(unfiltered_video_fn,original_frames,video_w,video_h)


    ## Do some cleanup of tracks and track labels

    valid_tracks = []

    for track_info in clip_metadata['tracks']:

        valid_tags = []

        for tag in track_info['tags']:

            # Replace some tags with standardized names (e.g. map "allbirds" to "bird")
            if tag['label'] in tag_mappings:
                tag['label'] = tag_mappings[tag['label']]

            # Discard tags below the minimum confidence
            if tag['confidence'] >= confidence_threshold:
                valid_tags.append(tag)
            else:
                # TODO
                print('Zero-confidence tag in {}'.format(fn_relative))

        track_info['tags'] = valid_tags

        # Don't keep any tracks that had no tags above the minimum confidence
        if len(valid_tags) > 0:
            valid_tracks.append(track_info)
        else:
            # TODO
            print('Invalid track in {}'.format(fn_relative))

    # ...for each track

    if (len(clip_metadata['tracks']) > 0) and (len(valid_tracks) == 0):
        # TODO
        print('Removed all tracks from {}'.format(fn_relative))

    clip_metadata['tracks'] = valid_tracks

    # Build up the list of labels for this clip
    labels_this_clip = set()
    for track_info in clip_metadata['tracks']:
        for tag in track_info['tags']:
            labels_this_clip.add(tag['label'])
    clip_metadata['labels'] = sorted(labels_this_clip)


    ## Write metadata

    clip_metadata['video_filename'] = os.path.basename(unfiltered_video_fn)
    clip_metadata['filtered_video_filename'] = os.path.basename(filtered_video_fn)
    clip_metadata['location'] = station_id
    clip_metadata['calibration_frames'] = ffc_frames
    clip_metadata['metadata_filename'] = os.path.basename(metadata_fn)

    with open(metadata_fn,'w') as f:
        json.dump(clip_metadata,f,indent=1)

    return clip_metadata
-# ...process_file(...)
-#%% Process files
-n_workers = 16
-if debug_n > 0:
-    files_to_process = all_hdf_files_relative[0:debug_n]
-else:
-    files_to_process = all_hdf_files_relative
-if n_workers <= 1:
-    all_clip_metadata = []
-    for i_file,fn_relative in tqdm(enumerate(files_to_process),total=len(files_to_process)):
-        clip_metadata = process_file(fn_relative)
-        all_clip_metadata.append(clip_metadata)
-else:
-    pool = Pool(n_workers)
-    all_clip_metadata = list(tqdm(pool.imap(process_file,files_to_process),
-                                  total=len(files_to_process)))
-#%% Postprocessing
-failed_file_to_error = {}
-label_to_video_count = defaultdict(int)
-# clip_metadata = all_clip_metadata[0]
-for clip_metadata in all_clip_metadata:
-    if clip_metadata['error'] is not None:
-        failed_file_to_error[clip_metadata['hdf_filename']] = clip_metadata['error']
-        continue
-    labels_this_clip = set()
-    # track_info = clip_metadata['tracks'][0]
-    for track_info in clip_metadata['tracks']:
-        for tag in track_info['tags']:
-            tag_label = tag['label']
-            labels_this_clip.add(tag_label)
-    for label in labels_this_clip:
-        label_to_video_count[label] += 1
-# ...for each clip
-label_to_video_count = {k: v for k, v in sorted(label_to_video_count.items(),
-                                                key=lambda item: item[1], reverse=True)}
-print('Failed to open {} of {} files'.format(
-    len(failed_file_to_error),len(all_hdf_files_relative)))
-print('Labels:\n')
-for label in label_to_video_count:
-    print('{}: {}'.format(label,label_to_video_count[label]))
-#%% Write count .csv
-count_csv_file_name = os.path.join(output_base,'new-zealand-wildlife-thermal-imaging-counts.csv')
-with open(count_csv_file_name,'w') as f:
-    f.write('label,count\n')
-    for label in label_to_video_count:
-        f.write('{},{}\n'.format(label,label_to_video_count[label]))
-#%% Build and zip the main .json file
-main_metadata_filename_abs = os.path.join(output_base,main_metadata_filename)
-info = {}
-info['version'] = '1.0.0'
-info['description'] = 'New Zealand Thermal Wildlife Imaging'
-info['contributor'] = 'Cacophony Project'
-main_metadata = {}
-main_metadata['info'] = info
-main_metadata['clips'] = []
-# clip_metadata = all_clip_metadata[0]
-for clip_metadata in tqdm(all_clip_metadata):
-    slim_metadata = remove_tracking_points(clip_metadata)
-    if 'tracks' in slim_metadata:
-        for track in slim_metadata['tracks']:
-            for tag in track['tags']:
-                tag['confidence'] = truncate_float(tag['confidence'],confidence_digits)
-    main_metadata['clips'].append(slim_metadata)
-with open(main_metadata_filename_abs,'w') as f:
-    json.dump(main_metadata,f,indent=1)
-zip_file_name = main_metadata_filename_abs.replace('.json','-metadata.json.zip')
-with ZipFile(zip_file_name,'w',zipfile.ZIP_DEFLATED) as zipf:
-    zipf.write(main_metadata_filename_abs,
-               arcname=os.path.basename(main_metadata_filename_abs),
-               compresslevel=9,compress_type=zipfile.ZIP_DEFLATED)
-#%% Create a zipfile containing videos, main metadata, and individual metadata
-zip_file_name = os.path.join(output_base,'new-zealand-wildlife-thermal-imaging.zip')
-all_files = path_utils.recursive_file_list(output_base)
-all_files_relative = [os.path.relpath(fn,output_base) for fn in all_files]
-all_files_to_zip_relative = [fn for fn in all_files_relative if \
-                             (\
-                              ('individual-metadata/' in fn) or \
-                              ('videos/' in fn) or \
-                              (fn.endswith('.json'))
-                             )]
-print('Zipping {} files (of {} total files)'.format(len(all_files_to_zip_relative),len(all_files)))
-with ZipFile(zip_file_name,'w',zipfile.ZIP_DEFLATED) as zipf:
-    for fn_relative in tqdm(all_files_to_zip_relative):
-        fn_abs = os.path.join(output_base,fn_relative)
-        if fn_abs.endswith('.mp4'):
-            zipf.write(fn_abs,arcname=fn_relative,compresslevel=0,compress_type=zipfile.ZIP_STORED)
-        else:
-            zipf.write(fn_abs,arcname=fn_relative,compresslevel=9,compress_type=zipfile.ZIP_DEFLATED)
-#%% Scrap
-# Scratch cells.  The "if False:" guard means nothing below executes when the file
-# is run top to bottom; presumably each "#%%" cell is meant to be run by hand in an
-# IDE.  The cells rely on names created by earlier cells (all_hdf_files_relative,
-# all_clip_metadata, output_base, base_dir, ...).
-if False:
-    pass
-    #%% Process one file
-    # Run process_file() on the first file whose relative path contains '450281'.
-    # i_file = 110680; fn_relative = all_hdf_files_relative[i_file]
-    # i_file = 8; fn_relative = all_hdf_files_relative[i_file]
-    fn_relative = [fn for fn in all_hdf_files_relative if '450281' in fn][0]
-    clip_metadata = process_file(fn_relative)
-    #%% Move individual metadata files
-    # Move every file under base_dir whose path contains '_metadata.json' into a single
-    # flat folder.  Only the base name is kept, so same-named files from different
-    # subfolders would land on the same target path.
-    source_folder = base_dir
-    target_folder = os.path.expanduser('~/tmp/cacophony-thermal-out-individual-metadata')
-    assert os.path.isdir(source_folder) and os.path.isdir(target_folder)
-    from md_utils import path_utils
-    all_files = path_utils.recursive_file_list(source_folder)
-    files_to_move = [fn for fn in all_files if '_metadata.json' in fn]
-    print('Moving {} of {} files'.format(len(files_to_move),len(all_files)))
-    import shutil
-    # source_fn = files_to_move[0]
-    for source_fn in tqdm(files_to_move):
-        target_fn = os.path.join(target_folder,os.path.basename(source_fn))
-        shutil.move(source_fn,target_fn)
-    #%% Choose a random video with a particular label
-    # Collect the error-free clips that carry target_label on at least one tag, then
-    # open the filtered video of one of them, chosen at random.
-    target_label = 'pukeko'
-    target_clips = []
-    for clip_metadata in all_clip_metadata:
-        if clip_metadata['error'] is not None:
-            continue
-        labels_this_clip = set()
-        # track_info = clip_metadata['tracks'][0]
-        for track_info in clip_metadata['tracks']:
-            for tag in track_info['tags']:
-                tag_label = tag['label']
-                labels_this_clip.add(tag_label)
-        if target_label in labels_this_clip:
-            target_clips.append(clip_metadata)
-    print('Found {} matches'.format(len(target_clips)))
-    import random
-    # random.choice() raises IndexError if no clip matched target_label
-    selected_clip = random.choice(target_clips)
-    filtered_video_filename = selected_clip['filtered_video_filename']
-    video_filename = selected_clip['video_filename']
-    from md_utils.path_utils import open_file
-    # open_file(os.path.join(output_base,video_filename))
-    open_file(os.path.join(output_base,filtered_video_filename))
-    # import clipboard; clipboard.copy(os.path.join(output_base,video_filename))
-    #%% Look for clips with multiple different labels
-    # Print every error-free clip that has more than one distinct label, not counting
-    # the labels listed in labels_to_ignore_when_another_label_is_present.
-    for i_clip,clip_metadata in enumerate(all_clip_metadata):
-        if clip_metadata['error'] is not None:
-            continue
-        labels_this_clip = set()
-        # track_info = clip_metadata['tracks'][0]
-        for track_info in clip_metadata['tracks']:
-            for tag in track_info['tags']:
-                tag_label = tag['label']
-                if tag_label not in labels_to_ignore_when_another_label_is_present:
-                    labels_this_clip.add(tag_label)
-        # Sanity check: stops the cell at the first clip with more than three such labels
-        assert len(labels_this_clip) <= 3
-        if len(labels_this_clip) > 1:
-            print('Clip {} has {} labels: {}'.format(
-                i_clip,len(labels_this_clip),str(labels_this_clip)))
-        # remove_tracking_points(clip_metadata)
-    #%% Add the .json filename to each clip in all_clip_metadata
-    # Derive the metadata filename from the HDF filename by swapping '.hdf5' for
-    # '_metadata.json'; this only updates the in-memory dicts.
-    for i_clip,clip_metadata in tqdm(enumerate(all_clip_metadata),
-                                     total=len(all_clip_metadata)):
-        clip_metadata['metadata_filename'] = clip_metadata['hdf_filename'].replace('.hdf5',
-                                                                                     '_metadata.json')
-    #%% Add a "labels" field to each .json file
-    # This was only necessary during debugging; this is added in the main loop now.
-    # Recompute the sorted label list for every error-free clip and overwrite that
-    # clip's existing per-clip .json file with the updated dict.
-    for i_clip,clip_metadata in tqdm(enumerate(all_clip_metadata),
-                                     total=len(all_clip_metadata)):
-        if clip_metadata['error'] is not None:
-            continue
-        labels_this_clip = set()
-        # track_info = clip_metadata['tracks'][0]
-        for track_info in clip_metadata['tracks']:
-            for tag in track_info['tags']:
-                tag_label = tag['label']
-                # if tag_label not in labels_to_ignore_when_another_label_is_present:
-                if True:
-                    labels_this_clip.add(tag_label)
-        clip_metadata['labels'] = sorted(list(labels_this_clip))
-        # NOTE(review): this relies on clip_metadata['id'] being populated and on the
-        # per-clip .json living directly under output_base; confirm both still match
-        # what process_file() writes before re-running this cell.
-        json_filename = os.path.join(output_base,str(clip_metadata['id']) + '_metadata.json')
-        assert os.path.isfile(json_filename)
-        with open(json_filename,'w') as f:
-            json.dump(clip_metadata,f,indent=1)

megadetector 5.0.9__py3-none-any.whl → 5.0.11__py3-none-any.whl

Potentially problematic release.

megadetector 5.0.9__py3-none-any.whl → 5.0.11__py3-none-any.whl