PyPI - megadetector - Versions diffs - 5.0.10__py3-none-any.whl → 5.0.11__py3-none-any.whl - Mend

megadetector 5.0.10__py3-none-any.whl → 5.0.11__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

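This version of megadetector might be problematic. (The linked details were not captured with this page. Note that in the file list below, no file outside the dist-info directory gains any lines in 5.0.11; every other entry shows only removals.)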

Files changed (226)

{megadetector-5.0.10.dist-info → megadetector-5.0.11.dist-info}/LICENSE +0 -0
{megadetector-5.0.10.dist-info → megadetector-5.0.11.dist-info}/METADATA +12 -11
megadetector-5.0.11.dist-info/RECORD +5 -0
megadetector-5.0.11.dist-info/top_level.txt +1 -0
api/__init__.py +0 -0
api/batch_processing/__init__.py +0 -0
api/batch_processing/api_core/__init__.py +0 -0
api/batch_processing/api_core/batch_service/__init__.py +0 -0
api/batch_processing/api_core/batch_service/score.py +0 -439
api/batch_processing/api_core/server.py +0 -294
api/batch_processing/api_core/server_api_config.py +0 -98
api/batch_processing/api_core/server_app_config.py +0 -55
api/batch_processing/api_core/server_batch_job_manager.py +0 -220
api/batch_processing/api_core/server_job_status_table.py +0 -152
api/batch_processing/api_core/server_orchestration.py +0 -360
api/batch_processing/api_core/server_utils.py +0 -92
api/batch_processing/api_core_support/__init__.py +0 -0
api/batch_processing/api_core_support/aggregate_results_manually.py +0 -46
api/batch_processing/api_support/__init__.py +0 -0
api/batch_processing/api_support/summarize_daily_activity.py +0 -152
api/batch_processing/data_preparation/__init__.py +0 -0
api/batch_processing/data_preparation/manage_local_batch.py +0 -2391
api/batch_processing/data_preparation/manage_video_batch.py +0 -327
api/batch_processing/integration/digiKam/setup.py +0 -6
api/batch_processing/integration/digiKam/xmp_integration.py +0 -465
api/batch_processing/integration/eMammal/test_scripts/config_template.py +0 -5
api/batch_processing/integration/eMammal/test_scripts/push_annotations_to_emammal.py +0 -126
api/batch_processing/integration/eMammal/test_scripts/select_images_for_testing.py +0 -55
api/batch_processing/postprocessing/__init__.py +0 -0
api/batch_processing/postprocessing/add_max_conf.py +0 -64
api/batch_processing/postprocessing/categorize_detections_by_size.py +0 -163
api/batch_processing/postprocessing/combine_api_outputs.py +0 -249
api/batch_processing/postprocessing/compare_batch_results.py +0 -958
api/batch_processing/postprocessing/convert_output_format.py +0 -397
api/batch_processing/postprocessing/load_api_results.py +0 -195
api/batch_processing/postprocessing/md_to_coco.py +0 -310
api/batch_processing/postprocessing/md_to_labelme.py +0 -330
api/batch_processing/postprocessing/merge_detections.py +0 -401
api/batch_processing/postprocessing/postprocess_batch_results.py +0 -1904
api/batch_processing/postprocessing/remap_detection_categories.py +0 -170
api/batch_processing/postprocessing/render_detection_confusion_matrix.py +0 -661
api/batch_processing/postprocessing/repeat_detection_elimination/find_repeat_detections.py +0 -211
api/batch_processing/postprocessing/repeat_detection_elimination/remove_repeat_detections.py +0 -82
api/batch_processing/postprocessing/repeat_detection_elimination/repeat_detections_core.py +0 -1631
api/batch_processing/postprocessing/separate_detections_into_folders.py +0 -731
api/batch_processing/postprocessing/subset_json_detector_output.py +0 -696
api/batch_processing/postprocessing/top_folders_to_bottom.py +0 -223
api/synchronous/__init__.py +0 -0
api/synchronous/api_core/animal_detection_api/__init__.py +0 -0
api/synchronous/api_core/animal_detection_api/api_backend.py +0 -152
api/synchronous/api_core/animal_detection_api/api_frontend.py +0 -266
api/synchronous/api_core/animal_detection_api/config.py +0 -35
api/synchronous/api_core/animal_detection_api/data_management/annotations/annotation_constants.py +0 -47
api/synchronous/api_core/animal_detection_api/detection/detector_training/copy_checkpoints.py +0 -43
api/synchronous/api_core/animal_detection_api/detection/detector_training/model_main_tf2.py +0 -114
api/synchronous/api_core/animal_detection_api/detection/process_video.py +0 -543
api/synchronous/api_core/animal_detection_api/detection/pytorch_detector.py +0 -304
api/synchronous/api_core/animal_detection_api/detection/run_detector.py +0 -627
api/synchronous/api_core/animal_detection_api/detection/run_detector_batch.py +0 -1029
api/synchronous/api_core/animal_detection_api/detection/run_inference_with_yolov5_val.py +0 -581
api/synchronous/api_core/animal_detection_api/detection/run_tiled_inference.py +0 -754
api/synchronous/api_core/animal_detection_api/detection/tf_detector.py +0 -165
api/synchronous/api_core/animal_detection_api/detection/video_utils.py +0 -495
api/synchronous/api_core/animal_detection_api/md_utils/azure_utils.py +0 -174
api/synchronous/api_core/animal_detection_api/md_utils/ct_utils.py +0 -262
api/synchronous/api_core/animal_detection_api/md_utils/directory_listing.py +0 -251
api/synchronous/api_core/animal_detection_api/md_utils/matlab_porting_tools.py +0 -97
api/synchronous/api_core/animal_detection_api/md_utils/path_utils.py +0 -416
api/synchronous/api_core/animal_detection_api/md_utils/process_utils.py +0 -110
api/synchronous/api_core/animal_detection_api/md_utils/sas_blob_utils.py +0 -509
api/synchronous/api_core/animal_detection_api/md_utils/string_utils.py +0 -59
api/synchronous/api_core/animal_detection_api/md_utils/url_utils.py +0 -144
api/synchronous/api_core/animal_detection_api/md_utils/write_html_image_list.py +0 -226
api/synchronous/api_core/animal_detection_api/md_visualization/visualization_utils.py +0 -841
api/synchronous/api_core/tests/__init__.py +0 -0
api/synchronous/api_core/tests/load_test.py +0 -110
classification/__init__.py +0 -0
classification/aggregate_classifier_probs.py +0 -108
classification/analyze_failed_images.py +0 -227
classification/cache_batchapi_outputs.py +0 -198
classification/create_classification_dataset.py +0 -627
classification/crop_detections.py +0 -516
classification/csv_to_json.py +0 -226
classification/detect_and_crop.py +0 -855
classification/efficientnet/__init__.py +0 -9
classification/efficientnet/model.py +0 -415
classification/efficientnet/utils.py +0 -610
classification/evaluate_model.py +0 -520
classification/identify_mislabeled_candidates.py +0 -152
classification/json_to_azcopy_list.py +0 -63
classification/json_validator.py +0 -695
classification/map_classification_categories.py +0 -276
classification/merge_classification_detection_output.py +0 -506
classification/prepare_classification_script.py +0 -194
classification/prepare_classification_script_mc.py +0 -228
classification/run_classifier.py +0 -286
classification/save_mislabeled.py +0 -110
classification/train_classifier.py +0 -825
classification/train_classifier_tf.py +0 -724
classification/train_utils.py +0 -322
data_management/__init__.py +0 -0
data_management/annotations/__init__.py +0 -0
data_management/annotations/annotation_constants.py +0 -34
data_management/camtrap_dp_to_coco.py +0 -238
data_management/cct_json_utils.py +0 -395
data_management/cct_to_md.py +0 -176
data_management/cct_to_wi.py +0 -289
data_management/coco_to_labelme.py +0 -272
data_management/coco_to_yolo.py +0 -662
data_management/databases/__init__.py +0 -0
data_management/databases/add_width_and_height_to_db.py +0 -33
data_management/databases/combine_coco_camera_traps_files.py +0 -206
data_management/databases/integrity_check_json_db.py +0 -477
data_management/databases/subset_json_db.py +0 -115
data_management/generate_crops_from_cct.py +0 -149
data_management/get_image_sizes.py +0 -188
data_management/importers/add_nacti_sizes.py +0 -52
data_management/importers/add_timestamps_to_icct.py +0 -79
data_management/importers/animl_results_to_md_results.py +0 -158
data_management/importers/auckland_doc_test_to_json.py +0 -372
data_management/importers/auckland_doc_to_json.py +0 -200
data_management/importers/awc_to_json.py +0 -189
data_management/importers/bellevue_to_json.py +0 -273
data_management/importers/cacophony-thermal-importer.py +0 -796
data_management/importers/carrizo_shrubfree_2018.py +0 -268
data_management/importers/carrizo_trail_cam_2017.py +0 -287
data_management/importers/cct_field_adjustments.py +0 -57
data_management/importers/channel_islands_to_cct.py +0 -913
data_management/importers/eMammal/copy_and_unzip_emammal.py +0 -180
data_management/importers/eMammal/eMammal_helpers.py +0 -249
data_management/importers/eMammal/make_eMammal_json.py +0 -223
data_management/importers/ena24_to_json.py +0 -275
data_management/importers/filenames_to_json.py +0 -385
data_management/importers/helena_to_cct.py +0 -282
data_management/importers/idaho-camera-traps.py +0 -1407
data_management/importers/idfg_iwildcam_lila_prep.py +0 -294
data_management/importers/jb_csv_to_json.py +0 -150
data_management/importers/mcgill_to_json.py +0 -250
data_management/importers/missouri_to_json.py +0 -489
data_management/importers/nacti_fieldname_adjustments.py +0 -79
data_management/importers/noaa_seals_2019.py +0 -181
data_management/importers/pc_to_json.py +0 -365
data_management/importers/plot_wni_giraffes.py +0 -123
data_management/importers/prepare-noaa-fish-data-for-lila.py +0 -359
data_management/importers/prepare_zsl_imerit.py +0 -131
data_management/importers/rspb_to_json.py +0 -356
data_management/importers/save_the_elephants_survey_A.py +0 -320
data_management/importers/save_the_elephants_survey_B.py +0 -332
data_management/importers/snapshot_safari_importer.py +0 -758
data_management/importers/snapshot_safari_importer_reprise.py +0 -665
data_management/importers/snapshot_serengeti_lila.py +0 -1067
data_management/importers/snapshotserengeti/make_full_SS_json.py +0 -150
data_management/importers/snapshotserengeti/make_per_season_SS_json.py +0 -153
data_management/importers/sulross_get_exif.py +0 -65
data_management/importers/timelapse_csv_set_to_json.py +0 -490
data_management/importers/ubc_to_json.py +0 -399
data_management/importers/umn_to_json.py +0 -507
data_management/importers/wellington_to_json.py +0 -263
data_management/importers/wi_to_json.py +0 -441
data_management/importers/zamba_results_to_md_results.py +0 -181
data_management/labelme_to_coco.py +0 -548
data_management/labelme_to_yolo.py +0 -272
data_management/lila/__init__.py +0 -0
data_management/lila/add_locations_to_island_camera_traps.py +0 -97
data_management/lila/add_locations_to_nacti.py +0 -147
data_management/lila/create_lila_blank_set.py +0 -557
data_management/lila/create_lila_test_set.py +0 -151
data_management/lila/create_links_to_md_results_files.py +0 -106
data_management/lila/download_lila_subset.py +0 -177
data_management/lila/generate_lila_per_image_labels.py +0 -515
data_management/lila/get_lila_annotation_counts.py +0 -170
data_management/lila/get_lila_image_counts.py +0 -111
data_management/lila/lila_common.py +0 -300
data_management/lila/test_lila_metadata_urls.py +0 -132
data_management/ocr_tools.py +0 -874
data_management/read_exif.py +0 -681
data_management/remap_coco_categories.py +0 -84
data_management/remove_exif.py +0 -66
data_management/resize_coco_dataset.py +0 -189
data_management/wi_download_csv_to_coco.py +0 -246
data_management/yolo_output_to_md_output.py +0 -441
data_management/yolo_to_coco.py +0 -676
detection/__init__.py +0 -0
detection/detector_training/__init__.py +0 -0
detection/detector_training/model_main_tf2.py +0 -114
detection/process_video.py +0 -703
detection/pytorch_detector.py +0 -337
detection/run_detector.py +0 -779
detection/run_detector_batch.py +0 -1219
detection/run_inference_with_yolov5_val.py +0 -917
detection/run_tiled_inference.py +0 -935
detection/tf_detector.py +0 -188
detection/video_utils.py +0 -606
docs/source/conf.py +0 -43
md_utils/__init__.py +0 -0
md_utils/azure_utils.py +0 -174
md_utils/ct_utils.py +0 -612
md_utils/directory_listing.py +0 -246
md_utils/md_tests.py +0 -968
md_utils/path_utils.py +0 -1044
md_utils/process_utils.py +0 -157
md_utils/sas_blob_utils.py +0 -509
md_utils/split_locations_into_train_val.py +0 -228
md_utils/string_utils.py +0 -92
md_utils/url_utils.py +0 -323
md_utils/write_html_image_list.py +0 -225
md_visualization/__init__.py +0 -0
md_visualization/plot_utils.py +0 -293
md_visualization/render_images_with_thumbnails.py +0 -275
md_visualization/visualization_utils.py +0 -1537
md_visualization/visualize_db.py +0 -551
md_visualization/visualize_detector_output.py +0 -406
megadetector-5.0.10.dist-info/RECORD +0 -224
megadetector-5.0.10.dist-info/top_level.txt +0 -8
taxonomy_mapping/__init__.py +0 -0
taxonomy_mapping/map_lila_taxonomy_to_wi_taxonomy.py +0 -491
taxonomy_mapping/map_new_lila_datasets.py +0 -154
taxonomy_mapping/prepare_lila_taxonomy_release.py +0 -142
taxonomy_mapping/preview_lila_taxonomy.py +0 -591
taxonomy_mapping/retrieve_sample_image.py +0 -71
taxonomy_mapping/simple_image_download.py +0 -218
taxonomy_mapping/species_lookup.py +0 -834
taxonomy_mapping/taxonomy_csv_checker.py +0 -159
taxonomy_mapping/taxonomy_graph.py +0 -346
taxonomy_mapping/validate_lila_category_mappings.py +0 -83
{megadetector-5.0.10.dist-info → megadetector-5.0.11.dist-info}/WHEEL +0 -0

api/batch_processing/postprocessing/convert_output_format.py DELETED

@@ -1,397 +0,0 @@
-"""
-convert_output_format.py
-Converts between file formats output by our batch processing API.  Currently
-supports json <--> csv conversion, but this should be the landing place for any
-conversion - including between hypothetical alternative .json versions - that we support
-in the future.
-The .csv format is largely obsolete, don't use it unless you're super-duper sure you need it.
-"""
-#%% Constants and imports
-import argparse
-import json
-import csv
-import sys
-import os
-from tqdm import tqdm
-from api.batch_processing.postprocessing.load_api_results import load_api_results_csv
-from data_management.annotations import annotation_constants
-from md_utils import ct_utils
-CONF_DIGITS = 3
-#%% Conversion functions
-def convert_json_to_csv(input_path,output_path=None,min_confidence=None,
-                        omit_bounding_boxes=False,output_encoding=None,
-                        overwrite=True):
-    """
-    Converts a MD results .json file to a totally non-standard .csv format.
-    If [output_path] is None, will convert x.json to x.csv.
-    TODO: this function should obviously be using Pandas or some other sensible structured
-    representation of tabular data.  Even a list of dicts.  This implementation is quite
-    brittle and depends on adding fields to every row in exactly the right order.
-    Args:
-        input_path (str): the input .json file to convert
-        output_path (str, optional): the output .csv file to generate; if this is None, uses
-            [input_path].csv
-        min_confidence (float, optional): the minimum-confidence detection we should include
-            in the "detections" column; has no impact on the other columns
-        omit_bounding_boxes (bool): whether to leave out the json-formatted bounding boxes
-            that make up the "detections" column, which are not generally useful for someone who
-            wants to consume this data as a .csv file
-        output_encoding (str, optional): encoding to use for the .csv file
-        overwrite (bool): whether to overwrite an existing .csv file; if this is False and the
-            output file exists, no-ops and returns
-    """
-    if output_path is None:
-        output_path = os.path.splitext(input_path)[0]+'.csv'
-    if os.path.isfile(output_path) and (not overwrite):
-        print('File {} exists, skipping json --> csv conversion'.format(output_path))
-        return
-    print('Loading json results from {}...'.format(input_path))
-    json_output = json.load(open(input_path))
-    rows = []
-    fixed_columns = ['image_path', 'max_confidence', 'detections']
-    # We add an output column for each class other than 'empty',
-    # containing the maximum probability of  that class for each image
-    # n_non_empty_detection_categories = len(annotation_constants.annotation_bbox_categories) - 1
-    n_non_empty_detection_categories = annotation_constants.NUM_DETECTOR_CATEGORIES
-    detection_category_column_names = []
-    assert annotation_constants.detector_bbox_categories[0] == 'empty'
-    for cat_id in range(1,n_non_empty_detection_categories+1):
-        cat_name = annotation_constants.detector_bbox_categories[cat_id]
-        detection_category_column_names.append('max_conf_' + cat_name)
-    n_classification_categories = 0
-    if 'classification_categories' in json_output.keys():
-        classification_category_id_to_name = json_output['classification_categories']
-        classification_category_ids = list(classification_category_id_to_name.keys())
-        classification_category_id_to_column_number = {}
-        classification_category_column_names = []
-        for i_category,category_id in enumerate(classification_category_ids):
-            category_name = classification_category_id_to_name[category_id].\
-                replace(' ','_').replace(',','')
-            classification_category_column_names.append('max_classification_conf_' + category_name)
-            classification_category_id_to_column_number[category_id] = i_category
-        n_classification_categories = len(classification_category_ids)
-    # There are several .json fields for which we add .csv columns; other random bespoke fields
-    # will be ignored.
-    optional_fields = ['width','height','datetime','exif_metadata']
-    optional_fields_present = set()
-    # Iterate once over the data to check for optional fields
-    print('Looking for optional fields...')
-    for im in tqdm(json_output['images']):
-        # Which optional fields are present for this image?
-        for k in im.keys():
-            if k in optional_fields:
-                optional_fields_present.add(k)
-    optional_fields_present = sorted(list(optional_fields_present))
-    if len(optional_fields_present) > 0:
-        print('Found {} optional fields'.format(len(optional_fields_present)))
-    expected_row_length = len(fixed_columns) + len(detection_category_column_names) + \
-        n_classification_categories + len(optional_fields_present)
-    print('Formatting results...')
-    # i_image = 0; im = json_output['images'][i_image]
-    for im in tqdm(json_output['images']):
-        image_id = im['file']
-        if 'failure' in im and im['failure'] is not None:
-            row = [image_id, 'failure', im['failure']]
-            rows.append(row)
-            # print('Skipping failed image {} ({})'.format(im['file'],im['failure']))
-            continue
-        max_conf = ct_utils.get_max_conf(im)
-        detections = []
-        max_detection_category_probabilities = [None] * n_non_empty_detection_categories
-        max_classification_category_probabilities = [0] * n_classification_categories
-        # d = im['detections'][0]
-        for d in im['detections']:
-            # Skip sub-threshold detections
-            if (min_confidence is not None) and (d['conf'] < min_confidence):
-                continue
-            input_bbox = d['bbox']
-            # Our .json format is xmin/ymin/w/h
-            #
-            # Our .csv format was ymin/xmin/ymax/xmax
-            xmin = input_bbox[0]
-            ymin = input_bbox[1]
-            xmax = input_bbox[0] + input_bbox[2]
-            ymax = input_bbox[1] + input_bbox[3]
-            output_detection = [ymin, xmin, ymax, xmax]
-            output_detection.append(d['conf'])
-            # Category 0 is empty, for which we don't have a column, so the max
-            # confidence for category N goes in column N-1
-            detection_category_id = int(d['category'])
-            assert detection_category_id > 0 and detection_category_id <= \
-                n_non_empty_detection_categories
-            detection_category_column = detection_category_id - 1
-            detection_category_max = max_detection_category_probabilities[detection_category_column]
-            if detection_category_max is None or d['conf'] > detection_category_max:
-                max_detection_category_probabilities[detection_category_column] = d['conf']
-            output_detection.append(detection_category_id)
-            detections.append(output_detection)
-            if 'classifications' in d:
-                assert n_classification_categories > 0,\
-                    'Oops, I have classification results, but no classification metadata'
-                for c in d['classifications']:
-                    category_id = c[0]
-                    p = c[1]
-                    category_index = classification_category_id_to_column_number[category_id]
-                    if (max_classification_category_probabilities[category_index] < p):
-                        max_classification_category_probabilities[category_index] = p
-                # ...for each classification
-            # ...if we have classification results for this detection
-        # ...for each detection
-        detection_string = ''
-        if not omit_bounding_boxes:
-            detection_string = json.dumps(detections)
-        row = [image_id, max_conf, detection_string]
-        row.extend(max_detection_category_probabilities)
-        row.extend(max_classification_category_probabilities)
-        for field_name in optional_fields_present:
-            if field_name not in im:
-                row.append('')
-            else:
-                row.append(str(im[field_name]))
-        assert len(row) == expected_row_length
-        rows.append(row)
-    # ...for each image
-    print('Writing to csv...')
-    with open(output_path, 'w', newline='', encoding=output_encoding) as f:
-        writer = csv.writer(f, delimiter=',')
-        header = fixed_columns
-        header.extend(detection_category_column_names)
-        if n_classification_categories > 0:
-            header.extend(classification_category_column_names)
-        for field_name in optional_fields_present:
-            header.append(field_name)
-        writer.writerow(header)
-        writer.writerows(rows)
-# ...def convert_json_to_csv(...)
-def convert_csv_to_json(input_path,output_path=None,overwrite=True):
-    """
-    Convert .csv to .json.  If output_path is None, will convert x.csv to x.json.
-    Args:
-        input_path (str): .csv filename to convert to .json
-        output_path (str, optional): the output .json file to generate; if this is None, uses
-            [input_path].json
-        overwrite (bool): whether to overwrite an existing .json file; if this is False and the
-            output file exists, no-ops and returns
-    """
-    if output_path is None:
-        output_path = os.path.splitext(input_path)[0]+'.json'
-    if os.path.isfile(output_path) and (not overwrite):
-        print('File {} exists, skipping csv --> json conversion'.format(output_path))
-        return
-    # Format spec:
-    #
-    # https://github.com/agentmorris/MegaDetector/tree/master/api/batch_processing
-    print('Loading csv results...')
-    df = load_api_results_csv(input_path)
-    info = {
-        "format_version":"1.2",
-        "detector": "unknown",
-        "detection_completion_time" : "unknown",
-        "classifier": "unknown",
-        "classification_completion_time": "unknown"
-    }
-    classification_categories = {}
-    detection_categories = annotation_constants.detector_bbox_categories
-    images = []
-    # iFile = 0; row = df.iloc[iFile]
-    for iFile,row in df.iterrows():
-        image = {}
-        image['file'] = row['image_path']
-        image['max_detection_conf'] = round(row['max_confidence'], CONF_DIGITS)
-        src_detections = row['detections']
-        out_detections = []
-        for iDetection,detection in enumerate(src_detections):
-            # Our .csv format was ymin/xmin/ymax/xmax
-            #
-            # Our .json format is xmin/ymin/w/h
-            ymin = detection[0]
-            xmin = detection[1]
-            ymax = detection[2]
-            xmax = detection[3]
-            bbox = [xmin, ymin, xmax-xmin, ymax-ymin]
-            conf = detection[4]
-            iClass = detection[5]
-            out_detection = {}
-            out_detection['category'] = str(iClass)
-            out_detection['conf'] = conf
-            out_detection['bbox'] = bbox
-            out_detections.append(out_detection)
-        # ...for each detection
-        image['detections'] = out_detections
-        images.append(image)
-    # ...for each image
-    json_out = {}
-    json_out['info'] = info
-    json_out['detection_categories'] = detection_categories
-    json_out['classification_categories'] = classification_categories
-    json_out['images'] = images
-    json.dump(json_out,open(output_path,'w'),indent=1)
-# ...def convert_csv_to_json(...)
-#%% Interactive driver
-if False:
-    #%%
-    input_path = r'c:\temp\test.json'
-    min_confidence = None
-    output_path = input_path + '.csv'
-    convert_json_to_csv(input_path,output_path,min_confidence=min_confidence,
-                        omit_bounding_boxes=False)
-    #%%
-    base_path = r'c:\temp\json'
-    input_paths = os.listdir(base_path)
-    input_paths = [os.path.join(base_path,s) for s in input_paths]
-    min_confidence = None
-    for input_path in input_paths:
-        output_path = input_path + '.csv'
-        convert_json_to_csv(input_path,output_path,min_confidence=min_confidence,
-                            omit_bounding_boxes=True)
-    #%% Concatenate .csv files from a folder
-    import glob
-    csv_files = glob.glob(os.path.join(base_path,'*.json.csv' ))
-    master_csv = os.path.join(base_path,'all.csv')
-    print('Concatenating {} files to {}'.format(len(csv_files),master_csv))
-    header = None
-    with open(master_csv, 'w') as fout:
-        for filename in tqdm(csv_files):
-            with open(filename) as fin:
-                lines = fin.readlines()
-                if header is not None:
-                    assert lines[0] == header
-                else:
-                    header = lines[0]
-                    fout.write(header)
-                for line in lines[1:]:
-                    if len(line.strip()) == 0:
-                        continue
-                    fout.write(line)
-        # ...for each .csv file
-    # with open(master_csv)
-#%% Command-line driver
-def main():
-    parser = argparse.ArgumentParser()
-    parser.add_argument('input_path',type=str,
-                        help='Input filename ending in .json or .csv')
-    parser.add_argument('--output_path',type=str,default=None,
-                        help='Output filename ending in .json or .csv (defaults to ' + \
-                             'input file, with .json/.csv replaced by .csv/.json)')
-    if len(sys.argv[1:]) == 0:
-        parser.print_help()
-        parser.exit()
-    args = parser.parse_args()
-    if args.output_path is None:
-        if args.input_path.endswith('.csv'):
-            args.output_path = args.input_path[:-4] + '.json'
-        elif args.input_path.endswith('.json'):
-            args.output_path = args.input_path[:-5] + '.csv'
-        else:
-            raise ValueError('Illegal input file extension')
-    if args.input_path.endswith('.csv') and args.output_path.endswith('.json'):
-        convert_csv_to_json(args.input_path,args.output_path)
-    elif args.input_path.endswith('.json') and args.output_path.endswith('.csv'):
-        convert_json_to_csv(args.input_path,args.output_path)
-    else:
-        raise ValueError('Illegal format combination')
-if __name__ == '__main__':
-    main()

api/batch_processing/postprocessing/load_api_results.py DELETED

@@ -1,195 +0,0 @@
-"""
-load_api_results.py
-DEPRECATED
-As of 2023.12, this module is used in postprocessing and RDE.  Not recommended
-for new code.
-Loads the output of the batch processing API (json) into a Pandas dataframe.
-Includes functions to read/write the (very very old) .csv results format.
-"""
-#%% Imports
-import json
-import os
-from typing import Dict, Mapping, Optional, Tuple
-import pandas as pd
-from md_utils import ct_utils
-#%% Functions for loading .json results into a Pandas DataFrame, and writing back to .json
-def load_api_results(api_output_path: str, normalize_paths: bool = True,
-                     filename_replacements: Optional[Mapping[str, str]] = None,
-                     force_forward_slashes: bool = True
-                     ) -> Tuple[pd.DataFrame, Dict]:
-    r"""
-    Loads json-formatted MegaDetector results to a Pandas DataFrame.
-    Args:
-        api_output_path: path to the output json file
-        normalize_paths: whether to apply os.path.normpath to the 'file' field
-            in each image entry in the output file
-        filename_replacements: replace some path tokens to match local paths to
-            the original blob structure
-        force_forward_slashes: whether to convert backslashes to forward slashes
-            in filenames
-    Returns:
-        detection_results: pd.DataFrame, contains at least the columns ['file', 'detections','failure']
-        other_fields: a dict containing fields in the results other than 'images'
-    """
-    print('Loading results from {}'.format(api_output_path))
-    with open(api_output_path) as f:
-        detection_results = json.load(f)
-    # Validate that this is really a detector output file
-    for s in ['info', 'detection_categories', 'images']:
-        assert s in detection_results, 'Missing field {} in detection results'.format(s)
-    # Fields in the output json other than 'images'
-    other_fields = {}
-    for k, v in detection_results.items():
-        if k != 'images':
-            other_fields[k] = v
-    if normalize_paths:
-        for image in detection_results['images']:
-            image['file'] = os.path.normpath(image['file'])
-    if force_forward_slashes:
-        for image in detection_results['images']:
-            image['file'] = image['file'].replace('\\','/')
-    # Replace some path tokens to match local paths to original blob structure
-    if filename_replacements is not None:
-        for string_to_replace in filename_replacements.keys():
-            replacement_string = filename_replacements[string_to_replace]
-            for im in detection_results['images']:
-                im['file'] = im['file'].replace(string_to_replace,replacement_string)
-    print('Converting results to dataframe')
-    # If this is a newer file that doesn't include maximum detection confidence values,
-    # add them, because our unofficial internal dataframe format includes this.
-    for im in detection_results['images']:
-        if 'max_detection_conf' not in im:
-            im['max_detection_conf'] = ct_utils.get_max_conf(im)
-    # Pack the json output into a Pandas DataFrame
-    detection_results = pd.DataFrame(detection_results['images'])
-    print('Finished loading MegaDetector results for {} images from {}'.format(
-            len(detection_results),api_output_path))
-    return detection_results, other_fields
-def write_api_results(detection_results_table, other_fields, out_path):
-    """
-    Writes a Pandas DataFrame to the MegaDetector .json format.
-    """
-    print('Writing detection results to {}'.format(out_path))
-    fields = other_fields
-    images = detection_results_table.to_json(orient='records',
-                                             double_precision=3)
-    images = json.loads(images)
-    fields['images'] = images
-    # Convert the 'version' field back to a string as per format convention
-    try:
-        version = other_fields['info']['format_version']
-        if not isinstance(version,str):
-            other_fields['info']['format_version'] = str(version)
-    except Exception:
-        print('Warning: error determining format version')
-        pass
-    # Remove 'max_detection_conf' as per newer file convention (format >= v1.3)
-    try:
-        version = other_fields['info']['format_version']
-        version = float(version)
-        if version >= 1.3:
-            for im in images:
-                if 'max_detection_conf' in im:
-                    del im['max_detection_conf']
-    except Exception:
-        print('Warning: error removing max_detection_conf from output')
-        pass
-    with open(out_path, 'w') as f:
-        json.dump(fields, f, indent=1)
-    print('Finished writing detection results to {}'.format(out_path))
-def load_api_results_csv(filename, normalize_paths=True, filename_replacements={}, nrows=None):
-    """
-    [DEPRECATED]
-    Loads .csv-formatted MegaDetector results to a pandas table
-    """
-    print('Loading MegaDetector results from {}'.format(filename))
-    detection_results = pd.read_csv(filename,nrows=nrows)
-    print('De-serializing MegaDetector results from {}'.format(filename))
-    # Confirm that this is really a detector output file
-    for s in ['image_path','max_confidence','detections']:
-        assert s in detection_results.columns
-    # Normalize paths to simplify comparisons later
-    if normalize_paths:
-        detection_results['image_path'] = detection_results['image_path'].apply(os.path.normpath)
-    # De-serialize detections
-    detection_results['detections'] = detection_results['detections'].apply(json.loads)
-    # Optionally replace some path tokens to match local paths to the original blob structure
-    # string_to_replace = list(options.detector_output_filename_replacements.keys())[0]
-    for string_to_replace in filename_replacements:
-        replacement_string = filename_replacements[string_to_replace]
-        # iRow = 0
-        for iRow in range(0,len(detection_results)):
-            row = detection_results.iloc[iRow]
-            fn = row['image_path']
-            fn = fn.replace(string_to_replace,replacement_string)
-            detection_results.at[iRow,'image_path'] = fn
-    print('Finished loading and de-serializing MD results for {} images from {}'.format(
-        len(detection_results),filename))
-    return detection_results
-def write_api_results_csv(detection_results, filename):
-    """
-    [DEPRECATED]
-    Writes a Pandas table to csv in a way that's compatible with the .csv output
-    format.  Currently just a wrapper around to_csv that forces output writing
-    to go through a common code path.
-    """
-    print('Writing detection results to {}'.format(filename))
-    detection_results.to_csv(filename, index=False)
-    print('Finished writing detection results to {}'.format(filename))

megadetector 5.0.10__py3-none-any.whl → 5.0.11__py3-none-any.whl

Potentially problematic release.

megadetector 5.0.10__py3-none-any.whl → 5.0.11__py3-none-any.whl