megadetector 5.0.5__py3-none-any.whl → 5.0.7__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release: this version of megadetector might be problematic.
- api/batch_processing/data_preparation/manage_local_batch.py +302 -263
- api/batch_processing/data_preparation/manage_video_batch.py +81 -2
- api/batch_processing/postprocessing/add_max_conf.py +1 -0
- api/batch_processing/postprocessing/categorize_detections_by_size.py +50 -19
- api/batch_processing/postprocessing/compare_batch_results.py +110 -60
- api/batch_processing/postprocessing/load_api_results.py +56 -70
- api/batch_processing/postprocessing/md_to_coco.py +1 -1
- api/batch_processing/postprocessing/md_to_labelme.py +2 -1
- api/batch_processing/postprocessing/postprocess_batch_results.py +240 -81
- api/batch_processing/postprocessing/render_detection_confusion_matrix.py +625 -0
- api/batch_processing/postprocessing/repeat_detection_elimination/find_repeat_detections.py +71 -23
- api/batch_processing/postprocessing/repeat_detection_elimination/remove_repeat_detections.py +1 -1
- api/batch_processing/postprocessing/repeat_detection_elimination/repeat_detections_core.py +227 -75
- api/batch_processing/postprocessing/subset_json_detector_output.py +132 -5
- api/batch_processing/postprocessing/top_folders_to_bottom.py +1 -1
- api/synchronous/api_core/animal_detection_api/detection/run_detector_batch.py +2 -2
- classification/prepare_classification_script.py +191 -191
- data_management/coco_to_yolo.py +68 -45
- data_management/databases/integrity_check_json_db.py +7 -5
- data_management/generate_crops_from_cct.py +3 -3
- data_management/get_image_sizes.py +8 -6
- data_management/importers/add_timestamps_to_icct.py +79 -0
- data_management/importers/animl_results_to_md_results.py +160 -0
- data_management/importers/auckland_doc_test_to_json.py +4 -4
- data_management/importers/auckland_doc_to_json.py +1 -1
- data_management/importers/awc_to_json.py +5 -5
- data_management/importers/bellevue_to_json.py +5 -5
- data_management/importers/carrizo_shrubfree_2018.py +5 -5
- data_management/importers/carrizo_trail_cam_2017.py +5 -5
- data_management/importers/cct_field_adjustments.py +2 -3
- data_management/importers/channel_islands_to_cct.py +4 -4
- data_management/importers/ena24_to_json.py +5 -5
- data_management/importers/helena_to_cct.py +10 -10
- data_management/importers/idaho-camera-traps.py +12 -12
- data_management/importers/idfg_iwildcam_lila_prep.py +8 -8
- data_management/importers/jb_csv_to_json.py +4 -4
- data_management/importers/missouri_to_json.py +1 -1
- data_management/importers/noaa_seals_2019.py +1 -1
- data_management/importers/pc_to_json.py +5 -5
- data_management/importers/prepare-noaa-fish-data-for-lila.py +4 -4
- data_management/importers/prepare_zsl_imerit.py +5 -5
- data_management/importers/rspb_to_json.py +4 -4
- data_management/importers/save_the_elephants_survey_A.py +5 -5
- data_management/importers/save_the_elephants_survey_B.py +6 -6
- data_management/importers/snapshot_safari_importer.py +9 -9
- data_management/importers/snapshot_serengeti_lila.py +9 -9
- data_management/importers/timelapse_csv_set_to_json.py +5 -7
- data_management/importers/ubc_to_json.py +4 -4
- data_management/importers/umn_to_json.py +4 -4
- data_management/importers/wellington_to_json.py +1 -1
- data_management/importers/wi_to_json.py +2 -2
- data_management/importers/zamba_results_to_md_results.py +181 -0
- data_management/labelme_to_coco.py +35 -7
- data_management/labelme_to_yolo.py +229 -0
- data_management/lila/add_locations_to_island_camera_traps.py +1 -1
- data_management/lila/add_locations_to_nacti.py +147 -0
- data_management/lila/create_lila_blank_set.py +474 -0
- data_management/lila/create_lila_test_set.py +2 -1
- data_management/lila/create_links_to_md_results_files.py +106 -0
- data_management/lila/download_lila_subset.py +46 -21
- data_management/lila/generate_lila_per_image_labels.py +23 -14
- data_management/lila/get_lila_annotation_counts.py +17 -11
- data_management/lila/lila_common.py +14 -11
- data_management/lila/test_lila_metadata_urls.py +116 -0
- data_management/ocr_tools.py +829 -0
- data_management/resize_coco_dataset.py +13 -11
- data_management/yolo_output_to_md_output.py +84 -12
- data_management/yolo_to_coco.py +38 -20
- detection/process_video.py +36 -14
- detection/pytorch_detector.py +23 -8
- detection/run_detector.py +76 -19
- detection/run_detector_batch.py +178 -63
- detection/run_inference_with_yolov5_val.py +326 -57
- detection/run_tiled_inference.py +153 -43
- detection/video_utils.py +34 -8
- md_utils/ct_utils.py +172 -1
- md_utils/md_tests.py +372 -51
- md_utils/path_utils.py +167 -39
- md_utils/process_utils.py +26 -7
- md_utils/split_locations_into_train_val.py +215 -0
- md_utils/string_utils.py +10 -0
- md_utils/url_utils.py +0 -2
- md_utils/write_html_image_list.py +9 -26
- md_visualization/plot_utils.py +12 -8
- md_visualization/visualization_utils.py +106 -7
- md_visualization/visualize_db.py +16 -8
- md_visualization/visualize_detector_output.py +208 -97
- {megadetector-5.0.5.dist-info → megadetector-5.0.7.dist-info}/METADATA +3 -6
- {megadetector-5.0.5.dist-info → megadetector-5.0.7.dist-info}/RECORD +98 -121
- {megadetector-5.0.5.dist-info → megadetector-5.0.7.dist-info}/WHEEL +1 -1
- taxonomy_mapping/map_lila_taxonomy_to_wi_taxonomy.py +1 -1
- taxonomy_mapping/map_new_lila_datasets.py +43 -39
- taxonomy_mapping/prepare_lila_taxonomy_release.py +5 -2
- taxonomy_mapping/preview_lila_taxonomy.py +27 -27
- taxonomy_mapping/species_lookup.py +33 -13
- taxonomy_mapping/taxonomy_csv_checker.py +7 -5
- api/synchronous/api_core/yolov5/detect.py +0 -252
- api/synchronous/api_core/yolov5/export.py +0 -607
- api/synchronous/api_core/yolov5/hubconf.py +0 -146
- api/synchronous/api_core/yolov5/models/__init__.py +0 -0
- api/synchronous/api_core/yolov5/models/common.py +0 -738
- api/synchronous/api_core/yolov5/models/experimental.py +0 -104
- api/synchronous/api_core/yolov5/models/tf.py +0 -574
- api/synchronous/api_core/yolov5/models/yolo.py +0 -338
- api/synchronous/api_core/yolov5/train.py +0 -670
- api/synchronous/api_core/yolov5/utils/__init__.py +0 -36
- api/synchronous/api_core/yolov5/utils/activations.py +0 -103
- api/synchronous/api_core/yolov5/utils/augmentations.py +0 -284
- api/synchronous/api_core/yolov5/utils/autoanchor.py +0 -170
- api/synchronous/api_core/yolov5/utils/autobatch.py +0 -66
- api/synchronous/api_core/yolov5/utils/aws/__init__.py +0 -0
- api/synchronous/api_core/yolov5/utils/aws/resume.py +0 -40
- api/synchronous/api_core/yolov5/utils/benchmarks.py +0 -148
- api/synchronous/api_core/yolov5/utils/callbacks.py +0 -71
- api/synchronous/api_core/yolov5/utils/dataloaders.py +0 -1087
- api/synchronous/api_core/yolov5/utils/downloads.py +0 -178
- api/synchronous/api_core/yolov5/utils/flask_rest_api/example_request.py +0 -19
- api/synchronous/api_core/yolov5/utils/flask_rest_api/restapi.py +0 -46
- api/synchronous/api_core/yolov5/utils/general.py +0 -1018
- api/synchronous/api_core/yolov5/utils/loggers/__init__.py +0 -187
- api/synchronous/api_core/yolov5/utils/loggers/wandb/__init__.py +0 -0
- api/synchronous/api_core/yolov5/utils/loggers/wandb/log_dataset.py +0 -27
- api/synchronous/api_core/yolov5/utils/loggers/wandb/sweep.py +0 -41
- api/synchronous/api_core/yolov5/utils/loggers/wandb/wandb_utils.py +0 -577
- api/synchronous/api_core/yolov5/utils/loss.py +0 -234
- api/synchronous/api_core/yolov5/utils/metrics.py +0 -355
- api/synchronous/api_core/yolov5/utils/plots.py +0 -489
- api/synchronous/api_core/yolov5/utils/torch_utils.py +0 -314
- api/synchronous/api_core/yolov5/val.py +0 -394
- md_utils/matlab_porting_tools.py +0 -97
- {megadetector-5.0.5.dist-info → megadetector-5.0.7.dist-info}/LICENSE +0 -0
- {megadetector-5.0.5.dist-info → megadetector-5.0.7.dist-info}/top_level.txt +0 -0
md_utils/write_html_image_list.py
CHANGED

@@ -8,16 +8,13 @@
 # Each "filename" can also be a dict with elements 'filename','title',
 # 'imageStyle','textStyle', 'linkTarget'
 #
-# Strips directory information away if options.makeRelative == 1.
-#
-# Tries to convert absolute to relative paths if options.makeRelative == 2.
-#
 ########

 #%% Constants and imports

 import os
 import math
+import urllib

 from md_utils import path_utils

@@ -39,12 +36,12 @@ def write_html_image_list(filename=None,images=None,options=None):
     options: a dict with one or more of the following fields:

         fHtml
-        makeRelative
         headerHtml
         trailerHtml
         defaultTextStyle
         defaultImageStyle
         maxFiguresPerHtmlFile
+        urlEncodeFilenames (default True, e.g. '#' will be replaced by '%23')

     """

@@ -55,9 +52,6 @@ def write_html_image_list(filename=None,images=None,options=None):
     if 'fHtml' not in options:
         options['fHtml'] = -1

-    if 'makeRelative' not in options:
-        options['makeRelative'] = 0
-
     if 'headerHtml' not in options or options['headerHtml'] is None:
         options['headerHtml'] = ''

@@ -71,6 +65,9 @@ def write_html_image_list(filename=None,images=None,options=None):
     if 'defaultImageStyle' not in options or options['defaultImageStyle'] is None:
         options['defaultImageStyle'] = \
             "margin:0px;margin-top:5px;margin-bottom:5px;"
+
+    if 'urlEncodeFilenames' not in options or options['urlEncodeFilenames'] is None:
+        options['urlEncodeFilenames'] = True

     # Possibly split the html output for figures into multiple files; Chrome gets sad with
     # thousands of images in a single tab.
@@ -98,24 +95,6 @@ def write_html_image_list(filename=None,images=None,options=None):
             imageInfo['textStyle'] = options['defaultTextStyle']
         images[iImage] = imageInfo

-    # Remove leading directory information from filenames if requested
-    if options['makeRelative'] == 1:
-
-        for iImage in range(0,len(images)):
-            _,n,e = path_utils.fileparts(images[iImage]['filename'])
-            images[iImage]['filename'] = n + e
-
-    elif options['makeRelative'] == 2:
-
-        baseDir,_,_ = path_utils.fileparts(filename)
-        if len(baseDir) > 1 and baseDir[-1] != '\\':
-            baseDir = baseDir + '\\'
-
-        for iImage in range(0,len(images)):
-            fn = images[iImage]['filename']
-            fn = fn.replace(baseDir,'')
-            images[iImage]['filename'] = fn
-
     nImages = len(images)

     # If we need to break this up into multiple files...
@@ -197,6 +176,10 @@ def write_html_image_list(filename=None,images=None,options=None):
         title = title.encode('ascii','ignore').decode('ascii')
         filename = filename.encode('ascii','ignore').decode('ascii')

+        if options['urlEncodeFilenames']:
+            filename = filename.replace('\\','/')
+            filename = urllib.parse.quote(filename)
+
         if len(title) > 0:
             fHtml.write(
                 '<p style="{}">{}</p>\n'\
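The new urlEncodeFilenames option percent-encodes image paths before they are written into the generated HTML, after converting backslashes to forward slashes. A minimal stdlib-only sketch of the encoding step added above (the sample path is hypothetical):

import urllib.parse

# Mirrors the new behavior in write_html_image_list: backslashes become
# forward slashes, then the path is percent-encoded so characters like '#'
# no longer break the <img src="..."> URL.
filename = 'camera_01\\day#3\\IMG_0001.JPG'
encoded = urllib.parse.quote(filename.replace('\\', '/'))
print(encoded)  # camera_01/day%233/IMG_0001.JPG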
md_visualization/plot_utils.py
CHANGED
@@ -28,8 +28,9 @@ def plot_confusion_matrix(
         cmap: Union[str, matplotlib.colors.Colormap] = matplotlib.cm.Blues,
         vmax: Optional[float] = None,
         use_colorbar: bool = True,
-        y_label: bool = True,
-        fmt: str = '{:.0f}'
+        y_label: bool = True,
+        fmt: str = '{:.0f}',
+        fig=None
 ) -> matplotlib.figure.Figure:
     """
     Plot a confusion matrix. By default, assumes values in the given matrix
@@ -56,18 +57,20 @@ def plot_confusion_matrix(
     assert matrix.shape[1] == num_classes
     assert len(classes) == num_classes

+    normalized_matrix = matrix.astype(np.float64) / (
+        matrix.sum(axis=1, keepdims=True) + 1e-7)
     if normalize:
-        matrix = matrix.astype(np.float64) / (
-            matrix.sum(axis=1, keepdims=True) + 1e-7)
+        matrix = normalized_matrix

     fig_h = 3 + 0.3 * num_classes
     fig_w = fig_h
     if use_colorbar:
         fig_w += 0.5

-    fig = matplotlib.figure.Figure(figsize=(fig_w, fig_h), tight_layout=True)
+    if fig is None:
+        fig = matplotlib.figure.Figure(figsize=(fig_w, fig_h), tight_layout=True)
     ax = fig.subplots(1, 1)
-    im = ax.imshow(matrix, interpolation='nearest', cmap=cmap, vmax=vmax)
+    im = ax.imshow(normalized_matrix, interpolation='nearest', cmap=cmap, vmax=vmax)
     ax.set_title(title)

     if use_colorbar:
@@ -86,10 +89,11 @@ def plot_confusion_matrix(
     ax.set_ylabel('Ground-truth class')

     for i, j in np.ndindex(matrix.shape):
-        ax.text(j, i, fmt.format(matrix[i, j]),
+        v = matrix[i, j]
+        ax.text(j, i, fmt.format(v),
                 horizontalalignment='center',
                 verticalalignment='center',
-                color='white' if matrix[i, j] > 0.5 else 'black')
+                color='white' if normalized_matrix[i, j] > 0.5 else 'black')

     return fig

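The new fig parameter lets a caller supply an existing matplotlib Figure instead of having plot_confusion_matrix create one. A sketch under the assumption that the leading parameters are (matrix, classes, normalize, ...) as suggested by the function body above; only fig is new in 5.0.7:

import numpy as np
import matplotlib.pyplot as plt
from md_visualization import plot_utils

# Hypothetical 2x2 count matrix: rows are ground-truth classes, columns predictions
matrix = np.array([[40, 10],
                   [5, 45]])

# Create the figure ourselves (e.g. via pyplot, for interactive display) and
# pass it in through the new [fig] argument; the function then draws into it
# rather than constructing its own matplotlib.figure.Figure.
fig = plt.figure(figsize=(5, 5))
plot_utils.plot_confusion_matrix(matrix, ['animal', 'empty'], normalize=True, fig=fig)
plt.show()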
md_visualization/visualization_utils.py
CHANGED

@@ -166,13 +166,26 @@ def load_image(input_file: Union[str, BytesIO]) -> Image:
     return image


-def resize_image(image, target_width, target_height=-1):
+def resize_image(image, target_width, target_height=-1, output_file=None):
     """
     Resizes a PIL image object to the specified width and height; does not resize
     in place. If either width or height are -1, resizes with aspect ratio preservation.
     If both are -1, returns the original image (does not copy in this case).
+
+    None is equivalent to -1 for target_width and target_height.
+
+    [image] can be a PIL image or a filename.
     """

+    if isinstance(image,str):
+        image = load_image(image)
+
+    if target_width is None:
+        target_width = -1
+
+    if target_height is None:
+        target_height = -1
+
     # Null operation
     if target_width == -1 and target_height == -1:
         return image
@@ -197,6 +210,9 @@ def resize_image(image, target_width, target_height=-1):
     except:
         resized_image = image.resize((target_width, target_height), Image.Resampling.LANCZOS)

+    if output_file is not None:
+        exif_preserving_save(resized_image,output_file)
+
     return resized_image


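resize_image now also accepts a filename for [image], treats None like -1, and can write the result directly via output_file. A sketch with placeholder paths, assuming these hunks belong to md_visualization/visualization_utils.py (per the file list at the top of this diff):

from md_visualization import visualization_utils as vis_utils

# Resize to 800 px wide, preserving aspect ratio (height -1), reading from and
# writing to disk in one call per the new signature shown above.
resized = vis_utils.resize_image('IMG_0001.JPG', target_width=800, target_height=-1,
                                 output_file='IMG_0001_800px.JPG')
print(resized.size)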
@@ -363,7 +379,8 @@ def render_detection_bounding_boxes(detections, image,
     The type of the numerical label (default string) needs to be consistent with the keys in
     label_map; no casting is carried out. If this is None, no classification labels are shown.

-    confidence_threshold: optional, threshold above which boxes are rendered
+    confidence_threshold: optional, threshold above which boxes are rendered. Can also be a dictionary
+    mapping category IDs to thresholds.

     thickness: line thickness in pixels. Default value is 4.

@@ -397,9 +414,15 @@ def render_detection_bounding_boxes(detections, image,

         score = detection['conf']

+        if isinstance(confidence_threshold,dict):
+            rendering_threshold = confidence_threshold[detection['category']]
+        else:
+            rendering_threshold = confidence_threshold
+
+
         # Always render objects with a confidence of "None", this is typically used
         # for ground truth data.
-        if score is None or score >= confidence_threshold:
+        if score is None or score >= rendering_threshold:

             x1, y1, w_box, h_box = detection['bbox']
             display_boxes.append([y1, x1, y1 + h_box, x1 + w_box])
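confidence_threshold can now be a dictionary mapping category IDs to per-category thresholds. A sketch with hypothetical detections in MegaDetector output format (the '1'/'2'/'3' = animal/person/vehicle convention is assumed, not shown in this hunk):

from md_visualization import visualization_utils as vis_utils

# Hypothetical detections; 'bbox' is [x, y, width, height] in normalized coordinates
detections = [
    {'category': '1', 'conf': 0.20, 'bbox': [0.10, 0.20, 0.30, 0.40]},
    {'category': '2', 'conf': 0.20, 'bbox': [0.50, 0.50, 0.20, 0.30]},
]

# With a dict, each category gets its own rendering threshold: here the animal
# box (0.20 >= 0.15) is drawn, the person box (0.20 < 0.30) is suppressed.
per_category_thresholds = {'1': 0.15, '2': 0.30, '3': 0.40}

image = vis_utils.open_image('IMG_0001.JPG')  # placeholder path
vis_utils.render_detection_bounding_boxes(detections, image,
                                          confidence_threshold=per_category_thresholds)
image.save('IMG_0001_annotated.JPG')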
@@ -784,7 +807,8 @@ def draw_bounding_boxes_on_file(input_file, output_file, detections, confidence_
                                 detector_label_map=DEFAULT_DETECTOR_LABEL_MAP,
                                 thickness=DEFAULT_BOX_THICKNESS, expansion=0,
                                 colormap=DEFAULT_COLORS,
-                                custom_strings=None):
+                                label_font_size=DEFAULT_LABEL_FONT_SIZE,
+                                custom_strings=None,target_size=None):
     """
     Render detection bounding boxes on an image loaded from file, writing the results to a
     new image file.
@@ -804,15 +828,21 @@ def draw_bounding_boxes_on_file(input_file, output_file, detections, confidence_
     custom_strings: optional set of strings to append to detection labels, should have the
     same length as [detections]. Appended before classification labels, if classification
     data is provided.
+
+    target_size: tuple of (target_width,target_height). Either or both can be -1,
+    see resize_image for documentation. If None or (-1,-1), uses the original image size.
     """

     image = open_image(input_file)
-
+
+    if target_size is not None:
+        image = resize_image(image,target_size[0],target_size[1])
+
     render_detection_bounding_boxes(
         detections, image, label_map=detector_label_map,
         confidence_threshold=confidence_threshold,
         thickness=thickness,expansion=expansion,colormap=colormap,
-        custom_strings=custom_strings)
+        custom_strings=custom_strings,label_font_size=label_font_size)

     image.save(output_file)

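draw_bounding_boxes_on_file picks up label_font_size and target_size. A sketch with placeholder paths and the hypothetical detection format used above:

from md_visualization import visualization_utils as vis_utils

detections = [{'category': '1', 'conf': 0.85, 'bbox': [0.25, 0.30, 0.40, 0.35]}]

# target_size=(1280, -1) downsizes to 1280 px wide (aspect-preserving) before
# rendering, per the resize_image semantics documented in the hunk above.
vis_utils.draw_bounding_boxes_on_file('IMG_0001.JPG', 'IMG_0001_boxes.JPG', detections,
                                      confidence_threshold=0.2,
                                      target_size=(1280, -1))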
@@ -838,4 +868,73 @@ def draw_db_boxes_on_file(input_file, output_file, boxes, classes=None,

     image.save(output_file)

-
+
+def gray_scale_fraction(image,crop_size=(0.1,0.1)):
+    """
+    Returns the fraction of the pixels in [image] that appear to be grayscale (R==G==B),
+    useful for approximating whether this is a night-time image when flash information is not
+    available in EXIF data (or for video frames, where this information is often not available
+    in structured metadata at all).
+
+    [image] can be a PIL image or a file name.
+
+    crop_size should be a 2-element list/tuple, representing the fraction of the image
+    to crop at the top and bottom, respectively, before analyzing (to minimize the possibility
+    of including color elements in the image chrome).
+    """
+
+    if isinstance(image,str):
+        image = Image.open(image)
+
+    if image.mode == 'L':
+        return 1.0
+
+    if len(image.getbands()) == 1:
+        return 1.0
+
+    # Crop if necessary
+    if crop_size[0] > 0 or crop_size[1] > 0:
+
+        assert (crop_size[0] + crop_size[1]) < 1.0, \
+            print('Illegal crop size: {}'.format(str(crop_size)))
+
+        top_crop_pixels = int(image.height * crop_size[0])
+        bottom_crop_pixels = int(image.height * crop_size[1])
+
+        left = 0
+        right = image.width
+
+        # Remove pixels from the top
+        first_crop_top = top_crop_pixels
+        first_crop_bottom = image.height
+        first_crop = image.crop((left, first_crop_top, right, first_crop_bottom))
+
+        # Remove pixels from the bottom
+        second_crop_top = 0
+        second_crop_bottom = first_crop.height - bottom_crop_pixels
+        second_crop = first_crop.crop((left, second_crop_top, right, second_crop_bottom))
+
+        image = second_crop
+
+    # It doesn't matter if these are actually R/G/B, they're just names
+    r = np.array(image.getchannel(0))
+    g = np.array(image.getchannel(1))
+    b = np.array(image.getchannel(2))
+
+    gray_pixels = np.logical_and(r == g, r == b)
+    n_pixels = gray_pixels.size
+    n_gray_pixels = gray_pixels.sum()
+
+    return n_gray_pixels / n_pixels
+
+    # Non-numpy way to do the same thing, briefly keeping this here for posterity
+    if False:
+
+        w, h = image.size
+        n_pixels = w*h
+        n_gray_pixels = 0
+        for i in range(w):
+            for j in range(h):
+                r, g, b = image.getpixel((i,j))
+                if r == g and r == b and g == b:
+                    n_gray_pixels += 1
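gray_scale_fraction estimates whether a frame is a night-time/IR image by measuring how many pixels satisfy R==G==B. A usage sketch with a placeholder path and an assumed 0.9 cutoff:

from md_visualization import visualization_utils as vis_utils

# Crop 10% off the top and bottom (the defaults) so colored timestamp/logo bars
# don't skew the estimate, then measure the fraction of R==G==B pixels.
fraction = vis_utils.gray_scale_fraction('frame_000123.jpg', crop_size=(0.1, 0.1))
if fraction > 0.9:
    print('Probably a night-time/IR frame ({:.1%} grayscale)'.format(fraction))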
md_visualization/visualize_db.py
CHANGED
@@ -3,7 +3,7 @@
 # visualize_db.py
 #
 # Outputs an HTML page visualizing annotations (class labels and/or bounding boxes)
-# on a sample of images in a database in the COCO Camera Traps format
+# on a sample of images in a database in the COCO Camera Traps format.
 #
 ########

@@ -41,7 +41,15 @@ class DbVizOptions:
     #
     # If viz_size is None or (-1,-1), the original image size is used.
     viz_size = (675, -1)
+
+    # The most relevant option one might want to set here is:
+    #
+    # htmlOptions['maxFiguresPerHtmlFile']
+    #
+    # ...which can be used to paginate previews to a number of images that will load well
+    # in a browser (5000 is a reasonable limit).
     htmlOptions = write_html_image_list()
+
     sort_by_filename = True
     trim_to_images_with_bboxes = False

@@ -96,7 +104,7 @@ def image_filename_to_path(image_file_name, image_base_dir, pathsep_replacement=

 #%% Core functions

-def process_images(db_path, output_dir, image_base_dir, options=None):
+def visualize_db(db_path, output_dir, image_base_dir, options=None):
     """
     Writes images and html to output_dir to visualize the annotations in the json file
     db_path.
@@ -418,7 +426,7 @@ def process_images(db_path, output_dir, image_base_dir, options=None):

     return htmlOutputFile,image_db

-# def process_images(...)
+# def visualize_db(...)


 #%% Command-line driver
@@ -452,7 +460,8 @@ def main():
     parser.add_argument('--random_seed', action='store', type=int, default=None,
                         help='Random seed for image selection')
     parser.add_argument('--pathsep_replacement', action='store', type=str, default='',
-                        help='Replace path separators in relative filenames with another character (frequently ~)')
+                        help='Replace path separators in relative filenames with another ' + \
+                             'character (frequently ~)')

     if len(sys.argv[1:]) == 0:
         parser.print_help()
@@ -466,7 +475,7 @@ def main():
     if options.random_sort:
         options.sort_by_filename = False

-    process_images(options.db_path,options.output_dir,options.image_base_dir,options)
+    visualize_db(options.db_path,options.output_dir,options.image_base_dir,options)


 if __name__ == '__main__':
@@ -474,7 +483,7 @@ if __name__ == '__main__':
     main()


-#%% Interactive driver
+#%% Interactive driver

 if False:

@@ -487,6 +496,5 @@ if False:
     options = DbVizOptions()
     options.num_to_visualize = 100

-    htmlOutputFile,db = process_images(db_path,output_dir,image_base_dir,options)
+    htmlOutputFile,db = visualize_db(db_path,output_dir,image_base_dir,options)
     # os.startfile(htmlOutputFile)
-
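The core entry point has been renamed from process_images to visualize_db (the old name still appears in the hunk context lines above). A minimal sketch of calling it with the options this diff touches, using placeholder paths:

from md_visualization import visualize_db as vdb

options = vdb.DbVizOptions()
options.num_to_visualize = 100                         # as in the interactive driver above
options.htmlOptions['maxFiguresPerHtmlFile'] = 5000    # pagination limit suggested above

# db.json is a COCO Camera Traps database; returns the HTML index and the sampled db
html_file, image_db = vdb.visualize_db('db.json', 'preview_out', 'image_dir', options=options)
print(html_file)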