PyPI - megadetector - Versions diffs - 5.0.7__py3-none-any.whl → 5.0.9__py3-none-any.whl - Mend

megadetector 5.0.7__py3-none-any.whl → 5.0.9__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of megadetector might be problematic. Click here for more details.

Files changed (191) hide show

api/__init__.py +0 -0
api/batch_processing/__init__.py +0 -0
api/batch_processing/api_core/__init__.py +0 -0
api/batch_processing/api_core/batch_service/__init__.py +0 -0
api/batch_processing/api_core/batch_service/score.py +0 -1
api/batch_processing/api_core/server_job_status_table.py +0 -1
api/batch_processing/api_core_support/__init__.py +0 -0
api/batch_processing/api_core_support/aggregate_results_manually.py +0 -1
api/batch_processing/api_support/__init__.py +0 -0
api/batch_processing/api_support/summarize_daily_activity.py +0 -1
api/batch_processing/data_preparation/__init__.py +0 -0
api/batch_processing/data_preparation/manage_local_batch.py +93 -79
api/batch_processing/data_preparation/manage_video_batch.py +8 -8
api/batch_processing/integration/digiKam/xmp_integration.py +0 -1
api/batch_processing/integration/eMammal/test_scripts/push_annotations_to_emammal.py +0 -1
api/batch_processing/postprocessing/__init__.py +0 -0
api/batch_processing/postprocessing/add_max_conf.py +12 -12
api/batch_processing/postprocessing/categorize_detections_by_size.py +32 -14
api/batch_processing/postprocessing/combine_api_outputs.py +69 -55
api/batch_processing/postprocessing/compare_batch_results.py +114 -44
api/batch_processing/postprocessing/convert_output_format.py +62 -19
api/batch_processing/postprocessing/load_api_results.py +17 -20
api/batch_processing/postprocessing/md_to_coco.py +31 -21
api/batch_processing/postprocessing/md_to_labelme.py +165 -68
api/batch_processing/postprocessing/merge_detections.py +40 -15
api/batch_processing/postprocessing/postprocess_batch_results.py +270 -186
api/batch_processing/postprocessing/remap_detection_categories.py +170 -0
api/batch_processing/postprocessing/render_detection_confusion_matrix.py +75 -39
api/batch_processing/postprocessing/repeat_detection_elimination/find_repeat_detections.py +53 -44
api/batch_processing/postprocessing/repeat_detection_elimination/remove_repeat_detections.py +25 -14
api/batch_processing/postprocessing/repeat_detection_elimination/repeat_detections_core.py +244 -160
api/batch_processing/postprocessing/separate_detections_into_folders.py +159 -114
api/batch_processing/postprocessing/subset_json_detector_output.py +146 -169
api/batch_processing/postprocessing/top_folders_to_bottom.py +77 -43
api/synchronous/__init__.py +0 -0
api/synchronous/api_core/animal_detection_api/__init__.py +0 -0
api/synchronous/api_core/animal_detection_api/api_backend.py +0 -2
api/synchronous/api_core/animal_detection_api/api_frontend.py +266 -268
api/synchronous/api_core/animal_detection_api/config.py +35 -35
api/synchronous/api_core/tests/__init__.py +0 -0
api/synchronous/api_core/tests/load_test.py +109 -109
classification/__init__.py +0 -0
classification/aggregate_classifier_probs.py +21 -24
classification/analyze_failed_images.py +11 -13
classification/cache_batchapi_outputs.py +51 -51
classification/create_classification_dataset.py +69 -68
classification/crop_detections.py +54 -53
classification/csv_to_json.py +97 -100
classification/detect_and_crop.py +105 -105
classification/evaluate_model.py +43 -42
classification/identify_mislabeled_candidates.py +47 -46
classification/json_to_azcopy_list.py +10 -10
classification/json_validator.py +72 -71
classification/map_classification_categories.py +44 -43
classification/merge_classification_detection_output.py +68 -68
classification/prepare_classification_script.py +157 -154
classification/prepare_classification_script_mc.py +228 -228
classification/run_classifier.py +27 -26
classification/save_mislabeled.py +30 -30
classification/train_classifier.py +20 -20
classification/train_classifier_tf.py +21 -22
classification/train_utils.py +10 -10
data_management/__init__.py +0 -0
data_management/annotations/__init__.py +0 -0
data_management/annotations/annotation_constants.py +18 -31
data_management/camtrap_dp_to_coco.py +238 -0
data_management/cct_json_utils.py +107 -59
data_management/cct_to_md.py +176 -158
data_management/cct_to_wi.py +247 -219
data_management/coco_to_labelme.py +272 -0
data_management/coco_to_yolo.py +86 -62
data_management/databases/__init__.py +0 -0
data_management/databases/add_width_and_height_to_db.py +20 -16
data_management/databases/combine_coco_camera_traps_files.py +35 -31
data_management/databases/integrity_check_json_db.py +130 -83
data_management/databases/subset_json_db.py +25 -16
data_management/generate_crops_from_cct.py +27 -45
data_management/get_image_sizes.py +188 -144
data_management/importers/add_nacti_sizes.py +8 -8
data_management/importers/add_timestamps_to_icct.py +78 -78
data_management/importers/animl_results_to_md_results.py +158 -160
data_management/importers/auckland_doc_test_to_json.py +9 -9
data_management/importers/auckland_doc_to_json.py +8 -8
data_management/importers/awc_to_json.py +7 -7
data_management/importers/bellevue_to_json.py +15 -15
data_management/importers/cacophony-thermal-importer.py +13 -13
data_management/importers/carrizo_shrubfree_2018.py +8 -8
data_management/importers/carrizo_trail_cam_2017.py +8 -8
data_management/importers/cct_field_adjustments.py +9 -9
data_management/importers/channel_islands_to_cct.py +10 -10
data_management/importers/eMammal/copy_and_unzip_emammal.py +1 -0
data_management/importers/ena24_to_json.py +7 -7
data_management/importers/filenames_to_json.py +8 -8
data_management/importers/helena_to_cct.py +7 -7
data_management/importers/idaho-camera-traps.py +7 -7
data_management/importers/idfg_iwildcam_lila_prep.py +10 -10
data_management/importers/jb_csv_to_json.py +9 -9
data_management/importers/mcgill_to_json.py +8 -8
data_management/importers/missouri_to_json.py +18 -18
data_management/importers/nacti_fieldname_adjustments.py +10 -10
data_management/importers/noaa_seals_2019.py +8 -8
data_management/importers/pc_to_json.py +7 -7
data_management/importers/plot_wni_giraffes.py +7 -7
data_management/importers/prepare-noaa-fish-data-for-lila.py +359 -359
data_management/importers/prepare_zsl_imerit.py +7 -7
data_management/importers/rspb_to_json.py +8 -8
data_management/importers/save_the_elephants_survey_A.py +8 -8
data_management/importers/save_the_elephants_survey_B.py +9 -9
data_management/importers/snapshot_safari_importer.py +26 -26
data_management/importers/snapshot_safari_importer_reprise.py +665 -665
data_management/importers/snapshot_serengeti_lila.py +14 -14
data_management/importers/sulross_get_exif.py +8 -9
data_management/importers/timelapse_csv_set_to_json.py +11 -11
data_management/importers/ubc_to_json.py +13 -13
data_management/importers/umn_to_json.py +7 -7
data_management/importers/wellington_to_json.py +8 -8
data_management/importers/wi_to_json.py +9 -9
data_management/importers/zamba_results_to_md_results.py +181 -181
data_management/labelme_to_coco.py +309 -159
data_management/labelme_to_yolo.py +103 -60
data_management/lila/__init__.py +0 -0
data_management/lila/add_locations_to_island_camera_traps.py +9 -9
data_management/lila/add_locations_to_nacti.py +147 -147
data_management/lila/create_lila_blank_set.py +114 -31
data_management/lila/create_lila_test_set.py +8 -8
data_management/lila/create_links_to_md_results_files.py +106 -106
data_management/lila/download_lila_subset.py +92 -90
data_management/lila/generate_lila_per_image_labels.py +56 -43
data_management/lila/get_lila_annotation_counts.py +18 -15
data_management/lila/get_lila_image_counts.py +11 -11
data_management/lila/lila_common.py +103 -70
data_management/lila/test_lila_metadata_urls.py +132 -116
data_management/ocr_tools.py +173 -128
data_management/read_exif.py +161 -99
data_management/remap_coco_categories.py +84 -0
data_management/remove_exif.py +58 -62
data_management/resize_coco_dataset.py +32 -44
data_management/wi_download_csv_to_coco.py +246 -0
data_management/yolo_output_to_md_output.py +86 -73
data_management/yolo_to_coco.py +535 -95
detection/__init__.py +0 -0
detection/detector_training/__init__.py +0 -0
detection/process_video.py +85 -33
detection/pytorch_detector.py +43 -25
detection/run_detector.py +157 -72
detection/run_detector_batch.py +189 -114
detection/run_inference_with_yolov5_val.py +118 -51
detection/run_tiled_inference.py +113 -42
detection/tf_detector.py +51 -28
detection/video_utils.py +606 -521
docs/source/conf.py +43 -0
md_utils/__init__.py +0 -0
md_utils/azure_utils.py +9 -9
md_utils/ct_utils.py +249 -70
md_utils/directory_listing.py +59 -64
md_utils/md_tests.py +968 -862
md_utils/path_utils.py +655 -155
md_utils/process_utils.py +157 -133
md_utils/sas_blob_utils.py +20 -20
md_utils/split_locations_into_train_val.py +45 -32
md_utils/string_utils.py +33 -10
md_utils/url_utils.py +208 -27
md_utils/write_html_image_list.py +51 -35
md_visualization/__init__.py +0 -0
md_visualization/plot_utils.py +102 -109
md_visualization/render_images_with_thumbnails.py +34 -34
md_visualization/visualization_utils.py +908 -311
md_visualization/visualize_db.py +109 -58
md_visualization/visualize_detector_output.py +61 -42
{megadetector-5.0.7.dist-info → megadetector-5.0.9.dist-info}/METADATA +21 -17
megadetector-5.0.9.dist-info/RECORD +224 -0
{megadetector-5.0.7.dist-info → megadetector-5.0.9.dist-info}/WHEEL +1 -1
{megadetector-5.0.7.dist-info → megadetector-5.0.9.dist-info}/top_level.txt +1 -0
taxonomy_mapping/__init__.py +0 -0
taxonomy_mapping/map_lila_taxonomy_to_wi_taxonomy.py +342 -335
taxonomy_mapping/map_new_lila_datasets.py +154 -154
taxonomy_mapping/prepare_lila_taxonomy_release.py +142 -134
taxonomy_mapping/preview_lila_taxonomy.py +591 -591
taxonomy_mapping/retrieve_sample_image.py +12 -12
taxonomy_mapping/simple_image_download.py +11 -11
taxonomy_mapping/species_lookup.py +10 -10
taxonomy_mapping/taxonomy_csv_checker.py +18 -18
taxonomy_mapping/taxonomy_graph.py +47 -47
taxonomy_mapping/validate_lila_category_mappings.py +83 -76
data_management/cct_json_to_filename_json.py +0 -89
data_management/cct_to_csv.py +0 -140
data_management/databases/remove_corrupted_images_from_db.py +0 -191
detection/detector_training/copy_checkpoints.py +0 -43
md_visualization/visualize_megadb.py +0 -183
megadetector-5.0.7.dist-info/RECORD +0 -202
{megadetector-5.0.7.dist-info → megadetector-5.0.9.dist-info}/LICENSE +0 -0

docs/source/conf.py ADDED Viewed

@@ -0,0 +1,43 @@
+import sys
+import os
+project = 'MegaDetector'
+copyright = '2024, Your friendly neighborhood MegaDetector team'
+author = 'Your friendly neighborhood MegaDetector team'
+sys.path.insert(0, os.path.abspath("../.."))
+extensions = [
+    "sphinx.ext.napoleon",
+    "sphinx.ext.autodoc",
+    "sphinx.ext.viewcode",
+    "sphinx_mdinclude",
+    "sphinx_argparse_cli"
+]
+autodoc_mock_imports = ["azure", "deepdiff", "magic", "tensorflow", "pytesseract"]
+myst_enable_extensions = [
+    "colon_fence",
+]
+html_theme = 'sphinx_rtd_theme'
+# collapse_navigation doesn't actually work
+html_theme_options = {'navigation_depth': 2, 'collapse_navigation': False}
+# html_theme = 'sphinx_book_theme'
+# html_theme_options['show_navbar_depth'] = 2
+# html_static_path = ['_static']
+# Hide "bases: object" from all classes that don't define a base class
+from sphinx.ext import autodoc
+class MockedClassDocumenter(autodoc.ClassDocumenter):
+    def add_line(self, line: str, source: str, *lineno: int) -> None:
+        if line == "   Bases: :py:class:`object`":
+            return
+        super().add_line(line, source, *lineno)
+autodoc.ClassDocumenter = MockedClassDocumenter

md_utils/__init__.py ADDED Viewed

File without changes

md_utils/azure_utils.py CHANGED Viewed

@@ -1,12 +1,12 @@
-########
-#
-# azure_utils.py
-#
-# Miscellaneous Azure Blob Storage utilities
-#
-# Requires azure-storage-blob>=12.4.0
-#
-########
+"""
+azure_utils.py
+Miscellaneous Azure Blob Storage utilities
+Requires azure-storage-blob>=12.4.0
+"""
 import json
 from md_utils import path_utils

md_utils/ct_utils.py CHANGED Viewed

@@ -1,14 +1,13 @@
-########
-#
-# ct_utils.py
-#
-# Numeric/geometry utility functions
-#
-########
+"""
+ct_utils.py
+Numeric/geometry/array utility functions.
+"""
 #%% Imports and constants
-import argparse
 import inspect
 import json
 import math
@@ -26,12 +25,15 @@ image_extensions = ['.jpg', '.jpeg', '.gif', '.png']
 def truncate_float_array(xs, precision=3):
     """
-    Vectorized version of truncate_float(...)
+    Vectorized version of truncate_float(...), truncates the fractional portion of each
+    floating-point value to a specific number of floating-point digits.
     Args:
-    xs        (list of float) List of floats to truncate
-    precision (int)           The number of significant digits to preserve, should be
-                              greater or equal 1
+        xs (list): list of floats to truncate
+        precision (int, optional): the number of significant digits to preserve, should be >= 1
+    Returns:
+        list: list of truncated floats
     """
     return [truncate_float(x, precision=precision) for x in xs]
@@ -39,17 +41,23 @@ def truncate_float_array(xs, precision=3):
 def truncate_float(x, precision=3):
     """
-    Truncates a floating-point value to a specific number of significant digits.
+    Truncates the fractional portion of a floating-point value to a specific number of
+    floating-point digits.
-    For example: truncate_float(0.0003214884) --> 0.000321
+    For example:
+        truncate_float(0.0003214884) --> 0.000321
+        truncate_float(1.0003214884) --> 1.000321
     This function is primarily used to achieve a certain float representation
     before exporting to JSON.
     Args:
-    x         (float) Scalar to truncate
-    precision (int)   The number of significant digits to preserve, should be
-                      greater or equal 1
+        x (float): scalar to truncate
+        precision (int, optional): the number of significant digits to preserve, should be >= 1
+    Returns:
+        float: truncated version of [x]
     """
     assert precision > 0
@@ -58,41 +66,58 @@ def truncate_float(x, precision=3):
         return 0
+    elif (x > 1):
+        fractional_component = x - 1.0
+        return 1 + truncate_float(fractional_component)
     else:
         # Determine the factor, which shifts the decimal point of x
         # just behind the last significant digit.
         factor = math.pow(10, precision - 1 - math.floor(math.log10(abs(x))))
-        # Shift decimal point by multiplicatipon with factor, flooring, and
+        # Shift decimal point by multiplication with factor, flooring, and
         # division by factor.
         return math.floor(x * factor)/factor
-def args_to_object(args: argparse.Namespace, obj: object) -> None:
+def args_to_object(args, obj):
     """
     Copies all fields from a Namespace (typically the output from parse_args) to an
     object. Skips fields starting with _. Does not check existence in the target
     object.
     Args:
-        args: argparse.Namespace
-        obj: class or object whose whose attributes will be updated
+        args (argparse.Namespace): the namespace to convert to an object
+        obj (object): object whose attributes will be updated
+    Returns:
+        object: the modified object (modified in place, but also returned)
     """
     for n, v in inspect.getmembers(args):
         if not n.startswith('_'):
             setattr(obj, n, v)
+    return obj
 def pretty_print_object(obj, b_print=True):
     """
-    Prints an arbitrary object as .json
+    Converts an arbitrary object to .json, optionally printing the .json representation.
+    Args:
+        obj (object): object to print
+        b_print (bool, optional): whether to print the object
+    Returns:
+        str: .json representation of [obj]
     """
     # _ = pretty_print_object(obj)
-    # Sloppy that I'm making a module-wide change here...
+    # TODO: it's sloppy that I'm making a module-wide change here.
     jsonpickle.set_encoder_options('json', sort_keys=True, indent=2)
     a = jsonpickle.encode(obj)
     s = '{}'.format(a)
@@ -101,12 +126,19 @@ def pretty_print_object(obj, b_print=True):
     return s
-def is_list_sorted(L,reverse=False):
+def is_list_sorted(L, reverse=False):
     """
-    Returns true if the list L appears to be sorted, otherwise False.
+    Returns True if the list L appears to be sorted, otherwise False.
     Calling is_list_sorted(L,reverse=True) is the same as calling
     is_list_sorted(L.reverse(),reverse=False).
+    Args:
+        L (list): list to evaluate
+        reverse (bool, optional): whether to reverse the list before evaluating sort status
+    Returns:
+        bool: True if the list L appears to be sorted, otherwise False
     """
     if reverse:
@@ -117,32 +149,27 @@ def is_list_sorted(L,reverse=False):
 def write_json(path, content, indent=1):
     """
-    Standardized wrapper for json.dump
+    Standardized wrapper for json.dump().
+    Args:
+        path (str): filename to write to
+        content (object): object to dump
+        indent (int, optional): indentation depth passed to json.dump
     """
     with open(path, 'w') as f:
         json.dump(content, f, indent=indent)
-def is_image_file(s):
-    """
-    Checks a file's extension against a hard-coded set of image file extensions;
-    return True if it appears to be an image.
-    """
-    ext = os.path.splitext(s)[1]
-    return ext.lower() in image_extensions
 def convert_yolo_to_xywh(yolo_box):
     """
     Converts a YOLO format bounding box to [x_min, y_min, width_of_box, height_of_box].
     Args:
-        yolo_box: bounding box of format [x_center, y_center, width_of_box, height_of_box].
+        yolo_box (list): bounding box of format [x_center, y_center, width_of_box, height_of_box]
     Returns:
-        bbox with coordinates represented as [x_min, y_min, width_of_box, height_of_box].
+        list: bbox with coordinates represented as [x_min, y_min, width_of_box, height_of_box]
     """
     x_center, y_center, width_of_box, height_of_box = yolo_box
@@ -153,14 +180,14 @@ def convert_yolo_to_xywh(yolo_box):
 def convert_xywh_to_tf(api_box):
     """
-    Converts an xywh bounding box to an [y_min, x_min, y_max, x_max] box that the TensorFlow
-    Object Detection API uses
+    Converts an xywh bounding box (the format used in MD output) to the [y_min, x_min, y_max, x_max]
+    format that the TensorFlow Object Detection API uses.
     Args:
         api_box: bbox output by the batch processing API [x_min, y_min, width_of_box, height_of_box]
     Returns:
-        bbox with coordinates represented as [y_min, x_min, y_max, x_max]
+        list: bbox with coordinates represented as [y_min, x_min, y_max, x_max]
     """
     x_min, y_min, width_of_box, height_of_box = api_box
@@ -171,14 +198,13 @@ def convert_xywh_to_tf(api_box):
 def convert_xywh_to_xyxy(api_bbox):
     """
-    Converts an xywh bounding box to an xyxy bounding box.
+    Converts an xywh bounding box (the MD output format) to an xyxy bounding box.
-    Note that this is also different from the TensorFlow Object Detection API coords format.
     Args:
-        api_bbox: bbox output by the batch processing API [x_min, y_min, width_of_box, height_of_box]
+        api_bbox (list): bbox formatted as [x_min, y_min, width_of_box, height_of_box]
     Returns:
-        bbox with coordinates represented as [x_min, y_min, x_max, y_max]
+        list: bbox formatted as [x_min, y_min, x_max, y_max]
     """
     x_min, y_min, width_of_box, height_of_box = api_bbox
@@ -188,18 +214,18 @@ def convert_xywh_to_xyxy(api_bbox):
 def get_iou(bb1, bb2):
     """
-    Calculates the Intersection over Union (IoU) of two bounding boxes.
+    Calculates the intersection over union (IoU) of two bounding boxes.
     Adapted from:
     https://stackoverflow.com/questions/25349178/calculating-percentage-of-bounding-box-overlap-for-image-detector-evaluation
     Args:
-        bb1: [x_min, y_min, width_of_box, height_of_box]
-        bb2: [x_min, y_min, width_of_box, height_of_box]
+        bb1 (list): [x_min, y_min, width_of_box, height_of_box]
+        bb2 (list): [x_min, y_min, width_of_box, height_of_box]
     Returns:
-        intersection_over_union, a float in [0, 1]
+        float: intersection_over_union, a float in [0, 1]
     """
     bb1 = convert_xywh_to_xyxy(bb1)
@@ -251,9 +277,14 @@ def _get_max_conf_from_detections(detections):
 def get_max_conf(im):
     """
-    Given an image dict in the format used by the batch API, compute the maximum detection
-    confidence for any class.  Returns 0.0 (not None) if there was a failure and 'detections'
-    isn't present.
+    Given an image dict in the MD output format, computes the maximum detection confidence for any
+    class.  Returns 0.0 (rather than None) if there was a failure or 'detections' isn't present.
+    Args:
+        im (dict): image dictionary in the MD output format (with a 'detections' field)
+    Returns:
+        float: the maximum detection confidence across all classes
     """
     max_conf = 0.0
@@ -264,7 +295,14 @@ def get_max_conf(im):
 def point_dist(p1,p2):
     """
-    Distance between two points, represented as length-two tuples.
+    Computes the distance between two points, represented as length-two tuples.
+    Args:
+        p1: point, formatted as (x,y)
+        p2: point, formatted as (x,y)
+    Returns:
+        float: the Euclidean distance between p1 and p2
     """
     return math.sqrt( ((p1[0]-p2[0])**2) + ((p1[1]-p2[1])**2) )
@@ -272,13 +310,21 @@ def point_dist(p1,p2):
 def rect_distance(r1, r2, format='x0y0x1y1'):
     """
-    Minimum distance between two axis-aligned rectangles, each represented as
+    Computes the minimum distance between two axis-aligned rectangles, each represented as
     (x0,y0,x1,y1) by default.
-    Can also specify "format" as x0y0wh for MD-style bbox formatting (x0,y0,w,h).
+    Can also specify "format" as x0y0wh for MD-style bbox formatting (x0,y0,w,h).
+    Args:
+        r1: rectangle, formatted as (x0,y0,x1,y1) or (x0,y0,w,h)
+        r2: rectangle, formatted as (x0,y0,x1,y1) or (x0,y0,w,h)
+        format (str, optional): whether the boxes are formatted as 'x0y0x1y1' (default) or 'x0y0wh'
+    Returns:
+        float: the minimum distance between r1 and r2
     """
-    assert format in ('x0y0x1y1','x0y0wh')
+    assert format in ('x0y0x1y1','x0y0wh'), 'Illegal rectangle format {}'.format(format)
     if format == 'x0y0wh':
         # Convert to x0y0x1y1 without modifying the original rectangles
@@ -312,18 +358,17 @@ def rect_distance(r1, r2, format='x0y0x1y1'):
         return 0.0
-def list_is_sorted(l):
-    """
-    Returns True if the list [l] is sorted, else False.
-    """
-    return all(l[i] <= l[i+1] for i in range(len(l)-1))
 def split_list_into_fixed_size_chunks(L,n):
     """
     Split the list or tuple L into chunks of size n (allowing chunks of size n-1 if necessary,
-    i.e. len(L) does not have to be a multiple of n.
+    i.e. len(L) does not have to be a multiple of n).
+    Args:
+        L (list): list to split into chunks
+        n (int): preferred chunk size
+    Returns:
+        list: list of chunks, where each chunk is a list of length n or n-1
     """
     return [L[i * n:(i + 1) * n] for i in range((len(L) + n - 1) // n )]
@@ -332,11 +377,19 @@ def split_list_into_fixed_size_chunks(L,n):
 def split_list_into_n_chunks(L, n, chunk_strategy='greedy'):
     """
     Splits the list or tuple L into n equally-sized chunks (some chunks may be one
-    element smaller than others, i.e. len(L) does not have to be a multiple of n.
+    element smaller than others, i.e. len(L) does not have to be a multiple of n).
     chunk_strategy can be "greedy" (default, if there are k samples per chunk, the first
     k go into the first chunk) or "balanced" (alternate between chunks when pulling
     items from the list).
+    Args:
+        L (list): list to split into chunks
+        n (int): number of chunks
+        chunk_strategy (str, optional): "greedy" or "balanced"; see above
+    Returns:
+        list: list of chunks, each of which is a list
     """
     if chunk_strategy == 'greedy':
@@ -352,10 +405,35 @@ def split_list_into_n_chunks(L, n, chunk_strategy='greedy'):
         raise ValueError('Invalid chunk strategy: {}'.format(chunk_strategy))
+def sort_dictionary_by_key(d,reverse=False):
+    """
+    Sorts the dictionary [d] by key.
+    Args:
+        d (dict): dictionary to sort
+        reverse (bool, optional): whether to sort in reverse (descending) order
+    Returns:
+        dict: sorted copy of [d]
+    """
+    d = dict(sorted(d.items(),reverse=reverse))
+    return d
 def sort_dictionary_by_value(d,sort_values=None,reverse=False):
     """
     Sorts the dictionary [d] by value.  If sort_values is None, uses d.values(),
     otherwise uses the dictionary sort_values as the sorting criterion.
+    Args:
+        d (dict): dictionary to sort
+        sort_values (dict, optional): dictionary mapping keys in [d] to sort values (defaults
+            to None, uses [d] itself for sorting)
+        reverse (bool, optional): whether to sort in reverse (descending) order
+    Returns:
+        dict: sorted copy of [d]
     """
     if sort_values is None:
@@ -367,16 +445,22 @@ def sort_dictionary_by_value(d,sort_values=None,reverse=False):
 def invert_dictionary(d):
     """
-    Create a new dictionary that maps d.values() to d.keys().  Does not check
-    uniqueness.
+    Creates a new dictionary that maps d.values() to d.keys().  Does not check
+    uniqueness.
+    Args:
+        d (dict): dictionary to invert
+    Returns:
+        dict: inverted copy of [d]
     """
     return {v: k for k, v in d.items()}
 def image_file_to_camera_folder(image_fn):
-    """
-    Remove common overflow folders (e.g. RECNX101, RECNX102) from paths, i.e. turn:
+    r"""
+    Removes common overflow folders (e.g. RECNX101, RECNX102) from paths, i.e. turn:
     a\b\c\RECNX101\image001.jpg
@@ -388,6 +472,12 @@ def image_file_to_camera_folder(image_fn):
     present.
     Always converts backslashes to slashes.
+    Args:
+        image_fn (str): the image filename from which we should remove overflow folders
+    Returns:
+        str: a version of [image_fn] from which camera overflow folders have been removed
     """
     import re
@@ -406,6 +496,95 @@ def image_file_to_camera_folder(image_fn):
     return camera_folder
+def is_float(v):
+    """
+    Determines whether v is either a float or a string representation of a float.
+    Args:
+        v (object): object to evaluate
+    Returns:
+        bool: True if [v] is a float or a string representation of a float, otherwise False
+    """
+    try:
+        _ = float(v)
+        return True
+    except ValueError:
+        return False
+def is_iterable(x):
+    """
+    Uses duck typing to assess whether [x] is iterable (list, set, dict, etc.).
+    Args:
+        x (object): the object to test
+    Returns:
+        bool: True if [x] appears to be iterable, otherwise False
+    """
+    try:
+        _ = iter(x)
+    except:
+       return False
+    return True
+def is_empty(v):
+    """
+    A common definition of "empty" used throughout the repo, particularly when loading
+    data from .csv files.  "empty" includes None, '', and NaN.
+    Args:
+        v: the object to evaluate for emptiness
+    Returns:
+        bool: True if [v] is None, '', or NaN, otherwise False
+    """
+    if v is None:
+        return True
+    if isinstance(v,str) and v == '':
+        return True
+    if isinstance(v,float) and np.isnan(v):
+        return True
+    return False
+def isnan(v):
+    """
+    Returns True if v is a nan-valued float, otherwise returns False.
+    Args:
+        v: the object to evaluate for nan-ness
+    Returns:
+        bool: True if v is a nan-valued float, otherwise False
+    """
+    try:
+        return np.isnan(v)
+    except Exception:
+        return False
+def sets_overlap(set1, set2):
+    """
+    Determines whether two sets overlap.
+    Args:
+        set1 (set): the first set to compare (converted to a set if it's not already)
+        set2 (set): the second set to compare (converted to a set if it's not already)
+    Returns:
+        bool: True if any elements are shared between set1 and set2
+    """
+    return not set(set1).isdisjoint(set(set2))
 #%% Test drivers
 if False:

megadetector 5.0.7__py3-none-any.whl → 5.0.9__py3-none-any.whl

Potentially problematic release.

megadetector 5.0.7__py3-none-any.whl → 5.0.9__py3-none-any.whl