megadetector 5.0.28__py3-none-any.whl → 10.0.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of megadetector might be problematic. Click here for more details.

Files changed (197)
  1. megadetector/api/batch_processing/integration/digiKam/xmp_integration.py +2 -2
  2. megadetector/api/batch_processing/integration/eMammal/test_scripts/push_annotations_to_emammal.py +1 -1
  3. megadetector/api/batch_processing/integration/eMammal/test_scripts/select_images_for_testing.py +1 -1
  4. megadetector/classification/aggregate_classifier_probs.py +3 -3
  5. megadetector/classification/analyze_failed_images.py +5 -5
  6. megadetector/classification/cache_batchapi_outputs.py +5 -5
  7. megadetector/classification/create_classification_dataset.py +11 -12
  8. megadetector/classification/crop_detections.py +10 -10
  9. megadetector/classification/csv_to_json.py +8 -8
  10. megadetector/classification/detect_and_crop.py +13 -15
  11. megadetector/classification/efficientnet/model.py +8 -8
  12. megadetector/classification/efficientnet/utils.py +6 -5
  13. megadetector/classification/evaluate_model.py +7 -7
  14. megadetector/classification/identify_mislabeled_candidates.py +6 -6
  15. megadetector/classification/json_to_azcopy_list.py +1 -1
  16. megadetector/classification/json_validator.py +29 -32
  17. megadetector/classification/map_classification_categories.py +9 -9
  18. megadetector/classification/merge_classification_detection_output.py +12 -9
  19. megadetector/classification/prepare_classification_script.py +19 -19
  20. megadetector/classification/prepare_classification_script_mc.py +26 -26
  21. megadetector/classification/run_classifier.py +4 -4
  22. megadetector/classification/save_mislabeled.py +6 -6
  23. megadetector/classification/train_classifier.py +1 -1
  24. megadetector/classification/train_classifier_tf.py +9 -9
  25. megadetector/classification/train_utils.py +10 -10
  26. megadetector/data_management/annotations/annotation_constants.py +1 -2
  27. megadetector/data_management/camtrap_dp_to_coco.py +79 -46
  28. megadetector/data_management/cct_json_utils.py +103 -103
  29. megadetector/data_management/cct_to_md.py +49 -49
  30. megadetector/data_management/cct_to_wi.py +33 -33
  31. megadetector/data_management/coco_to_labelme.py +75 -75
  32. megadetector/data_management/coco_to_yolo.py +210 -193
  33. megadetector/data_management/databases/add_width_and_height_to_db.py +86 -12
  34. megadetector/data_management/databases/combine_coco_camera_traps_files.py +40 -40
  35. megadetector/data_management/databases/integrity_check_json_db.py +228 -200
  36. megadetector/data_management/databases/subset_json_db.py +33 -33
  37. megadetector/data_management/generate_crops_from_cct.py +88 -39
  38. megadetector/data_management/get_image_sizes.py +54 -49
  39. megadetector/data_management/labelme_to_coco.py +133 -125
  40. megadetector/data_management/labelme_to_yolo.py +159 -73
  41. megadetector/data_management/lila/create_lila_blank_set.py +81 -83
  42. megadetector/data_management/lila/create_lila_test_set.py +32 -31
  43. megadetector/data_management/lila/create_links_to_md_results_files.py +18 -18
  44. megadetector/data_management/lila/download_lila_subset.py +21 -24
  45. megadetector/data_management/lila/generate_lila_per_image_labels.py +365 -107
  46. megadetector/data_management/lila/get_lila_annotation_counts.py +35 -33
  47. megadetector/data_management/lila/get_lila_image_counts.py +22 -22
  48. megadetector/data_management/lila/lila_common.py +73 -70
  49. megadetector/data_management/lila/test_lila_metadata_urls.py +28 -19
  50. megadetector/data_management/mewc_to_md.py +344 -340
  51. megadetector/data_management/ocr_tools.py +262 -255
  52. megadetector/data_management/read_exif.py +249 -227
  53. megadetector/data_management/remap_coco_categories.py +90 -28
  54. megadetector/data_management/remove_exif.py +81 -21
  55. megadetector/data_management/rename_images.py +187 -187
  56. megadetector/data_management/resize_coco_dataset.py +588 -120
  57. megadetector/data_management/speciesnet_to_md.py +41 -41
  58. megadetector/data_management/wi_download_csv_to_coco.py +55 -55
  59. megadetector/data_management/yolo_output_to_md_output.py +248 -122
  60. megadetector/data_management/yolo_to_coco.py +333 -191
  61. megadetector/detection/change_detection.py +832 -0
  62. megadetector/detection/process_video.py +340 -337
  63. megadetector/detection/pytorch_detector.py +358 -278
  64. megadetector/detection/run_detector.py +399 -186
  65. megadetector/detection/run_detector_batch.py +404 -377
  66. megadetector/detection/run_inference_with_yolov5_val.py +340 -327
  67. megadetector/detection/run_tiled_inference.py +257 -249
  68. megadetector/detection/tf_detector.py +24 -24
  69. megadetector/detection/video_utils.py +332 -295
  70. megadetector/postprocessing/add_max_conf.py +19 -11
  71. megadetector/postprocessing/categorize_detections_by_size.py +45 -45
  72. megadetector/postprocessing/classification_postprocessing.py +468 -433
  73. megadetector/postprocessing/combine_batch_outputs.py +23 -23
  74. megadetector/postprocessing/compare_batch_results.py +590 -525
  75. megadetector/postprocessing/convert_output_format.py +106 -102
  76. megadetector/postprocessing/create_crop_folder.py +347 -147
  77. megadetector/postprocessing/detector_calibration.py +173 -168
  78. megadetector/postprocessing/generate_csv_report.py +508 -499
  79. megadetector/postprocessing/load_api_results.py +48 -27
  80. megadetector/postprocessing/md_to_coco.py +133 -102
  81. megadetector/postprocessing/md_to_labelme.py +107 -90
  82. megadetector/postprocessing/md_to_wi.py +40 -40
  83. megadetector/postprocessing/merge_detections.py +92 -114
  84. megadetector/postprocessing/postprocess_batch_results.py +319 -301
  85. megadetector/postprocessing/remap_detection_categories.py +91 -38
  86. megadetector/postprocessing/render_detection_confusion_matrix.py +214 -205
  87. megadetector/postprocessing/repeat_detection_elimination/find_repeat_detections.py +57 -57
  88. megadetector/postprocessing/repeat_detection_elimination/remove_repeat_detections.py +27 -28
  89. megadetector/postprocessing/repeat_detection_elimination/repeat_detections_core.py +704 -679
  90. megadetector/postprocessing/separate_detections_into_folders.py +226 -211
  91. megadetector/postprocessing/subset_json_detector_output.py +265 -262
  92. megadetector/postprocessing/top_folders_to_bottom.py +45 -45
  93. megadetector/postprocessing/validate_batch_results.py +70 -70
  94. megadetector/taxonomy_mapping/map_lila_taxonomy_to_wi_taxonomy.py +52 -52
  95. megadetector/taxonomy_mapping/map_new_lila_datasets.py +18 -19
  96. megadetector/taxonomy_mapping/prepare_lila_taxonomy_release.py +54 -33
  97. megadetector/taxonomy_mapping/preview_lila_taxonomy.py +67 -67
  98. megadetector/taxonomy_mapping/retrieve_sample_image.py +16 -16
  99. megadetector/taxonomy_mapping/simple_image_download.py +8 -8
  100. megadetector/taxonomy_mapping/species_lookup.py +156 -74
  101. megadetector/taxonomy_mapping/taxonomy_csv_checker.py +14 -14
  102. megadetector/taxonomy_mapping/taxonomy_graph.py +10 -10
  103. megadetector/taxonomy_mapping/validate_lila_category_mappings.py +13 -13
  104. megadetector/utils/ct_utils.py +1049 -211
  105. megadetector/utils/directory_listing.py +21 -77
  106. megadetector/utils/gpu_test.py +22 -22
  107. megadetector/utils/md_tests.py +632 -529
  108. megadetector/utils/path_utils.py +1520 -431
  109. megadetector/utils/process_utils.py +41 -41
  110. megadetector/utils/split_locations_into_train_val.py +62 -62
  111. megadetector/utils/string_utils.py +148 -27
  112. megadetector/utils/url_utils.py +489 -176
  113. megadetector/utils/wi_utils.py +2658 -2526
  114. megadetector/utils/write_html_image_list.py +137 -137
  115. megadetector/visualization/plot_utils.py +34 -30
  116. megadetector/visualization/render_images_with_thumbnails.py +39 -74
  117. megadetector/visualization/visualization_utils.py +487 -435
  118. megadetector/visualization/visualize_db.py +232 -198
  119. megadetector/visualization/visualize_detector_output.py +82 -76
  120. {megadetector-5.0.28.dist-info → megadetector-10.0.0.dist-info}/METADATA +5 -2
  121. megadetector-10.0.0.dist-info/RECORD +139 -0
  122. {megadetector-5.0.28.dist-info → megadetector-10.0.0.dist-info}/WHEEL +1 -1
  123. megadetector/api/batch_processing/api_core/__init__.py +0 -0
  124. megadetector/api/batch_processing/api_core/batch_service/__init__.py +0 -0
  125. megadetector/api/batch_processing/api_core/batch_service/score.py +0 -439
  126. megadetector/api/batch_processing/api_core/server.py +0 -294
  127. megadetector/api/batch_processing/api_core/server_api_config.py +0 -97
  128. megadetector/api/batch_processing/api_core/server_app_config.py +0 -55
  129. megadetector/api/batch_processing/api_core/server_batch_job_manager.py +0 -220
  130. megadetector/api/batch_processing/api_core/server_job_status_table.py +0 -149
  131. megadetector/api/batch_processing/api_core/server_orchestration.py +0 -360
  132. megadetector/api/batch_processing/api_core/server_utils.py +0 -88
  133. megadetector/api/batch_processing/api_core_support/__init__.py +0 -0
  134. megadetector/api/batch_processing/api_core_support/aggregate_results_manually.py +0 -46
  135. megadetector/api/batch_processing/api_support/__init__.py +0 -0
  136. megadetector/api/batch_processing/api_support/summarize_daily_activity.py +0 -152
  137. megadetector/api/batch_processing/data_preparation/__init__.py +0 -0
  138. megadetector/api/synchronous/__init__.py +0 -0
  139. megadetector/api/synchronous/api_core/animal_detection_api/__init__.py +0 -0
  140. megadetector/api/synchronous/api_core/animal_detection_api/api_backend.py +0 -151
  141. megadetector/api/synchronous/api_core/animal_detection_api/api_frontend.py +0 -263
  142. megadetector/api/synchronous/api_core/animal_detection_api/config.py +0 -35
  143. megadetector/api/synchronous/api_core/tests/__init__.py +0 -0
  144. megadetector/api/synchronous/api_core/tests/load_test.py +0 -110
  145. megadetector/data_management/importers/add_nacti_sizes.py +0 -52
  146. megadetector/data_management/importers/add_timestamps_to_icct.py +0 -79
  147. megadetector/data_management/importers/animl_results_to_md_results.py +0 -158
  148. megadetector/data_management/importers/auckland_doc_test_to_json.py +0 -373
  149. megadetector/data_management/importers/auckland_doc_to_json.py +0 -201
  150. megadetector/data_management/importers/awc_to_json.py +0 -191
  151. megadetector/data_management/importers/bellevue_to_json.py +0 -272
  152. megadetector/data_management/importers/cacophony-thermal-importer.py +0 -793
  153. megadetector/data_management/importers/carrizo_shrubfree_2018.py +0 -269
  154. megadetector/data_management/importers/carrizo_trail_cam_2017.py +0 -289
  155. megadetector/data_management/importers/cct_field_adjustments.py +0 -58
  156. megadetector/data_management/importers/channel_islands_to_cct.py +0 -913
  157. megadetector/data_management/importers/eMammal/copy_and_unzip_emammal.py +0 -180
  158. megadetector/data_management/importers/eMammal/eMammal_helpers.py +0 -249
  159. megadetector/data_management/importers/eMammal/make_eMammal_json.py +0 -223
  160. megadetector/data_management/importers/ena24_to_json.py +0 -276
  161. megadetector/data_management/importers/filenames_to_json.py +0 -386
  162. megadetector/data_management/importers/helena_to_cct.py +0 -283
  163. megadetector/data_management/importers/idaho-camera-traps.py +0 -1407
  164. megadetector/data_management/importers/idfg_iwildcam_lila_prep.py +0 -294
  165. megadetector/data_management/importers/import_desert_lion_conservation_camera_traps.py +0 -387
  166. megadetector/data_management/importers/jb_csv_to_json.py +0 -150
  167. megadetector/data_management/importers/mcgill_to_json.py +0 -250
  168. megadetector/data_management/importers/missouri_to_json.py +0 -490
  169. megadetector/data_management/importers/nacti_fieldname_adjustments.py +0 -79
  170. megadetector/data_management/importers/noaa_seals_2019.py +0 -181
  171. megadetector/data_management/importers/osu-small-animals-to-json.py +0 -364
  172. megadetector/data_management/importers/pc_to_json.py +0 -365
  173. megadetector/data_management/importers/plot_wni_giraffes.py +0 -123
  174. megadetector/data_management/importers/prepare_zsl_imerit.py +0 -131
  175. megadetector/data_management/importers/raic_csv_to_md_results.py +0 -416
  176. megadetector/data_management/importers/rspb_to_json.py +0 -356
  177. megadetector/data_management/importers/save_the_elephants_survey_A.py +0 -320
  178. megadetector/data_management/importers/save_the_elephants_survey_B.py +0 -329
  179. megadetector/data_management/importers/snapshot_safari_importer.py +0 -758
  180. megadetector/data_management/importers/snapshot_serengeti_lila.py +0 -1067
  181. megadetector/data_management/importers/snapshotserengeti/make_full_SS_json.py +0 -150
  182. megadetector/data_management/importers/snapshotserengeti/make_per_season_SS_json.py +0 -153
  183. megadetector/data_management/importers/sulross_get_exif.py +0 -65
  184. megadetector/data_management/importers/timelapse_csv_set_to_json.py +0 -490
  185. megadetector/data_management/importers/ubc_to_json.py +0 -399
  186. megadetector/data_management/importers/umn_to_json.py +0 -507
  187. megadetector/data_management/importers/wellington_to_json.py +0 -263
  188. megadetector/data_management/importers/wi_to_json.py +0 -442
  189. megadetector/data_management/importers/zamba_results_to_md_results.py +0 -180
  190. megadetector/data_management/lila/add_locations_to_island_camera_traps.py +0 -101
  191. megadetector/data_management/lila/add_locations_to_nacti.py +0 -151
  192. megadetector/utils/azure_utils.py +0 -178
  193. megadetector/utils/sas_blob_utils.py +0 -509
  194. megadetector-5.0.28.dist-info/RECORD +0 -209
  195. /megadetector/{api/batch_processing/__init__.py → __init__.py} +0 -0
  196. {megadetector-5.0.28.dist-info → megadetector-10.0.0.dist-info}/licenses/LICENSE +0 -0
  197. {megadetector-5.0.28.dist-info → megadetector-10.0.0.dist-info}/top_level.txt +0 -0
@@ -13,6 +13,10 @@ import json
13
13
  import math
14
14
  import os
15
15
  import builtins
16
+ import datetime
17
+ import tempfile
18
+ import shutil
19
+ import uuid
16
20
 
17
21
  import jsonpickle
18
22
  import numpy as np
@@ -28,13 +32,13 @@ image_extensions = ['.jpg', '.jpeg', '.gif', '.png']
28
32
 
29
33
  def truncate_float_array(xs, precision=3):
30
34
  """
31
- Truncates the fractional portion of each floating-point value in the array [xs]
35
+ Truncates the fractional portion of each floating-point value in the array [xs]
32
36
  to a specific number of floating-point digits.
33
37
 
34
38
  Args:
35
39
  xs (list): list of floats to truncate
36
- precision (int, optional): the number of significant digits to preserve, should be >= 1
37
-
40
+ precision (int, optional): the number of significant digits to preserve, should be >= 1
41
+
38
42
  Returns:
39
43
  list: list of truncated floats
40
44
  """
@@ -44,52 +48,52 @@ def truncate_float_array(xs, precision=3):
44
48
 
45
49
  def round_float_array(xs, precision=3):
46
50
  """
47
- Truncates the fractional portion of each floating-point value in the array [xs]
51
+ Truncates the fractional portion of each floating-point value in the array [xs]
48
52
  to a specific number of floating-point digits.
49
53
 
50
54
  Args:
51
55
  xs (list): list of floats to round
52
- precision (int, optional): the number of significant digits to preserve, should be >= 1
53
-
56
+ precision (int, optional): the number of significant digits to preserve, should be >= 1
57
+
54
58
  Returns:
55
- list: list of rounded floats
59
+ list: list of rounded floats
56
60
  """
57
-
61
+
58
62
  return [round_float(x,precision) for x in xs]
59
63
 
60
64
 
61
65
  def round_float(x, precision=3):
62
66
  """
63
67
  Convenience wrapper for the native Python round()
64
-
68
+
65
69
  Args:
66
70
  x (float): number to truncate
67
71
  precision (int, optional): the number of significant digits to preserve, should be >= 1
68
-
72
+
69
73
  Returns:
70
74
  float: rounded value
71
75
  """
72
-
76
+
73
77
  return round(x,precision)
74
-
75
-
78
+
79
+
76
80
  def truncate_float(x, precision=3):
77
81
  """
78
- Truncates the fractional portion of a floating-point value to a specific number of
82
+ Truncates the fractional portion of a floating-point value to a specific number of
79
83
  floating-point digits.
80
-
81
- For example:
82
-
84
+
85
+ For example:
86
+
83
87
  truncate_float(0.0003214884) --> 0.000321
84
88
  truncate_float(1.0003214884) --> 1.000321
85
-
89
+
86
90
  This function is primarily used to achieve a certain float representation
87
91
  before exporting to JSON.
88
92
 
89
93
  Args:
90
94
  x (float): scalar to truncate
91
95
  precision (int, optional): the number of significant digits to preserve, should be >= 1
92
-
96
+
93
97
  Returns:
94
98
  float: truncated version of [x]
95
99
  """
@@ -106,11 +110,11 @@ def args_to_object(args, obj):
106
110
  Args:
107
111
  args (argparse.Namespace): the namespace to convert to an object
108
112
  obj (object): object whose whose attributes will be updated
109
-
113
+
110
114
  Returns:
111
115
  object: the modified object (modified in place, but also returned)
112
116
  """
113
-
117
+
114
118
  for n, v in inspect.getmembers(args):
115
119
  if not n.startswith('_'):
116
120
  setattr(obj, n, v)
@@ -120,17 +124,17 @@ def args_to_object(args, obj):
120
124
 
121
125
  def dict_to_object(d, obj):
122
126
  """
123
- Copies all fields from a dict to an object. Skips fields starting with _.
127
+ Copies all fields from a dict to an object. Skips fields starting with _.
124
128
  Does not check existence in the target object.
125
129
 
126
130
  Args:
127
131
  d (dict): the dict to convert to an object
128
132
  obj (object): object whose whose attributes will be updated
129
-
133
+
130
134
  Returns:
131
135
  object: the modified object (modified in place, but also returned)
132
136
  """
133
-
137
+
134
138
  for k in d.keys():
135
139
  if not k.startswith('_'):
136
140
  setattr(obj, k, d[k])
@@ -141,11 +145,11 @@ def dict_to_object(d, obj):
141
145
  def pretty_print_object(obj, b_print=True):
142
146
  """
143
147
  Converts an arbitrary object to .json, optionally printing the .json representation.
144
-
148
+
145
149
  Args:
146
150
  obj (object): object to print
147
151
  b_print (bool, optional): whether to print the object
148
-
152
+
149
153
  Returns:
150
154
  str: .json reprepresentation of [obj]
151
155
  """
@@ -162,44 +166,90 @@ def pretty_print_object(obj, b_print=True):
162
166
  return s
163
167
 
164
168
 
165
- def is_list_sorted(L, reverse=False):
169
+ def is_list_sorted(L, reverse=False): # noqa
166
170
  """
167
171
  Returns True if the list L appears to be sorted, otherwise False.
168
-
172
+
169
173
  Calling is_list_sorted(L,reverse=True) is the same as calling
170
174
  is_list_sorted(L.reverse(),reverse=False).
171
-
175
+
172
176
  Args:
173
177
  L (list): list to evaluate
174
- reverse (bool, optional): whether to reverse the list before evaluating sort status
175
-
178
+ reverse (bool, optional): whether to reverse the list before evaluating sort status
179
+
176
180
  Returns:
177
181
  bool: True if the list L appears to be sorted, otherwise False
178
182
  """
179
-
183
+
180
184
  if reverse:
181
185
  return all(L[i] >= L[i + 1] for i in range(len(L)-1))
182
186
  else:
183
187
  return all(L[i] <= L[i + 1] for i in range(len(L)-1))
184
-
185
188
 
186
- def write_json(path, content, indent=1):
189
+
190
+ def json_serialize_datetime(obj):
191
+ """
192
+ Serializes datetime.datetime and datetime.date objects to ISO format.
193
+
194
+ Args:
195
+ obj (object): The object to serialize.
196
+
197
+ Returns:
198
+ str: The ISO format string representation of the datetime object.
199
+
200
+ Raises:
201
+ TypeError: If the object is not a datetime.datetime or datetime.date instance.
202
+ """
203
+ if isinstance(obj, (datetime.datetime, datetime.date)):
204
+ return obj.isoformat()
205
+ raise TypeError(f"Object of type {type(obj)} is not JSON serializable by json_serialize_datetime")
206
+
207
+
208
+ def write_json(path,
209
+ content,
210
+ indent=1,
211
+ force_str=False,
212
+ serialize_datetimes=False,
213
+ ensure_ascii=True,
214
+ encoding='utf-8'):
187
215
  """
188
216
  Standardized wrapper for json.dump().
189
-
217
+
190
218
  Args:
191
219
  path (str): filename to write to
192
220
  content (object): object to dump
193
221
  indent (int, optional): indentation depth passed to json.dump
222
+ force_str (bool, optional): whether to force string conversion for non-serializable objects
223
+ serialize_datetimes (bool, optional): whether to serialize datetime objects to ISO format
224
+ ensure_ascii (bool, optional): whether to ensure ASCII characters in the output
225
+ encoding (str, optional): string encoding to use
194
226
  """
195
-
196
- with open(path, 'w', newline='\n') as f:
197
- json.dump(content, f, indent=indent)
227
+
228
+ default_handler = None
229
+
230
+ if serialize_datetimes:
231
+ default_handler = json_serialize_datetime
232
+ if force_str:
233
+ def serialize_or_str(obj):
234
+ try:
235
+ return json_serialize_datetime(obj)
236
+ except TypeError:
237
+ return str(obj)
238
+ default_handler = serialize_or_str
239
+ elif force_str:
240
+ default_handler = str
241
+
242
+ os.makedirs(os.path.dirname(path), exist_ok=True)
243
+
244
+ with open(path, 'w', newline='\n', encoding=encoding) as f:
245
+ json.dump(content, f, indent=indent, default=default_handler, ensure_ascii=ensure_ascii)
246
+
247
+ # ...def write_json(...)
198
248
 
199
249
 
200
250
  def convert_yolo_to_xywh(yolo_box):
201
251
  """
202
- Converts a YOLO format bounding box [x_center, y_center, w, h] to
252
+ Converts a YOLO format bounding box [x_center, y_center, w, h] to
203
253
  [x_min, y_min, width_of_box, height_of_box].
204
254
 
205
255
  Args:
@@ -208,7 +258,7 @@ def convert_yolo_to_xywh(yolo_box):
208
258
  Returns:
209
259
  list: bbox with coordinates represented as [x_min, y_min, width_of_box, height_of_box]
210
260
  """
211
-
261
+
212
262
  x_center, y_center, width_of_box, height_of_box = yolo_box
213
263
  x_min = x_center - width_of_box / 2.0
214
264
  y_min = y_center - height_of_box / 2.0
@@ -238,7 +288,7 @@ def get_iou(bb1, bb2):
238
288
  Calculates the intersection over union (IoU) of two bounding boxes.
239
289
 
240
290
  Adapted from:
241
-
291
+
242
292
  https://stackoverflow.com/questions/25349178/calculating-percentage-of-bounding-box-overlap-for-image-detector-evaluation
243
293
 
244
294
  Args:
@@ -288,7 +338,7 @@ def _get_max_conf_from_detections(detections):
288
338
  """
289
339
  Internal function used by get_max_conf(); don't call this directly.
290
340
  """
291
-
341
+
292
342
  max_conf = 0.0
293
343
  if detections is not None and len(detections) > 0:
294
344
  confidences = [det['conf'] for det in detections]
@@ -298,17 +348,17 @@ def _get_max_conf_from_detections(detections):
298
348
 
299
349
  def get_max_conf(im):
300
350
  """
301
- Given an image dict in the MD output format, computes the maximum detection confidence for any
302
- class. Returns 0.0 if there were no detections, if there was a failure, or if 'detections' isn't
351
+ Given an image dict in the MD output format, computes the maximum detection confidence for any
352
+ class. Returns 0.0 if there were no detections, if there was a failure, or if 'detections' isn't
303
353
  present.
304
-
354
+
305
355
  Args:
306
356
  im (dict): image dictionary in the MD output format (with a 'detections' field)
307
-
357
+
308
358
  Returns:
309
359
  float: the maximum detection confidence across all classes
310
360
  """
311
-
361
+
312
362
  max_conf = 0.0
313
363
  if 'detections' in im and im['detections'] is not None and len(im['detections']) > 0:
314
364
  max_conf = _get_max_conf_from_detections(im['detections'])
@@ -318,7 +368,7 @@ def get_max_conf(im):
318
368
  def sort_results_for_image(im):
319
369
  """
320
370
  Sort classification and detection results in descending order by confidence (in place).
321
-
371
+
322
372
  Args:
323
373
  im (dict): image dictionary in the MD output format (with a 'detections' field)
324
374
  """
@@ -327,55 +377,56 @@ def sort_results_for_image(im):
327
377
 
328
378
  # Sort detections in descending order by confidence
329
379
  im['detections'] = sort_list_of_dicts_by_key(im['detections'],k='conf',reverse=True)
330
-
380
+
331
381
  for det in im['detections']:
332
-
382
+
333
383
  # Sort classifications (which are (class,conf) tuples) in descending order by confidence
334
384
  if 'classifications' in det and \
335
385
  (det['classifications'] is not None) and \
336
386
  (len(det['classifications']) > 0):
337
- L = det['classifications']
338
- det['classifications'] = sorted(L,key=itemgetter(1),reverse=True)
387
+ classifications = det['classifications']
388
+ det['classifications'] = \
389
+ sorted(classifications,key=itemgetter(1),reverse=True)
339
390
 
340
391
 
341
392
  def point_dist(p1,p2):
342
393
  """
343
394
  Computes the distance between two points, represented as length-two tuples.
344
-
395
+
345
396
  Args:
346
- p1: point, formatted as (x,y)
347
- p2: point, formatted as (x,y)
348
-
397
+ p1 (list or tuple): point, formatted as (x,y)
398
+ p2 (list or tuple): point, formatted as (x,y)
399
+
349
400
  Returns:
350
401
  float: the Euclidean distance between p1 and p2
351
402
  """
352
-
403
+
353
404
  return math.sqrt( ((p1[0]-p2[0])**2) + ((p1[1]-p2[1])**2) )
354
405
 
355
406
 
356
407
  def rect_distance(r1, r2, format='x0y0x1y1'):
357
408
  """
358
- Computes the minimum distance between two axis-aligned rectangles, each represented as
409
+ Computes the minimum distance between two axis-aligned rectangles, each represented as
359
410
  (x0,y0,x1,y1) by default.
360
-
411
+
361
412
  Can also specify "format" as x0y0wh for MD-style bbox formatting (x0,y0,w,h).
362
-
413
+
363
414
  Args:
364
- r1: rectangle, formatted as (x0,y0,x1,y1) or (x0,y0,xy,y1)
365
- r2: rectangle, formatted as (x0,y0,x1,y1) or (x0,y0,xy,y1)
415
+ r1 (list or tuple): rectangle, formatted as (x0,y0,x1,y1) or (x0,y0,xy,y1)
416
+ r2 (list or tuple): rectangle, formatted as (x0,y0,x1,y1) or (x0,y0,xy,y1)
366
417
  format (str, optional): whether the boxes are formatted as 'x0y0x1y1' (default) or 'x0y0wh'
367
-
418
+
368
419
  Returns:
369
420
  float: the minimum distance between r1 and r2
370
421
  """
371
-
422
+
372
423
  assert format in ('x0y0x1y1','x0y0wh'), 'Illegal rectangle format {}'.format(format)
373
-
424
+
374
425
  if format == 'x0y0wh':
375
426
  # Convert to x0y0x1y1 without modifying the original rectangles
376
427
  r1 = [r1[0],r1[1],r1[0]+r1[2],r1[1]+r1[3]]
377
428
  r2 = [r2[0],r2[1],r2[0]+r2[2],r2[1]+r2[3]]
378
-
429
+
379
430
  # https://stackoverflow.com/a/26178015
380
431
  x1, y1, x1b, y1b = r1
381
432
  x2, y2, x2b, y2b = r2
@@ -403,40 +454,40 @@ def rect_distance(r1, r2, format='x0y0x1y1'):
403
454
  return 0.0
404
455
 
405
456
 
406
- def split_list_into_fixed_size_chunks(L,n):
457
+ def split_list_into_fixed_size_chunks(L,n): # noqa
407
458
  """
408
- Split the list or tuple L into chunks of size n (allowing at most one chunk with size
459
+ Split the list or tuple L into chunks of size n (allowing at most one chunk with size
409
460
  less than N, i.e. len(L) does not have to be a multiple of n).
410
-
461
+
411
462
  Args:
412
463
  L (list): list to split into chunks
413
464
  n (int): preferred chunk size
414
-
465
+
415
466
  Returns:
416
467
  list: list of chunks, where each chunk is a list of length n or n-1
417
468
  """
418
-
469
+
419
470
  return [L[i * n:(i + 1) * n] for i in range((len(L) + n - 1) // n )]
420
471
 
421
472
 
422
- def split_list_into_n_chunks(L, n, chunk_strategy='greedy'):
473
+ def split_list_into_n_chunks(L, n, chunk_strategy='greedy'): # noqa
423
474
  """
424
- Splits the list or tuple L into n equally-sized chunks (some chunks may be one
475
+ Splits the list or tuple L into n equally-sized chunks (some chunks may be one
425
476
  element smaller than others, i.e. len(L) does not have to be a multiple of n).
426
-
477
+
427
478
  chunk_strategy can be "greedy" (default, if there are k samples per chunk, the first
428
479
  k go into the first chunk) or "balanced" (alternate between chunks when pulling
429
480
  items from the list).
430
-
481
+
431
482
  Args:
432
483
  L (list): list to split into chunks
433
484
  n (int): number of chunks
434
- chunk_strategy (str, optiopnal): "greedy" or "balanced"; see above
435
-
485
+ chunk_strategy (str, optional): "greedy" or "balanced"; see above
486
+
436
487
  Returns:
437
488
  list: list of chunks, each of which is a list
438
489
  """
439
-
490
+
440
491
  if chunk_strategy == 'greedy':
441
492
  k, m = divmod(len(L), n)
442
493
  return list(L[i*k+min(i, m):(i+1)*k+min(i+1, m)] for i in range(n))
@@ -450,54 +501,68 @@ def split_list_into_n_chunks(L, n, chunk_strategy='greedy'):
450
501
  raise ValueError('Invalid chunk strategy: {}'.format(chunk_strategy))
451
502
 
452
503
 
453
- def sort_list_of_dicts_by_key(L,k,reverse=False):
504
+ def sort_list_of_dicts_by_key(L, k, reverse=False, none_handling='smallest'): # noqa ("L" should be lowercase)
454
505
  """
455
506
  Sorts the list of dictionaries [L] by the key [k].
456
-
507
+
457
508
  Args:
458
509
  L (list): list of dictionaries to sort
459
510
  k (object, typically str): the sort key
460
511
  reverse (bool, optional): whether to sort in reverse (descending) order
461
-
512
+ none_handling (str, optional): how to handle None values. Options:
513
+ "smallest" - treat None as smaller than all other values (default)
514
+ "largest" - treat None as larger than all other values
515
+ "error" - raise error when None is compared with non-None
516
+
462
517
  Returns:
463
- dict: sorted copy of [d]
518
+ list: sorted copy of [L]
464
519
  """
465
- return sorted(L, key=lambda d: d[k], reverse=reverse)
466
-
467
-
520
+
521
+ if none_handling == 'error':
522
+ return sorted(L, key=lambda d: d[k], reverse=reverse)
523
+ elif none_handling == 'smallest':
524
+ # None values treated as smaller than other values: use tuple (is_not_none, value)
525
+ return sorted(L, key=lambda d: (d[k] is not None, d[k]), reverse=reverse)
526
+ elif none_handling == "largest":
527
+ # None values treated as larger than other values: use tuple (is_none, value)
528
+ return sorted(L, key=lambda d: (d[k] is None, d[k]), reverse=reverse)
529
+ else:
530
+ raise ValueError('Invalid none_handling value: {}'.format(none_handling))
531
+
532
+
468
533
  def sort_dictionary_by_key(d,reverse=False):
469
534
  """
470
535
  Sorts the dictionary [d] by key.
471
-
536
+
472
537
  Args:
473
538
  d (dict): dictionary to sort
474
539
  reverse (bool, optional): whether to sort in reverse (descending) order
475
-
540
+
476
541
  Returns:
477
542
  dict: sorted copy of [d]
478
543
  """
479
-
544
+
480
545
  d = dict(sorted(d.items(),reverse=reverse))
481
546
  return d
482
-
547
+
483
548
 
484
549
  def sort_dictionary_by_value(d,sort_values=None,reverse=False):
485
550
  """
486
551
  Sorts the dictionary [d] by value. If sort_values is None, uses d.values(),
487
- otherwise uses the dictionary sort_values as the sorting criterion. Always
488
- returns a new standard dict, so if [d] is, for example, a defaultdict, the
552
+ otherwise uses the dictionary sort_values as the sorting criterion. Always
553
+ returns a new standard dict, so if [d] is, for example, a defaultdict, the
489
554
  returned value is not.
490
-
555
+
491
556
  Args:
492
557
  d (dict): dictionary to sort
493
- sort_values (dict, optional): dictionary mapping keys in [d] to sort values (defaults
558
+ sort_values (dict, optional): dictionary mapping keys in [d] to sort values (defaults
494
559
  to None, uses [d] itself for sorting)
495
560
  reverse (bool, optional): whether to sort in reverse (descending) order
496
-
561
+
497
562
  Returns:
498
563
  dict: sorted copy of [d
499
564
  """
500
-
565
+
501
566
  if sort_values is None:
502
567
  d = {k: v for k, v in sorted(d.items(), key=lambda item: item[1], reverse=reverse)}
503
568
  else:
@@ -509,112 +574,134 @@ def invert_dictionary(d):
509
574
  """
510
575
  Creates a new dictionary that maps d.values() to d.keys(). Does not check
511
576
  uniqueness.
512
-
577
+
513
578
  Args:
514
579
  d (dict): dictionary to invert
515
-
580
+
516
581
  Returns:
517
582
  dict: inverted copy of [d]
518
583
  """
519
-
584
+
520
585
  return {v: k for k, v in d.items()}
521
586
 
522
587
 
523
- def round_floats_in_nested_dict(obj, decimal_places=5):
588
+ def round_floats_in_nested_dict(obj, decimal_places=5, allow_iterator_conversion=False):
524
589
  """
525
- Recursively rounds all floating point values in a nested structure to the
526
- specified number of decimal places. Handles dictionaries, lists, tuples,
590
+ Recursively rounds all floating point values in a nested structure to the
591
+ specified number of decimal places. Handles dictionaries, lists, tuples,
527
592
  sets, and other iterables. Modifies mutable objects in place.
528
-
593
+
529
594
  Args:
530
- obj: The object to process (can be a dict, list, set, tuple, or primitive value)
531
- decimal_places: Number of decimal places to round to (default: 5)
532
-
595
+ obj (obj): The object to process (can be a dict, list, set, tuple, or primitive value)
596
+ decimal_places (int, optional): Number of decimal places to round to
597
+ allow_iterator_conversion (bool, optional): for iterator types, should we convert
598
+ to lists? Otherwise we error.
599
+
533
600
  Returns:
534
601
  The processed object (useful for recursive calls)
535
602
  """
536
603
  if isinstance(obj, dict):
537
604
  for key in obj:
538
- obj[key] = round_floats_in_nested_dict(obj[key], decimal_places)
605
+ obj[key] = round_floats_in_nested_dict(obj[key], decimal_places=decimal_places,
606
+ allow_iterator_conversion=allow_iterator_conversion)
539
607
  return obj
540
-
608
+
541
609
  elif isinstance(obj, list):
542
610
  for i in range(len(obj)):
543
- obj[i] = round_floats_in_nested_dict(obj[i], decimal_places)
611
+ obj[i] = round_floats_in_nested_dict(obj[i], decimal_places=decimal_places,
612
+ allow_iterator_conversion=allow_iterator_conversion)
544
613
  return obj
545
-
614
+
546
615
  elif isinstance(obj, tuple):
547
616
  # Tuples are immutable, so we create a new one
548
- return tuple(round_floats_in_nested_dict(item, decimal_places) for item in obj)
549
-
617
+ return tuple(round_floats_in_nested_dict(item, decimal_places=decimal_places,
618
+ allow_iterator_conversion=allow_iterator_conversion) for item in obj)
619
+
550
620
  elif isinstance(obj, set):
551
621
  # Sets are mutable but we can't modify elements in-place
552
622
  # Convert to list, process, and convert back to set
553
- return set(round_floats_in_nested_dict(list(obj), decimal_places))
554
-
623
+ return set(round_floats_in_nested_dict(list(obj), decimal_places=decimal_places,
624
+ allow_iterator_conversion=allow_iterator_conversion))
625
+
555
626
  elif hasattr(obj, '__iter__') and not isinstance(obj, (str, bytes, bytearray)):
556
- # Handle other iterable types - convert to list, process, and convert back
557
- return type(obj)(round_floats_in_nested_dict(item, decimal_places) for item in obj)
558
-
627
+ # Handle other iterable types: convert to list, process, and convert back
628
+ processed_list = [round_floats_in_nested_dict(item,
629
+ decimal_places=decimal_places,
630
+ allow_iterator_conversion=allow_iterator_conversion) \
631
+ for item in obj]
632
+
633
+ # Try to recreate the original type, but fall back to list for iterators
634
+ try:
635
+ return type(obj)(processed_list)
636
+ except (TypeError, ValueError):
637
+ if allow_iterator_conversion:
638
+ # For iterators and other types that can't be reconstructed, return a list
639
+ return processed_list
640
+ else:
641
+ raise ValueError('Cannot process iterator types when allow_iterator_conversion is False')
642
+
559
643
  elif isinstance(obj, float):
560
644
  return round(obj, decimal_places)
561
-
645
+
562
646
  else:
563
647
  # For other types (int, str, bool, None, etc.), return as is
564
648
  return obj
565
649
 
566
- # ...def round_floats_in_nested_dict(...)
650
+ # ...def round_floats_in_nested_dict(...)
567
651
 
568
652
 
569
653
  def image_file_to_camera_folder(image_fn):
570
654
  r"""
571
655
  Removes common overflow folders (e.g. RECNX101, RECNX102) from paths, i.e. turn:
572
-
656
+
573
657
  a\b\c\RECNX101\image001.jpg
574
-
658
+
575
659
  ...into:
576
-
660
+
577
661
  a\b\c
578
662
 
579
- Returns the same thing as os.dirname() (i.e., just the folder name) if no overflow folders are
663
+ Returns the same thing as os.dirname() (i.e., just the folder name) if no overflow folders are
580
664
  present.
581
665
 
582
666
  Always converts backslashes to slashes.
583
-
667
+
584
668
  Args:
585
669
  image_fn (str): the image filename from which we should remove overflow folders
586
-
670
+
587
671
  Returns:
588
672
  str: a version of [image_fn] from which camera overflow folders have been removed
589
673
  """
590
-
674
+
591
675
  import re
592
-
676
+
593
677
  # 100RECNX is the overflow folder style for Reconyx cameras
594
678
  # 100EK113 is (for some reason) the overflow folder style for Bushnell cameras
595
679
  # 100_BTCF is the overflow folder style for Browning cameras
596
680
  # 100MEDIA is the overflow folder style used on a number of consumer-grade cameras
597
681
  patterns = [r'/\d+RECNX/',r'/\d+EK\d+/',r'/\d+_BTCF/',r'/\d+MEDIA/']
598
-
599
- image_fn = image_fn.replace('\\','/')
682
+
683
+ image_fn = image_fn.replace('\\','/')
600
684
  for pat in patterns:
601
685
  image_fn = re.sub(pat,'/',image_fn)
602
686
  camera_folder = os.path.dirname(image_fn)
603
-
687
+
604
688
  return camera_folder
605
-
689
+
606
690
 
607
691
  def is_float(v):
608
692
  """
609
693
  Determines whether v is either a float or a string representation of a float.
610
-
694
+
611
695
  Args:
612
696
  v (object): object to evaluate
613
-
697
+
614
698
  Returns:
615
699
  bool: True if [v] is a float or a string representation of a float, otherwise False
616
700
  """
617
-
701
+
702
+ if v is None:
703
+ return False
704
+
618
705
  try:
619
706
  _ = float(v)
620
707
  return True
@@ -625,17 +712,17 @@ def is_float(v):
625
712
  def is_iterable(x):
626
713
  """
627
714
  Uses duck typing to assess whether [x] is iterable (list, set, dict, etc.).
628
-
715
+
629
716
  Args:
630
717
  x (object): the object to test
631
-
718
+
632
719
  Returns:
633
720
  bool: True if [x] appears to be iterable, otherwise False
634
721
  """
635
-
722
+
636
723
  try:
637
724
  _ = iter(x)
638
- except:
725
+ except Exception:
639
726
  return False
640
727
  return True
641
728
 
@@ -644,10 +731,10 @@ def is_empty(v):
644
731
  """
645
732
  A common definition of "empty" used throughout the repo, particularly when loading
646
733
  data from .csv files. "empty" includes None, '', and NaN.
647
-
734
+
648
735
  Args:
649
- v: the object to evaluate for emptiness
650
-
736
+ v (obj): the object to evaluate for emptiness
737
+
651
738
  Returns:
652
739
  bool: True if [v] is None, '', or NaN, otherwise False
653
740
  """
@@ -660,15 +747,55 @@ def is_empty(v):
660
747
  return False
661
748
 
662
749
 
750
+ def to_bool(v):
751
+ """
752
+ Convert an object to a bool with specific rules.
753
+
754
+ Args:
755
+ v (object): The object to convert
756
+
757
+ Returns:
758
+ bool or None:
759
+ - For strings: True if 'true' (case-insensitive), False if 'false', recursively applied if int-like
760
+ - For int/bytes: False if 0, True otherwise
761
+ - For bool: returns the bool as-is
762
+ - For other types: None
763
+ """
764
+
765
+ if isinstance(v, bool):
766
+ return v
767
+
768
+ if isinstance(v, str):
769
+
770
+ try:
771
+ v = int(v)
772
+ return to_bool(v)
773
+ except Exception:
774
+ pass
775
+
776
+ v = v.lower().strip()
777
+ if v == 'true':
778
+ return True
779
+ elif v == 'false':
780
+ return False
781
+ else:
782
+ return None
783
+
784
+ if isinstance(v, (int, bytes)):
785
+ return v != 0
786
+
787
+ return None
788
+
789
+
663
790
  def min_none(a,b):
664
791
  """
665
- Returns the minimum of a and b. If both are None, returns None. If one is None,
792
+ Returns the minimum of a and b. If both are None, returns None. If one is None,
666
793
  returns the other.
667
-
794
+
668
795
  Args:
669
796
  a (numeric): the first value to compare
670
797
  b (numeric): the second value to compare
671
-
798
+
672
799
  Returns:
673
800
  numeric: the minimum of a and b, or None
674
801
  """
@@ -680,17 +807,17 @@ def min_none(a,b):
680
807
  return a
681
808
  else:
682
809
  return min(a,b)
683
-
810
+
684
811
 
685
812
  def max_none(a,b):
686
813
  """
687
- Returns the maximum of a and b. If both are None, returns None. If one is None,
814
+ Returns the maximum of a and b. If both are None, returns None. If one is None,
688
815
  returns the other.
689
-
816
+
690
817
  Args:
691
818
  a (numeric): the first value to compare
692
819
  b (numeric): the second value to compare
693
-
820
+
694
821
  Returns:
695
822
  numeric: the maximum of a and b, or None
696
823
  """
@@ -703,19 +830,19 @@ def max_none(a,b):
703
830
  else:
704
831
  return max(a,b)
705
832
 
706
-
833
+
707
834
  def isnan(v):
708
835
  """
709
836
  Returns True if v is a nan-valued float, otherwise returns False.
710
-
837
+
711
838
  Args:
712
- v: the object to evaluate for nan-ness
713
-
839
+ v (obj): the object to evaluate for nan-ness
840
+
714
841
  Returns:
715
842
  bool: True if v is a nan-valued float, otherwise False
716
843
  """
717
-
718
- try:
844
+
845
+ try:
719
846
  return np.isnan(v)
720
847
  except Exception:
721
848
  return False
@@ -724,55 +851,56 @@ def isnan(v):
724
851
  def sets_overlap(set1, set2):
725
852
  """
726
853
  Determines whether two sets overlap.
727
-
854
+
728
855
  Args:
729
856
  set1 (set): the first set to compare (converted to a set if it's not already)
730
857
  set2 (set): the second set to compare (converted to a set if it's not already)
731
-
858
+
732
859
  Returns:
733
860
  bool: True if any elements are shared between set1 and set2
734
861
  """
735
-
862
+
736
863
  return not set(set1).isdisjoint(set(set2))
737
864
 
738
865
 
739
866
  def is_function_name(s,calling_namespace):
740
867
  """
741
- Determines whether [s] is a callable function in the global or local scope, or a
868
+ Determines whether [s] is a callable function in the global or local scope, or a
742
869
  built-in function.
743
-
870
+
744
871
  Args:
745
872
  s (str): the string to test for function-ness
746
873
  calling_namespace (dict): typically pass the output of locals()
747
874
  """
748
-
875
+
749
876
  assert isinstance(s,str), 'Input is not a string'
750
-
877
+
751
878
  return callable(globals().get(s)) or \
752
879
  callable(locals().get(s)) or \
753
880
  callable(calling_namespace.get(s)) or \
754
881
  callable(getattr(builtins, s, None))
755
882
 
756
-
883
+
757
884
  # From https://gist.github.com/fralau/061a4f6c13251367ef1d9a9a99fb3e8d
758
885
  def parse_kvp(s,kv_separator='='):
759
886
  """
760
887
  Parse a key/value pair, separated by [kv_separator]. Errors if s is not
761
- a valid key/value pair string.
762
-
888
+ a valid key/value pair string. Strips leading/trailing whitespace from
889
+ the key and value.
890
+
763
891
  Args:
764
892
  s (str): the string to parse
765
893
  kv_separator (str, optional): the string separating keys from values.
766
-
894
+
767
895
  Returns:
768
896
  tuple: a 2-tuple formatted as (key,value)
769
897
  """
770
-
898
+
771
899
  items = s.split(kv_separator)
772
900
  assert len(items) > 1, 'Illegal key-value pair'
773
901
  key = items[0].strip()
774
902
  if len(items) > 1:
775
- value = kv_separator.join(items[1:])
903
+ value = kv_separator.join(items[1:]).strip()
776
904
  return (key, value)
777
905
 
778
906
 
@@ -780,26 +908,26 @@ def parse_kvp_list(items,kv_separator='=',d=None):
780
908
  """
781
909
  Parse a list key-value pairs into a dictionary. If items is None or [],
782
910
  returns {}.
783
-
911
+
784
912
  Args:
785
913
  items (list): the list of KVPs to parse
786
914
  kv_separator (str, optional): the string separating keys from values.
787
915
  d (dict, optional): the initial dictionary, defaults to {}
788
-
916
+
789
917
  Returns:
790
918
  dict: a dict mapping keys to values
791
919
  """
792
-
920
+
793
921
  if d is None:
794
922
  d = {}
795
923
 
796
924
  if items is None or len(items) == 0:
797
925
  return d
798
-
926
+
799
927
  for item in items:
800
- key, value = parse_kvp(item)
928
+ key, value = parse_kvp(item,kv_separator=kv_separator)
801
929
  d[key] = value
802
-
930
+
803
931
  return d
804
932
 
805
933
 
@@ -811,24 +939,24 @@ def dict_to_kvp_list(d,
811
939
  Convert a string <--> string dict into a string containing list of list of
812
940
  key-value pairs. I.e., converts {'a':'dog','b':'cat'} to 'a=dog b=cat'. If
813
941
  d is None, returns None. If d is empty, returns ''.
814
-
942
+
815
943
  Args:
816
944
  d (dict): the dictionary to convert, must contain only strings
817
945
  item_separator (str, optional): the delimiter between KV pairs
818
946
  kv_separator (str, optional): the separator betweena a key and its value
819
947
  non_string_value_handling (str, optional): what do do with non-string values,
820
948
  can be "omit", "error", or "convert"
821
-
949
+
822
950
  Returns:
823
951
  str: the string representation of [d]
824
952
  """
825
-
953
+
826
954
  if d is None:
827
955
  return None
828
-
956
+
829
957
  if len(d) == 0:
830
958
  return ''
831
-
959
+
832
960
  s = None
833
961
  for k in d.keys():
834
962
  assert isinstance(k,str), 'Input {} is not a str <--> str dict'.format(str(d))
@@ -848,25 +976,25 @@ def dict_to_kvp_list(d,
848
976
  else:
849
977
  s += item_separator
850
978
  s += k + kv_separator + v
851
-
979
+
852
980
  if s is None:
853
981
  s = ''
854
-
982
+
855
983
  return s
856
-
984
+
857
985
 
858
986
  def parse_bool_string(s):
859
987
  """
860
988
  Convert the strings "true" or "false" to boolean values. Case-insensitive, discards
861
989
  leading and trailing whitespace. If s is already a bool, returns s.
862
-
990
+
863
991
  Args:
864
992
  s (str or bool): the string to parse, or the bool to return
865
-
993
+
866
994
  Returns:
867
995
  bool: the parsed value
868
996
  """
869
-
997
+
870
998
  if isinstance(s,bool):
871
999
  return s
872
1000
  s = s.lower().strip()
@@ -876,57 +1004,767 @@ def parse_bool_string(s):
876
1004
  return False
877
1005
  else:
878
1006
  raise ValueError('Cannot parse bool from string {}'.format(str(s)))
879
-
880
1007
 
881
- #%% Test driver
882
1008
 
883
- def __module_test__():
1009
+ def make_temp_folder(top_level_folder='megadetector',subfolder=None,append_guid=True):
1010
+ """
1011
+ Creates a temporary folder within the system temp folder, by default in a subfolder
1012
+ called megadetector/some_guid. Used for testing without making too much of a mess.
1013
+
1014
+ Args:
1015
+ top_level_folder (str, optional): the top-level folder to use within the system temp folder
1016
+ subfolder (str, optional): the subfolder within [top_level_folder]
1017
+ append_guid (bool, optional): append a guid to the subfolder
1018
+
1019
+ Returns:
1020
+ str: the new directory
1021
+ """
1022
+
1023
+ to_return = os.path.join(tempfile.gettempdir(),top_level_folder)
1024
+ if subfolder is not None:
1025
+ to_return = os.path.join(to_return,subfolder)
1026
+ if append_guid:
1027
+ to_return = os.path.join(to_return,str(uuid.uuid1()))
1028
+ to_return = os.path.normpath(to_return)
1029
+ os.makedirs(to_return,exist_ok=True)
1030
+ return to_return
1031
+
1032
+
1033
+ def make_test_folder(subfolder=None):
1034
+ """
1035
+ Wrapper around make_temp_folder that creates folders within megadetector/tests
1036
+
1037
+ Args:
1038
+ subfolder (str): specific subfolder to create within the default megadetector temp
1039
+ folder.
1040
+ """
1041
+
1042
+ return make_temp_folder(top_level_folder='megadetector/tests',
1043
+ subfolder=subfolder,
1044
+ append_guid=True)
1045
+
1046
+
1047
+ #%% Tests
1048
+
1049
+ def test_write_json():
1050
+ """
1051
+ Test driver for write_json.
1052
+ """
1053
+
1054
+ temp_dir = make_test_folder()
1055
+
1056
+ def _verify_json_file(file_path, expected_content_str):
1057
+ with open(file_path, 'r', encoding='utf-8') as f:
1058
+ content = json.load(f)
1059
+ assert isinstance(content,dict)
1060
+ content = sort_dictionary_by_key(content)
1061
+ expected_content = json.loads(expected_content_str)
1062
+ expected_content = sort_dictionary_by_key(expected_content)
1063
+ assert content == expected_content, \
1064
+ f"File {file_path} content mismatch.\nExpected:\n{expected_content}\nGot:\n{content}"
1065
+
1066
+ # Test default indent (1)
1067
+ data_default = {'a': 1, 'b': 2}
1068
+ file_path_default = os.path.join(temp_dir, 'test_default_indent.json')
1069
+ write_json(file_path_default, data_default)
1070
+ # Default indent is 1
1071
+ _verify_json_file(file_path_default, '{\n "a": 1,\n "b": 2\n}')
1072
+
1073
+ # Test custom indent (e.g., 4)
1074
+ data_custom_indent = {'a': 1, 'b': 2}
1075
+ file_path_custom_indent = os.path.join(temp_dir, 'test_custom_indent.json')
1076
+ write_json(file_path_custom_indent, data_custom_indent, indent=4)
1077
+ _verify_json_file(file_path_custom_indent, '{\n "a": 1,\n "b": 2\n}')
1078
+
1079
+ # Test indent=None (compact)
1080
+ data_no_indent = {'a': 1, 'b': 2}
1081
+ file_path_no_indent = os.path.join(temp_dir, 'test_no_indent.json')
1082
+ write_json(file_path_no_indent, data_no_indent, indent=None)
1083
+ _verify_json_file(file_path_no_indent, '{"a": 1, "b": 2}')
1084
+
1085
+ # Test force_str=True
1086
+ data_force_str = {'a': 1, 's': {1, 2, 3}} # Set is not normally JSON serializable
1087
+ file_path_force_str = os.path.join(temp_dir, 'test_force_str.json')
1088
+ write_json(file_path_force_str, data_force_str, force_str=True)
1089
+ with open(file_path_force_str, 'r', encoding='utf-8') as f:
1090
+ result_force_str = json.load(f)
1091
+ assert isinstance(result_force_str['s'], str)
1092
+ assert eval(result_force_str['s']) == {1, 2, 3}
1093
+
1094
+ # Test serialize_datetimes=True
1095
+ dt = datetime.datetime(2023, 1, 1, 10, 30, 0)
1096
+ d_date = datetime.date(2023, 2, 15)
1097
+ data_serialize_datetimes = {'dt_obj': dt, 'd_obj': d_date}
1098
+ file_path_serialize_datetimes = os.path.join(temp_dir, 'test_serialize_datetimes.json')
1099
+ write_json(file_path_serialize_datetimes, data_serialize_datetimes, serialize_datetimes=True)
1100
+ _verify_json_file(file_path_serialize_datetimes, '{\n "d_obj": "2023-02-15",\n "dt_obj": "2023-01-01T10:30:00"\n}')
1101
+
1102
+ # Test serialize_datetimes=True and force_str=True
1103
+ dt_combo = datetime.datetime(2023, 1, 1, 12, 0, 0)
1104
+ data_datetime_force_str = {'dt_obj': dt_combo, 's_obj': {4, 5}}
1105
+ file_path_datetime_force_str = os.path.join(temp_dir, 'test_datetime_and_force_str.json')
1106
+ write_json(file_path_datetime_force_str, data_datetime_force_str, serialize_datetimes=True, force_str=True)
1107
+ with open(file_path_datetime_force_str, 'r', encoding='utf-8') as f:
1108
+ result_datetime_force_str = json.load(f)
1109
+ assert result_datetime_force_str['dt_obj'] == "2023-01-01T12:00:00"
1110
+ assert isinstance(result_datetime_force_str['s_obj'], str)
1111
+ assert eval(result_datetime_force_str['s_obj']) == {4, 5}
1112
+
1113
+ # Test ensure_ascii=False (with non-ASCII chars)
1114
+ data_ensure_ascii_false = {'name': 'Jules César'}
1115
+ file_path_ensure_ascii_false = os.path.join(temp_dir, 'test_ensure_ascii_false.json')
1116
+ write_json(file_path_ensure_ascii_false, data_ensure_ascii_false, ensure_ascii=False)
1117
+ with open(file_path_ensure_ascii_false, 'r', encoding='utf-8') as f:
1118
+ content_ensure_ascii_false = f.read()
1119
+ assert content_ensure_ascii_false == '{\n "name": "Jules César"\n}'
1120
+
1121
+ # Test ensure_ascii=True (with non-ASCII chars, default)
1122
+ data_ensure_ascii_true = {'name': 'Jules César'}
1123
+ file_path_ensure_ascii_true = os.path.join(temp_dir, 'test_ensure_ascii_true.json')
1124
+ write_json(file_path_ensure_ascii_true, data_ensure_ascii_true, ensure_ascii=True)
1125
+ with open(file_path_ensure_ascii_true, 'r', encoding='utf-8') as f:
1126
+ content_ensure_ascii_true = f.read()
1127
+ assert content_ensure_ascii_true == '{\n "name": "Jules C\\u00e9sar"\n}'
1128
+
1129
+ shutil.rmtree(temp_dir)
1130
+
1131
+ # ...def test_write_json(...)
1132
+
1133
+
1134
+ def test_path_operations():
1135
+ """
1136
+ Test path manipulation functions.
884
1137
  """
885
- Module test driver
886
- """
887
-
1138
+
888
1139
  ##%% Camera folder mapping
889
-
890
- assert image_file_to_camera_folder('a/b/c/d/100EK113/blah.jpg') == 'a/b/c/d'
1140
+ assert image_file_to_camera_folder('a/b/c/d/100EK113/blah.jpg') == 'a/b/c/d'
891
1141
  assert image_file_to_camera_folder('a/b/c/d/100RECNX/blah.jpg') == 'a/b/c/d'
892
-
893
-
1142
+ assert image_file_to_camera_folder('a/b/c/d/blah.jpg') == 'a/b/c/d'
1143
+ assert image_file_to_camera_folder(r'a\b\c\d\100RECNX\blah.jpg') == 'a/b/c/d'
1144
+
1145
+
1146
+ def test_geometric_operations():
1147
+ """
1148
+ Test geometric calculations like distances.
1149
+ """
1150
+
894
1151
  ##%% Test a few rectangle distances
895
-
1152
+
896
1153
  r1 = [0,0,1,1]; r2 = [0,0,1,1]; assert rect_distance(r1,r2)==0
897
1154
  r1 = [0,0,1,1]; r2 = [0,0,1,100]; assert rect_distance(r1,r2)==0
898
1155
  r1 = [0,0,1,1]; r2 = [1,1,2,2]; assert rect_distance(r1,r2)==0
899
1156
  r1 = [0,0,1,1]; r2 = [1.1,0,0,1.1]; assert abs(rect_distance(r1,r2)-.1) < 0.00001
900
-
1157
+
901
1158
  r1 = [0.4,0.8,10,22]; r2 = [100, 101, 200, 210.4]; assert abs(rect_distance(r1,r2)-119.753) < 0.001
902
- r1 = [0.4,0.8,10,22]; r2 = [101, 101, 200, 210.4]; assert abs(rect_distance(r1,r2)-120.507) < 0.001
1159
+ r1 = [0.4,0.8,10,22]; r2 = [101, 101, 200, 210.4]; assert abs(rect_distance(r1,r2)-120.507) < 0.001
903
1160
  r1 = [0.4,0.8,10,22]; r2 = [120, 120, 200, 210.4]; assert abs(rect_distance(r1,r2)-147.323) < 0.001
904
1161
 
905
-
906
- ##%% Test dictionary sorting
907
-
908
- L = [{'a':5},{'a':0},{'a':10}]
1162
+ # Test with 'x0y0wh' format
1163
+ r1_wh = [0,0,1,1]; r2_wh = [1,0,1,1]; assert rect_distance(r1_wh, r2_wh, format='x0y0wh') == 0
1164
+ r1_wh = [0,0,1,1]; r2_wh = [1.5,0,1,1]; assert abs(rect_distance(r1_wh, r2_wh, format='x0y0wh') - 0.5) < 0.00001
1165
+
1166
+
1167
+ ##%% Test point_dist
1168
+
1169
+ assert point_dist((0,0), (3,4)) == 5.0
1170
+ assert point_dist((1,1), (1,1)) == 0.0
1171
+
1172
+
1173
+ def test_dictionary_operations():
1174
+ """
1175
+ Test dictionary manipulation and sorting functions.
1176
+ """
1177
+
1178
+ ##%% Test sort_list_of_dicts_by_key
1179
+
1180
+ x = [{'a':5},{'a':0},{'a':10}]
909
1181
  k = 'a'
910
- sort_list_of_dicts_by_key(L, k, reverse=True)
1182
+ sorted_x = sort_list_of_dicts_by_key(x, k)
1183
+ assert sorted_x[0]['a'] == 0; assert sorted_x[1]['a'] == 5; assert sorted_x[2]['a'] == 10
1184
+ sorted_x_rev = sort_list_of_dicts_by_key(x, k, reverse=True)
1185
+ assert sorted_x_rev[0]['a'] == 10; assert sorted_x_rev[1]['a'] == 5; assert sorted_x_rev[2]['a'] == 0
1186
+
1187
+
1188
+ ##%% Test sort_dictionary_by_key
1189
+
1190
+ d_key = {'b': 2, 'a': 1, 'c': 3}
1191
+ sorted_d_key = sort_dictionary_by_key(d_key)
1192
+ assert list(sorted_d_key.keys()) == ['a', 'b', 'c']
1193
+ sorted_d_key_rev = sort_dictionary_by_key(d_key, reverse=True)
1194
+ assert list(sorted_d_key_rev.keys()) == ['c', 'b', 'a']
1195
+
1196
+
1197
+ ##%% Test sort_dictionary_by_value
1198
+
1199
+ d_val = {'a': 2, 'b': 1, 'c': 3}
1200
+ sorted_d_val = sort_dictionary_by_value(d_val)
1201
+ assert list(sorted_d_val.keys()) == ['b', 'a', 'c']
1202
+ sorted_d_val_rev = sort_dictionary_by_value(d_val, reverse=True)
1203
+ assert list(sorted_d_val_rev.keys()) == ['c', 'a', 'b']
1204
+
1205
+ # With sort_values
1206
+ sort_vals = {'a': 10, 'b': 0, 'c': 5}
1207
+ sorted_d_custom = sort_dictionary_by_value(d_val, sort_values=sort_vals)
1208
+ assert list(sorted_d_custom.keys()) == ['b', 'c', 'a']
1209
+
1210
+
1211
+ ##%% Test invert_dictionary
1212
+
1213
+ d_inv = {'a': 'x', 'b': 'y'}
1214
+ inverted_d = invert_dictionary(d_inv)
1215
+ assert inverted_d == {'x': 'a', 'y': 'b'}
911
1216
 
1217
+ # Does not check for uniqueness, last one wins
1218
+ d_inv_dup = {'a': 'x', 'b': 'x'}
1219
+ inverted_d_dup = invert_dictionary(d_inv_dup)
1220
+ assert inverted_d_dup == {'x': 'b'}
1221
+
1222
+
1223
+ def test_float_rounding_and_truncation():
1224
+ """
1225
+ Test float rounding, truncation, and nested rounding functions.
1226
+ """
1227
+
1228
+ ##%% Test round_floats_in_nested_dict
912
1229
 
913
- ##%% Test float rounding
914
-
915
- # Example with mixed collection types
916
1230
  data = {
917
1231
  "name": "Project X",
918
1232
  "values": [1.23456789, 2.3456789],
919
1233
  "tuple_values": (3.45678901, 4.56789012),
920
- "set_values": {5.67890123, 6.78901234},
1234
+ "set_values": {5.67890123, 6.78901234}, # Order not guaranteed in set, test min/max
921
1235
  "metrics": {
922
1236
  "score": 98.7654321,
923
1237
  "components": [5.6789012, 6.7890123]
924
- }
1238
+ },
1239
+ "other_iter": iter([7.89012345]) # Test other iterables
925
1240
  }
926
-
927
- result = round_floats_in_nested_dict(data)
1241
+
1242
+ result = round_floats_in_nested_dict(data, decimal_places=5, allow_iterator_conversion=True)
928
1243
  assert result['values'][0] == 1.23457
929
1244
  assert result['tuple_values'][0] == 3.45679
930
- assert min(list(result['set_values'])) == 5.6789
931
-
932
-
1245
+
1246
+ # For sets, convert to list and sort for consistent testing
1247
+ assert sorted(list(result['set_values'])) == sorted([5.67890, 6.78901])
1248
+ assert result['metrics']['score'] == 98.76543
1249
+
1250
+ # Test other iterables by converting back to list
1251
+ assert list(result['other_iter'])[0] == 7.89012
1252
+
1253
+
1254
+ ##%% Test truncate_float_array and truncate_float
1255
+
1256
+ assert truncate_float_array([0.12345, 0.67890], precision=3) == [0.123, 0.678]
1257
+ assert truncate_float_array([1.0, 2.0], precision=2) == [1.0, 2.0]
1258
+ assert truncate_float(0.12345, precision=3) == 0.123
1259
+ assert truncate_float(1.999, precision=2) == 1.99
1260
+ assert truncate_float(0.0003214884, precision=6) == 0.000321
1261
+ assert truncate_float(1.0003214884, precision=6) == 1.000321
1262
+
1263
+
1264
+ ##%% Test round_float_array and round_float
1265
+
1266
+ assert round_float_array([0.12345, 0.67890], precision=3) == [0.123, 0.679]
1267
+ assert round_float_array([1.0, 2.0], precision=2) == [1.0, 2.0]
1268
+ assert round_float(0.12345, precision=3) == 0.123
1269
+ assert round_float(0.12378, precision=3) == 0.124
1270
+ assert round_float(1.999, precision=2) == 2.00
1271
+
1272
+
1273
+ def test_object_conversion_and_presentation():
1274
+ """
1275
+ Test functions that convert or present objects.
1276
+ """
1277
+
1278
+ ##%% Test args_to_object
1279
+
1280
+ class ArgsObject:
1281
+ pass
1282
+ args_namespace = type('ArgsNameSpace', (), {'a': 1, 'b': 'test', '_c': 'ignored'})
1283
+ obj = ArgsObject()
1284
+ args_to_object(args_namespace, obj)
1285
+ assert obj.a == 1
1286
+ assert obj.b == 'test'
1287
+ assert not hasattr(obj, '_c')
1288
+
1289
+
1290
+ ##%% Test dict_to_object
1291
+
1292
+ class DictObject:
1293
+ pass
1294
+ d = {'a': 1, 'b': 'test', '_c': 'ignored'}
1295
+ obj = DictObject()
1296
+ dict_to_object(d, obj)
1297
+ assert obj.a == 1
1298
+ assert obj.b == 'test'
1299
+ assert not hasattr(obj, '_c')
1300
+
1301
+
1302
+ ##%% Test pretty_print_object
1303
+
1304
+ class PrettyPrintable:
1305
+ def __init__(self):
1306
+ self.a = 1
1307
+ self.b = "test"
1308
+ obj_to_print = PrettyPrintable()
1309
+ json_str = pretty_print_object(obj_to_print, b_print=False)
1310
+
1311
+ # Basic check for valid json and presence of attributes
1312
+ parsed_json = json.loads(json_str) # Relies on json.loads
1313
+ assert parsed_json['a'] == 1
1314
+ assert parsed_json['b'] == "test"
1315
+
1316
+
1317
+ def test_list_operations():
1318
+ """
1319
+ Test list sorting and chunking functions.
1320
+ """
1321
+
1322
+ ##%% Test is_list_sorted
1323
+
1324
+ assert is_list_sorted([1, 2, 3])
1325
+ assert not is_list_sorted([1, 3, 2])
1326
+ assert is_list_sorted([3, 2, 1], reverse=True)
1327
+ assert not is_list_sorted([1, 2, 3], reverse=True)
1328
+ assert is_list_sorted([]) # Empty list is considered sorted
1329
+ assert is_list_sorted([1]) # Single element list is sorted
1330
+ assert is_list_sorted([1,1,1])
1331
+ assert is_list_sorted([1,1,1], reverse=True)
1332
+
1333
+
1334
+ ##%% Test split_list_into_fixed_size_chunks
1335
+
1336
+ assert split_list_into_fixed_size_chunks([1,2,3,4,5,6], 2) == [[1,2],[3,4],[5,6]]
1337
+ assert split_list_into_fixed_size_chunks([1,2,3,4,5], 2) == [[1,2],[3,4],[5]]
1338
+ assert split_list_into_fixed_size_chunks([], 3) == []
1339
+ assert split_list_into_fixed_size_chunks([1,2,3], 5) == [[1,2,3]]
1340
+
1341
+
1342
+ ##%% Test split_list_into_n_chunks
1343
+
1344
+ # Greedy
1345
+ assert split_list_into_n_chunks([1,2,3,4,5,6], 3, chunk_strategy='greedy') == [[1,2],[3,4],[5,6]]
1346
+ assert split_list_into_n_chunks([1,2,3,4,5], 3, chunk_strategy='greedy') == [[1,2],[3,4],[5]]
1347
+ assert split_list_into_n_chunks([1,2,3,4,5,6,7], 3, chunk_strategy='greedy') == [[1,2,3],[4,5],[6,7]]
1348
+ assert split_list_into_n_chunks([], 3) == [[],[],[]]
1349
+
1350
+ # Balanced
1351
+ assert split_list_into_n_chunks([1,2,3,4,5,6], 3, chunk_strategy='balanced') == [[1,4],[2,5],[3,6]]
1352
+ assert split_list_into_n_chunks([1,2,3,4,5], 3, chunk_strategy='balanced') == [[1,4],[2,5],[3]]
1353
+ assert split_list_into_n_chunks([], 3, chunk_strategy='balanced') == [[],[],[]]
1354
+ try:
1355
+ split_list_into_n_chunks([1,2,3], 2, chunk_strategy='invalid')
1356
+ raise AssertionError("ValueError not raised for invalid chunk_strategy")
1357
+ except ValueError:
1358
+ pass
1359
+
1360
+
1361
+ def test_datetime_serialization():
1362
+ """
1363
+ Test datetime serialization functions.
1364
+ """
1365
+
1366
+ ##%% Test json_serialize_datetime
1367
+
1368
+ now = datetime.datetime.now()
1369
+ today = datetime.date.today()
1370
+ assert json_serialize_datetime(now) == now.isoformat()
1371
+ assert json_serialize_datetime(today) == today.isoformat()
1372
+ try:
1373
+ json_serialize_datetime("not a datetime")
1374
+ raise AssertionError("TypeError not raised for non-datetime object")
1375
+ except TypeError:
1376
+ pass
1377
+ try:
1378
+ json_serialize_datetime(123)
1379
+ raise AssertionError("TypeError not raised for non-datetime object")
1380
+ except TypeError:
1381
+ pass
1382
+
1383
+
1384
def test_bounding_box_operations():
    """
    Test bounding box conversion and IoU calculation.
    """

    ##%% Test convert_yolo_to_xywh

    # YOLO format: [x_center, y_center, w, h]
    # xywh format: [x_min, y_min, width_of_box, height_of_box]
    assert np.allclose(convert_yolo_to_xywh([0.5, 0.5, 0.2, 0.2]),
                       [0.4, 0.4, 0.2, 0.2])


    ##%% Test convert_xywh_to_xyxy

    # xywh format: [x_min, y_min, width_of_box, height_of_box]
    # xyxy format: [x_min, y_min, x_max, y_max]
    assert np.allclose(convert_xywh_to_xyxy([0.1, 0.1, 0.3, 0.3]),
                       [0.1, 0.1, 0.4, 0.4])


    ##%% Test get_iou

    # Each case is ((box_a, box_b), expected_iou); boxes are x/y/w/h
    overlapping_cases = [
        (([0, 0, 0.5, 0.5], [0.25, 0.25, 0.5, 0.5]), 0.142857),
        (([0, 0, 1, 1], [0.5, 0.5, 1, 1]), 0.25 / 1.75)
    ]
    for (box_a, box_b), expected_iou in overlapping_cases:
        assert abs(get_iou(box_a, box_b) - expected_iou) < 1e-5

    # Boxes that only touch at a corner have zero IoU
    assert get_iou([0, 0, 1, 1], [1, 1, 1, 1]) == 0.0

    # Test malformed boxes (should ideally raise error or handle gracefully based on
    # spec, current impl asserts)
    malformed_box = [0.6, 0.0, 0.5, 0.5]  # x_min > x_max after conversion
    valid_box = [0.0, 0.0, 0.5, 0.5]
    try:
        get_iou(malformed_box, valid_box)
        # Deliberately no failure here: get_iou is not currently required to raise
        # for this input.
    except AssertionError as e:
        assert 'Malformed bounding box' in str(e)
1430
def test_detection_processing():
    """
    Test functions related to processing detection results.
    """

    ##%% Test _get_max_conf_from_detections and get_max_conf

    sample_detections = [{'conf': 0.8}, {'conf': 0.9}, {'conf': 0.75}]
    assert _get_max_conf_from_detections(sample_detections) == 0.9
    assert _get_max_conf_from_detections([]) == 0.0
    assert _get_max_conf_from_detections(None) == 0.0

    # get_max_conf should tolerate present, empty, missing, and None 'detections'
    assert get_max_conf({'detections': sample_detections}) == 0.9
    assert get_max_conf({'detections': []}) == 0.0
    assert get_max_conf({}) == 0.0
    assert get_max_conf({'detections': None}) == 0.0


    ##%% Test sort_results_for_image

    img_data = {
        'detections': [
            {'conf': 0.7, 'classifications': [('c', 0.6), ('a', 0.9), ('b', 0.8)]},
            {'conf': 0.9, 'classifications': [('x', 0.95), ('y', 0.85)]},
            {'conf': 0.8}  # No classifications field
        ]
    }
    sort_results_for_image(img_data)

    # Detections should now be in descending-confidence order
    sorted_detections = img_data['detections']
    assert [d['conf'] for d in sorted_detections] == [0.9, 0.8, 0.7]

    # Classifications within each detection should also be sorted by confidence.
    #
    # The detection originally at index 1 is now at index 0...
    assert sorted_detections[0]['classifications'][0] == ('x', 0.95)
    assert sorted_detections[0]['classifications'][1] == ('y', 0.85)

    # ...and the detection originally at index 0 is now at index 2
    assert sorted_detections[2]['classifications'][0] == ('a', 0.9)
    assert sorted_detections[2]['classifications'][1] == ('b', 0.8)
    assert sorted_detections[2]['classifications'][2] == ('c', 0.6)

    # Degenerate cases: sorting should leave these values untouched

    no_detections = {'detections': None}
    sort_results_for_image(no_detections)
    assert no_detections['detections'] is None

    empty_detections = {'detections': []}
    sort_results_for_image(empty_detections)
    assert empty_detections['detections'] == []

    missing_classifications = {'detections': [{'conf': 0.8}]}
    sort_results_for_image(missing_classifications)
    assert 'classifications' not in missing_classifications['detections'][0]

    none_classifications = {'detections': [{'conf': 0.8, 'classifications': None}]}
    sort_results_for_image(none_classifications)
    assert none_classifications['detections'][0]['classifications'] is None

    empty_classifications = {'detections': [{'conf': 0.8, 'classifications': []}]}
    sort_results_for_image(empty_classifications)
    assert empty_classifications['detections'][0]['classifications'] == []
1499
def test_type_checking_and_validation():
    """
    Test type checking and validation utility functions.
    """

    ##%% Test is_float

    for floaty_value in (1.23, "1.23", "-1.23", " 1.23 "):
        assert is_float(floaty_value)
    assert not is_float("abc")
    assert not is_float(None)
    assert is_float(1)  # int is also a float (current behavior)


    ##%% Test is_iterable

    for iterable_value in ([1, 2, 3], "hello", {'a': 1}, range(5), np.array([1, 2])):
        assert is_iterable(iterable_value)
    assert not is_iterable(123)
    assert not is_iterable(None)


    ##%% Test is_empty

    for empty_value in (None, "", np.nan):
        assert is_empty(empty_value)

    # 0, whitespace, empty containers, and False are all considered non-empty
    for non_empty_value in (0, " ", [], {}, False):
        assert not is_empty(non_empty_value)


    ##%% Test min_none and max_none

    assert min_none(1, 2) == 1
    assert min_none(None, 2) == 2
    assert min_none(1, None) == 1
    assert min_none(None, None) is None
    assert max_none(1, 2) == 2
    assert max_none(None, 2) == 2
    assert max_none(1, None) == 1
    assert max_none(None, None) is None


    ##%% Test isnan

    assert isnan(np.nan)
    for non_nan_value in (0.0, "text", None, float('inf'), float('-inf')):
        assert not isnan(non_nan_value)


    ##%% Test sets_overlap

    assert sets_overlap({1, 2, 3}, {3, 4, 5})
    assert not sets_overlap({1, 2}, {3, 4})
    assert sets_overlap([1, 2, 3], [3, 4, 5])  # Also accepts lists
    assert sets_overlap(set(), {1}) is False
    assert sets_overlap({1}, {1})


    ##%% Test is_function_name

    def _test_local_func(): pass
    assert is_function_name("is_float", locals())  # Function imported from ct_utils
    assert is_function_name("_test_local_func", locals())  # Local function
    assert is_function_name("print", locals())  # Builtin
    assert not is_function_name("non_existent_func", locals())

    # Use a distinctive global name to avoid conflicts if this runs multiple times
    global _test_global_func_ct_utils
    def _test_global_func_ct_utils(): pass
    assert is_function_name("_test_global_func_ct_utils", globals())

    # Clean up the global we just created
    del _test_global_func_ct_utils
1583
def test_string_parsing():
    """
    Test string parsing utilities like KVP and boolean parsing.
    """

    ##%% Test parse_kvp and parse_kvp_list

    assert parse_kvp("key=value") == ("key", "value")
    assert parse_kvp("key = value with spaces") == ("key", "value with spaces")

    # Only the first separator splits; the rest stays in the value
    assert parse_kvp("key=value1=value2", kv_separator='=') == ("key", "value1=value2")

    # Bug fix: the previous version raised AssertionError as a "not raised"
    # sentinel inside a try block whose except clause caught AssertionError
    # (the expected exception type), so the sentinel was always swallowed and
    # the check could never fail.  Use a flag instead.
    kvp_error_raised = False
    try:
        parse_kvp("keyvalue")
    except AssertionError:
        kvp_error_raised = True
    assert kvp_error_raised, "AssertionError not raised for invalid KVP"

    kvp_list = ["a=1", "b = 2", "c=foo=bar"]
    parsed_list = parse_kvp_list(kvp_list)
    assert parsed_list == {"a": "1", "b": "2", "c": "foo=bar"}
    assert parse_kvp_list(None) == {}
    assert parse_kvp_list([]) == {}

    # parse_kvp_list modifies d in place if provided
    d_initial = {'z': '0'}
    parse_kvp_list(kvp_list, d=d_initial)
    assert d_initial == {"z": "0", "a": "1", "b": "2", "c": "foo=bar"}

    # Test with a different separator
    assert parse_kvp("key:value", kv_separator=":") == ("key", "value")
    assert parse_kvp_list(["a:1", "b:2"], kv_separator=":") == {"a": "1", "b": "2"}


    ##%% Test dict_to_kvp_list

    d_kvp = {"a": "1", "b": "dog", "c": "foo=bar"}
    kvp_str = dict_to_kvp_list(d_kvp)

    # Order isn't guaranteed, so check for presence of all items and length
    assert "a=1" in kvp_str
    assert "b=dog" in kvp_str
    assert "c=foo=bar" in kvp_str
    assert len(kvp_str.split(' ')) == 3

    assert dict_to_kvp_list({}) == ""
    assert dict_to_kvp_list(None) is None

    # Non-string values: 'error' raises, 'convert' stringifies, 'omit' drops
    d_kvp_int = {"a": 1, "b": "text"}
    try:
        dict_to_kvp_list(d_kvp_int, non_string_value_handling='error')
        raise AssertionError("ValueError not raised for non-string value with 'error' handling")
    except ValueError:
        pass

    convert_result = dict_to_kvp_list(d_kvp_int, non_string_value_handling='convert')
    assert "a=1" in convert_result and "b=text" in convert_result

    omit_result = dict_to_kvp_list({"a": 1, "b": "text"}, non_string_value_handling='omit')
    assert "a=1" not in omit_result and "b=text" in omit_result
    assert omit_result == "b=text"

    assert dict_to_kvp_list({"key": "val"}, item_separator="&", kv_separator=":") == "key:val"


    ##%% Test parse_bool_string

    for true_string in ("true", "True", " TRUE "):
        assert parse_bool_string(true_string)
    for false_string in ("false", "False", " FALSE "):
        assert not parse_bool_string(false_string)

    # Existing bools pass through unchanged
    assert parse_bool_string(True) is True
    assert parse_bool_string(False) is False

    # Invalid strings (including "1", which should not parse to True) raise ValueError
    for invalid_string in ("maybe", "1"):
        try:
            parse_bool_string(invalid_string)
            raise AssertionError("ValueError not raised for invalid bool string")
        except ValueError:
            pass
1666
def test_temp_folder_creation():
    """
    Test temporary folder creation and cleanup.
    """

    def _remove_tree(folder):
        """Remove [folder] if it exists, and verify it's gone."""
        if os.path.exists(folder):
            shutil.rmtree(folder)
        assert not os.path.exists(folder)

    # Store original tempdir for restoration if modified by tests (though
    # unlikely for make_temp_folder)
    original_tempdir = tempfile.gettempdir()

    custom_top_level = "my_custom_temp_app_test"  # Unique name for this test run
    custom_subfolder = "specific_test_run"
    custom_base = os.path.join(tempfile.gettempdir(), custom_top_level)

    ##%% make_temp_folder with the default (UUID) subfolder

    temp_folder1 = make_temp_folder(top_level_folder=custom_top_level)
    assert os.path.exists(temp_folder1)
    assert os.path.basename(os.path.dirname(temp_folder1)) == custom_top_level
    assert custom_base == os.path.dirname(temp_folder1)  # Path up to the UUID should match

    # Cleanup: remove the custom top-level folder, which contains the UUID folder
    _remove_tree(custom_base)

    ##%% make_temp_folder with a specified subfolder

    temp_folder2 = make_temp_folder(top_level_folder=custom_top_level,
                                    subfolder=custom_subfolder,
                                    append_guid=False)
    assert os.path.exists(temp_folder2)
    assert os.path.basename(temp_folder2) == custom_subfolder
    assert os.path.basename(os.path.dirname(temp_folder2)) == custom_top_level
    assert temp_folder2 == os.path.join(tempfile.gettempdir(), custom_top_level, custom_subfolder)

    _remove_tree(custom_base)

    ##%% make_test_folder (which uses 'megadetector/tests' as top_level)

    # This creates tempfile.gettempdir()/megadetector/tests/<uuid or subfolder>
    megadetector_temp_base = os.path.join(tempfile.gettempdir(), "megadetector")
    test_subfolder = "my_specific_module_test"

    # Default subfolder: megadetector/tests/<uuid>
    test_folder1 = make_test_folder()
    assert os.path.exists(test_folder1)
    assert os.path.basename(os.path.dirname(test_folder1)) == "tests"
    assert os.path.basename(os.path.dirname(os.path.dirname(test_folder1))) == "megadetector"

    # Cleanup: remove the 'megadetector' base temp dir
    _remove_tree(megadetector_temp_base)

    # Specified subfolder: megadetector/tests/my_specific_module_test
    test_folder2 = make_test_folder(subfolder=test_subfolder)
    assert os.path.exists(test_folder2)
    assert test_subfolder in test_folder2
    assert "megadetector" in test_folder2

    _remove_tree(megadetector_temp_base)

    ##%% make_temp_folder with all defaults ('megadetector' top-level folder)

    # This creates tempfile.gettempdir()/megadetector/<uuid>
    default_temp_folder = make_temp_folder()
    assert os.path.exists(default_temp_folder)
    assert os.path.basename(os.path.dirname(default_temp_folder)) == "megadetector"

    _remove_tree(megadetector_temp_base)

    # Restore original tempdir if it was changed (though not expected for
    # these functions)
    tempfile.tempdir = original_tempdir
1752
def run_all_module_tests():
    """
    Run all tests in the ct_utils module. This is not invoked by pytest; this is
    just a convenience wrapper for debugging the tests.
    """

    # Tests are invoked in the order they are defined in this file.
    # NOTE(review): assumes each test function cleans up its own state; only
    # test_temp_folder_creation visibly does filesystem cleanup — confirm for
    # the others.
    test_write_json()
    test_path_operations()
    test_geometric_operations()
    test_dictionary_operations()
    test_float_rounding_and_truncation()
    test_object_conversion_and_presentation()
    test_list_operations()
    test_datetime_serialization()
    test_bounding_box_operations()
    test_detection_processing()
    test_type_checking_and_validation()
    test_string_parsing()
    test_temp_folder_creation()