PyPI - sonusai - Versions diffs - 0.20.2__py3-none-any.whl → 1.0.1__py3-none-any.whl - Mend

sonusai 0.20.2__py3-none-any.whl → 1.0.1__py3-none-any.whl

This diff compares the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (97)

sonusai/__init__.py +16 -3
sonusai/audiofe.py +240 -76
sonusai/calc_metric_spenh.py +71 -73
sonusai/config/__init__.py +3 -0
sonusai/config/config.py +61 -0
sonusai/config/config.yml +20 -0
sonusai/config/constants.py +8 -0
sonusai/constants.py +11 -0
sonusai/data/genmixdb.yml +21 -36
sonusai/{mixture/datatypes.py → datatypes.py} +91 -130
sonusai/deprecated/plot.py +4 -5
sonusai/doc/doc.py +4 -4
sonusai/doc.py +11 -4
sonusai/genft.py +43 -45
sonusai/genmetrics.py +23 -19
sonusai/genmix.py +54 -82
sonusai/genmixdb.py +88 -264
sonusai/ir_metric.py +30 -34
sonusai/lsdb.py +41 -48
sonusai/main.py +15 -22
sonusai/metrics/calc_audio_stats.py +4 -17
sonusai/metrics/calc_class_weights.py +4 -4
sonusai/metrics/calc_optimal_thresholds.py +8 -5
sonusai/metrics/calc_pesq.py +2 -2
sonusai/metrics/calc_segsnr_f.py +4 -4
sonusai/metrics/calc_speech.py +25 -13
sonusai/metrics/class_summary.py +7 -7
sonusai/metrics/confusion_matrix_summary.py +5 -5
sonusai/metrics/one_hot.py +4 -4
sonusai/metrics/snr_summary.py +7 -7
sonusai/metrics_summary.py +38 -45
sonusai/mixture/__init__.py +5 -104
sonusai/mixture/audio.py +10 -39
sonusai/mixture/class_balancing.py +103 -0
sonusai/mixture/config.py +251 -271
sonusai/mixture/constants.py +35 -39
sonusai/mixture/data_io.py +25 -36
sonusai/mixture/db_datatypes.py +58 -22
sonusai/mixture/effects.py +386 -0
sonusai/mixture/feature.py +7 -11
sonusai/mixture/generation.py +484 -611
sonusai/mixture/helpers.py +82 -184
sonusai/mixture/ir_delay.py +3 -4
sonusai/mixture/ir_effects.py +77 -0
sonusai/mixture/log_duration_and_sizes.py +6 -12
sonusai/mixture/mixdb.py +931 -669
sonusai/mixture/pad_audio.py +35 -0
sonusai/mixture/resample.py +7 -0
sonusai/mixture/sox_effects.py +195 -0
sonusai/mixture/sox_help.py +650 -0
sonusai/mixture/spectral_mask.py +2 -2
sonusai/mixture/truth.py +17 -15
sonusai/mixture/truth_functions/crm.py +12 -12
sonusai/mixture/truth_functions/energy.py +22 -22
sonusai/mixture/truth_functions/file.py +5 -5
sonusai/mixture/truth_functions/metadata.py +4 -4
sonusai/mixture/truth_functions/metrics.py +4 -4
sonusai/mixture/truth_functions/phoneme.py +3 -3
sonusai/mixture/truth_functions/sed.py +11 -13
sonusai/mixture/truth_functions/target.py +10 -10
sonusai/mkwav.py +26 -29
sonusai/onnx_predict.py +240 -88
sonusai/queries/__init__.py +2 -2
sonusai/queries/queries.py +38 -34
sonusai/speech/librispeech.py +1 -1
sonusai/speech/mcgill.py +1 -1
sonusai/speech/timit.py +2 -2
sonusai/summarize_metric_spenh.py +10 -17
sonusai/utils/__init__.py +7 -1
sonusai/utils/asl_p56.py +2 -2
sonusai/utils/asr.py +2 -2
sonusai/utils/asr_functions/aaware_whisper.py +4 -5
sonusai/utils/choice.py +31 -0
sonusai/utils/compress.py +1 -1
sonusai/utils/dataclass_from_dict.py +19 -1
sonusai/utils/energy_f.py +3 -3
sonusai/utils/evaluate_random_rule.py +15 -0
sonusai/utils/keyboard_interrupt.py +12 -0
sonusai/utils/onnx_utils.py +3 -17
sonusai/utils/print_mixture_details.py +21 -19
sonusai/utils/{temp_seed.py → rand.py} +3 -3
sonusai/utils/read_predict_data.py +2 -2
sonusai/utils/reshape.py +3 -3
sonusai/utils/stratified_shuffle_split.py +3 -3
sonusai/{mixture → utils}/tokenized_shell_vars.py +1 -1
sonusai/utils/write_audio.py +2 -2
sonusai/vars.py +11 -4
{sonusai-0.20.2.dist-info → sonusai-1.0.1.dist-info}/METADATA +4 -2
sonusai-1.0.1.dist-info/RECORD +138 -0
sonusai/mixture/augmentation.py +0 -444
sonusai/mixture/class_count.py +0 -15
sonusai/mixture/eq_rule_is_valid.py +0 -45
sonusai/mixture/target_class_balancing.py +0 -107
sonusai/mixture/targets.py +0 -175
sonusai-0.20.2.dist-info/RECORD +0 -128
{sonusai-0.20.2.dist-info → sonusai-1.0.1.dist-info}/WHEEL +0 -0
{sonusai-0.20.2.dist-info → sonusai-1.0.1.dist-info}/entry_points.txt +0 -0

sonusai/__init__.py CHANGED Viewed

@@ -3,9 +3,6 @@ from importlib import metadata
 from os.path import dirname
 from rich.logging import RichHandler
-from rich.traceback import install
-install(show_locals=True)
 __version__ = metadata.version(__package__)  # pyright: ignore [reportArgumentType]
 BASEDIR = dirname(__file__)
@@ -81,3 +78,19 @@ def commands_list(doc: str = commands_doc) -> list[str]:
         if command:
             commands.append(command)
     return commands
+def exception_handler(e: Exception) -> None:
+    import sys
+    from rich.console import Console
+    logger.error(f"{type(e).__name__}: {e}")
+    handlers = [handler for handler in logger.handlers if isinstance(handler, logging.FileHandler)]
+    logger.error(f"See {', '.join(handler.baseFilename for handler in handlers)} for details")
+    console = Console(color_system=None)
+    with console.capture() as capture:
+        console.print_exception(show_locals=False)
+    logger.debug(capture.get())
+    sys.exit(1)

sonusai/audiofe.py CHANGED Viewed

@@ -1,17 +1,23 @@
 """sonusai audiofe
-usage: audiofe [-hvds] [--version] [-i INPUT] [-l LENGTH] [-m MODEL] [-a ASR] [-w WMODEL]
+usage: audiofe [-hvdsp] [--version] [-i INPUT] [-l LENGTH] [-a ASR] [-n NOISEDB]
+                        [-w WMODEL] [-o FEATURE] MODEL
 options:
     -h, --help
     -v, --verbose                   Be verbose.
     -d, --debug                     Write debug data to H5 file.
     -s, --show                      Display a list of available audio inputs.
-    -i INPUT, --input INPUT         Input audio.
+    -i INPUT, --input INPUT         Audio source from ALSA or .wav file. See -s or arecord -L. [default: default]
     -l LENGTH, --length LENGTH      Length of audio in seconds. [default: -1].
-    -m MODEL, --model MODEL         ONNX model.
+    -m MODEL, --model MODEL         SonusAI ONNX model applied to the captured audio.
+    -n NOISEDB, --noiseadd NOISEDB  Amount of noise to keep in clean audio output. [default: -30]
+    -p, --playback                  Enable playback of noisy audio, then the model prediction output audio
     -a ASR, --asr ASR               ASR method to use.
     -w WMODEL, --whisper WMODEL     Model used in whisper, aixplain_whisper and faster_whisper methods. [default: tiny].
+    -o FEATURE, --feature-overlap   Run SonusAI model in overlap-streaming mode using FEATURE which is an 8-10 character
+                                    string specifying a stride-overlap feature of the same type as the model, i.e. a
+                                    model with default feature of hun00ns1 could use hun00nv80 or hun00nv128, etc.
 Aaware SonusAI Audio Front End.
@@ -35,68 +41,40 @@ audiofe_<TIMESTAMP>.h5.
 """
-import signal
 import numpy as np
 from sonusai.mixture import AudioT
-def signal_handler(_sig, _frame):
-    import sys
-    from sonusai import logger
-    logger.info("Canceled due to keyboard interrupt")
-    sys.exit(1)
-signal.signal(signal.SIGINT, signal_handler)
 def main() -> None:
     from docopt import docopt
-    import sonusai
+    from sonusai import __version__ as sai_version
     from sonusai.utils import trim_docstring
-    args = docopt(trim_docstring(__doc__), version=sonusai.__version__, options_first=True)
+    args = docopt(trim_docstring(__doc__), version=sai_version, options_first=True)
     verbose = args["--verbose"]
     length = float(args["--length"])
     input_name = args["--input"]
-    model_name = args["--model"]
+    feature_ovr = args["--feature-overlap"]
     asr_name = args["--asr"]
     whisper_name = args["--whisper"]
     debug = args["--debug"]
     show = args["--show"]
+    playback = args["--playback"]
+    noiseadd = args["--noiseadd"]
+    model_name = args["MODEL"]
-    from os.path import exists
-    import h5py
     import pyaudio
     from sonusai import create_file_handler
     from sonusai import initial_log_messages
     from sonusai import logger
     from sonusai import update_console_handler
-    from sonusai.mixture import SAMPLE_RATE
-    from sonusai.mixture import get_audio_from_feature
-    from sonusai.mixture import get_feature_from_audio
-    from sonusai.utils import calc_asr
     from sonusai.utils import create_timestamp
     from sonusai.utils import get_input_devices
     from sonusai.utils import load_ort_session
-    from sonusai.utils import write_audio
-    ts = create_timestamp()
-    capture_name = f"audiofe_capture_{ts}"
-    capture_wav = capture_name + ".wav"
-    capture_png = capture_name + ".png"
-    predict_name = f"audiofe_predict_{ts}"
-    predict_wav = predict_name + ".wav"
-    predict_png = predict_name + ".png"
-    h5_name = f"audiofe_{ts}.h5"
     # Setup logging file
     create_file_handler("audiofe.log")
@@ -111,7 +89,91 @@ def main() -> None:
             logger.info(f"{name}")
         logger.info("")
         p.terminate()
-        return
+        # return
+    ts = create_timestamp()
+    capture_name = f"{ts}-noisy"
+    capture_wav = capture_name + ".wav"
+    capture_png = capture_name + ".png"
+    predict_name = f"{ts}-pred"
+    predict_wav = predict_name + ".wav"
+    predict_png = predict_name + ".png"
+    h5_name = f"{ts}-audiofe.h5"
+    if model_name is not None:
+        session, options, model_root, hparams, sess_inputs, sess_outputs = load_ort_session(model_name)
+        if hparams is None:
+            logger.error("Error: ONNX model does not have required SonusAI hyperparameters, cannot proceed.")
+            raise SystemExit(1)
+        feature_mode = hparams["feature"]
+        if feature_ovr is not None:
+            # TBD checks for match and valid feature_ovr
+            stride = int(feature_ovr[7:])
+            sov_type = feature_ovr[6]  # v,e,f,t supported, need to calculate stride from tstep
+            if sov_type == "v":
+                feat_step = int(np.ceil(0.5 * stride))
+            elif sov_type == "e":
+                feat_step = int(np.ceil(4 * stride / 5))
+            elif sov_type == "f":
+                feat_step = int(np.ceil(3 * stride / 4))
+            elif sov_type == "t":
+                feat_step = int(np.ceil(2 * stride / 3))
+            else:
+                logger.error("Override feature does not have a supported overlap mode, exiting.")
+                raise SystemExit(1)
+            feature_orig = feature_mode
+            feature_mode = feature_ovr
+            logger.info(
+                f"Overriding feature with {feature_ovr} (was {feature_orig}), with stride={stride}, step={feat_step}."
+            )
+        else:
+            feat_step = 1
+        from pyaaware import FeatureGenerator
+        fg = FeatureGenerator(feature_mode=feature_mode)
+        ftn = fg.ftransform_length  # feature transform length
+        ftr = fg.ftransform_overlap  # forward transform samples per step (R)
+        fstride = fg.stride  # feature stride
+        fsamples = fstride * ftr  # total samples in feature
+        in0name = sess_inputs[0].name
+        in0type = sess_inputs[0].type
+        out_names = [n.name for n in session.get_outputs()]
+        if len(sess_inputs) != 1:
+            logger.error(f"Error: ONNX model does not have 1 input, but {len(sess_inputs)}. Exit due to unknown input.")
+            raise SystemExit(1)
+        if verbose:
+            logger.info(f"Read and compiled ONNX model from {model_name}.")
+            import onnx
+            omodel = onnx.load(model_name)
+            from sonusai.utils.onnx_utils import get_and_check_inputs
+            from sonusai.utils.onnx_utils import get_and_check_outputs
+            logger.info(f"Onnx model uses ir_version {omodel.ir_version}")
+            onnx_inputs, inshapes = get_and_check_inputs(omodel)  # Note: logs warning if # inputs > 1
+            logger.info(f"Onnx model input has {len(inshapes[0])} dims with shape (0 means dynamic): {inshapes[0]}")
+            logger.info(f"Onnx model input has type: {in0type}")
+            onnx_outputs, oshapes = get_and_check_outputs(omodel)
+            logger.info(f"Onnx model output has {len(oshapes[0])} dims with shape (0 means dynamic): {oshapes[0]}")
+            import onnxruntime as ort
+            providers = ort.get_available_providers()
+            logger.info(f"ONNX runtime available providers: {providers}.")
+    else:
+        logger.error("No ONNX model provided, exiting.")
+        raise SystemExit(1)
+    from os.path import exists
+    import h5py
+    from sonusai.constants import SAMPLE_RATE
+    from sonusai.mixture import get_audio_from_feature
+    from sonusai.mixture import get_feature_from_audio
+    from sonusai.utils import calc_asr
+    from sonusai.utils import write_audio
     if input_name is not None and exists(input_name):
         capture_audio = get_frames_from_file(input_name, length)
@@ -123,8 +185,12 @@ def main() -> None:
             return
         # Only write if capture from device, not for file input
         write_audio(capture_wav, capture_audio, SAMPLE_RATE)
-        logger.info("")
-        logger.info(f"Wrote capture audio with shape {capture_audio.shape} to {capture_wav}")
+        logger.debug("")
+        logger.debug(f"Wrote capture audio with shape {capture_audio.shape} to {capture_wav}")
+    # Pad audio to transform step size
+    padlen_tf = int(np.ceil(len(capture_audio) / ftr)) * ftr - len(capture_audio)
+    capture_audio = np.pad(capture_audio, (0, padlen_tf), "constant", constant_values=(0, 0))
     if debug:
         with h5py.File(h5_name, "a") as f:
@@ -135,24 +201,16 @@ def main() -> None:
     if asr_name is not None:
         logger.info(f"Running ASR on captured audio with {asr_name} ...")
-        capture_asr = calc_asr(capture_audio, engine=asr_name, whisper_model_name=whisper_name).text
-        logger.info(f"Capture audio ASR: {capture_asr}")
+        capture_asr = calc_asr(capture_audio, engine=asr_name, model=whisper_name).text
+        logger.info(f"Noisy audio ASR: {capture_asr}")
     if model_name is not None:
-        session, options, model_root, hparams, sess_inputs, sess_outputs = load_ort_session(model_name)
-        if hparams is None:
-            logger.error("Error: ONNX model does not have required SonusAI hyperparameters, cannot proceed.")
-            raise SystemExit(1)
-        feature_mode = hparams["feature"]
-        in0name = sess_inputs[0].name
-        in0type = sess_inputs[0].type
-        out_names = [n.name for n in session.get_outputs()]
-        # frames x stride x feat_params
-        feature = get_feature_from_audio(audio=capture_audio, feature_mode=feature_mode)
-        save_figure(capture_png, capture_audio, feature)
-        logger.info(f"Wrote capture plots to {capture_png}")
+        # Pad audio to fill total feature stride * transform stride samples
+        padlen = int(np.ceil(len(capture_audio) / fsamples)) * fsamples - len(capture_audio)
+        capture_audio_p = np.pad(capture_audio, (0, padlen), "constant", constant_values=(0, 0))
+        # feature always frames x stride x feat_params, convert to always Batch x Tsteps x Bins
+        feature = get_feature_from_audio(audio=capture_audio_p, feature_mode=feature_mode)
         if debug:
             with h5py.File(h5_name, "a") as f:
                 if "feature" in f:
@@ -160,25 +218,61 @@ def main() -> None:
                 f.create_dataset("feature", data=feature)
             logger.info(f"Wrote feature with shape {feature.shape} to {h5_name}")
+        feat_nov = sov2nov(feature, feat_step)  # remove overlap, output always Batch x Tsteps x Bins
+        # TBD remove padding of feature-stride
+        # if padlen > 0:
+        save_figure(capture_png, capture_audio, feat_nov)
+        logger.info(f"Wrote capture plots to {capture_png}")
+        if feature_ovr is not None:
+            test_audio = get_audio_from_feature(feature=feat_nov, feature_mode=feature_orig)
+            # write_audio(f'{ts}-noisy-itf.wav', test_audio, SAMPLE_RATE)
+        else:
+            # feature is frames x 1 x Bins, reshape to 1 x frames x Bins for model
+            feature = feature.transpose((1, 0, 2))
         if in0type.find("float16") != -1:
             logger.info("Detected input of float16, converting all feature inputs to that type.")
-            feature = np.float16(feature)  # type: ignore[assignment]
+            feature = np.float16(feature)  # type: ignore
         # Run inference, ort session wants batch x timesteps x feat_params, outputs numpy BxTxFP or BxFP
         # Note full reshape not needed here since we assume speech enhancement type model, so a transpose suffices
-        predict = np.transpose(
-            session.run(out_names, {in0name: np.transpose(feature, (1, 0, 2))})[0],
-            (1, 0, 2),
-        )
+        logger.info(f"Running model on data with shape {feature.shape} ...")
+        if feature_ovr is None:
+            predict = session.run(out_names, {in0name: feature})[0]  # standard mode (entire batch)
+        else:
+            predict = np.zeros(feature.shape)
+            for i in range(predict.shape[0]):
+                logger.debug(f"running batch: {i}")
+                predict[i, :, :] = session.run(out_names, {in0name: feature[i : i + 1, :, :]})[0]
         if debug:
             with h5py.File(h5_name, "a") as f:
                 if "predict" in f:
                     del f["predict"]
                 f.create_dataset("predict", data=predict)
-            logger.info(f"Wrote predict with shape {predict.shape} to {h5_name}")
+            logger.info(f"Wrote predict data with shape {predict.shape} to {h5_name}")
+        if feature_ovr is not None:
+            predict = sov2nov(predict, feat_step)  # always returns batch x tsteps x feat_params
+            predict_audio = get_audio_from_feature(feature=predict, feature_mode=feature_orig)
+        else:
+            predict = predict.transpose((1, 0, 2))  # need transpose to frames x 1 x bins
+            predict_audio = get_audio_from_feature(feature=predict, feature_mode=feature_mode)
+        if predict_audio.shape[0] > capture_audio.shape[0]:
+            predict_audio = predict_audio[0 : (capture_audio.shape[0] - predict_audio.shape[0])]
+        if predict_audio.shape[0] < capture_audio.shape[0]:
+            capture_audio = capture_audio[0 : (predict_audio.shape[0] - capture_audio.shape[0])]
+        if noiseadd is not None:
+            ngain = np.power(10, min(float(noiseadd), 0.0) / 20.0)  # limit to gain <1, convert to float
+            if ngain < 1.0:  # don't apply if it's 1.0
+                logger.info(f"Adding back noise with gain of {ngain} = {noiseadd} db.")
+                noise = capture_audio - predict_audio
+                predict_audio = predict_audio + ngain * noise
-        predict_audio = get_audio_from_feature(feature=predict, feature_mode=feature_mode)
         write_audio(predict_wav, predict_audio, SAMPLE_RATE)
         logger.info(f"Wrote predict audio with shape {predict_audio.shape} to {predict_wav}")
         if debug:
@@ -193,9 +287,35 @@ def main() -> None:
         if asr_name is not None:
             logger.info(f"Running ASR on model-enhanced audio with {asr_name} ...")
-            predict_asr = calc_asr(predict_audio, engine=asr_name, whisper_model_name=whisper_name).text
+            predict_asr = calc_asr(predict_audio, engine=asr_name, model=whisper_name).text
             logger.info(f"Predict audio ASR: {predict_asr}")
+        plot_en = True
+        if plot_en is not None:
+            import subprocess
+            # Construct plot command using spgramd, start the process non-blocking (will leave matplot open)
+            command = ["python", "spgramd.py", capture_wav, predict_wav]
+            process = subprocess.Popen(command, stdout=subprocess.PIPE, stderr=subprocess.PIPE, text=True)
+        if playback is not None:
+            import sh
+            sh.play(capture_wav)
+            sh.play(predict_wav)
+            flag_end = False
+            while not flag_end:
+                choice = input("Press 'r' to replay or 'q' to quit: ").strip().lower()
+                if choice == "q":
+                    print("Quitting...")
+                    flag_end = True
+                elif choice == "r":
+                    print("Replaying...")
+                    sh.play(capture_wav)
+                    sh.play(predict_wav)
+                else:
+                    print("Invalid input. Please try again.")
 def get_frames_from_device(input_name: str | None, length: float, chunk: int = 1024) -> AudioT:
     from select import select
@@ -204,8 +324,8 @@ def get_frames_from_device(input_name: str | None, length: float, chunk: int = 1
     import pyaudio
     from sonusai import logger
-    from sonusai.mixture import CHANNEL_COUNT
-    from sonusai.mixture import SAMPLE_RATE
+    from sonusai.constants import CHANNEL_COUNT
+    from sonusai.constants import SAMPLE_RATE
     from sonusai.utils import get_input_device_index_by_name
     from sonusai.utils import get_input_devices
@@ -220,20 +340,16 @@ def get_frames_from_device(input_name: str | None, length: float, chunk: int = 1
     try:
         device_index = get_input_device_index_by_name(p, input_name)
-    except ValueError as e:
+    except ValueError as ex:
         msg = f"Could not find {input_name}\n"
         msg += "Available devices:\n"
         for input_device in input_devices:
             msg += f"  {input_device}\n"
-        raise ValueError(msg) from e
+        raise ValueError(msg) from ex
     logger.info(f"Capturing from {p.get_device_info_by_index(device_index).get('name')}")
     stream = p.open(
-        format=pyaudio.paFloat32,
-        channels=CHANNEL_COUNT,
-        rate=SAMPLE_RATE,
-        input=True,
-        input_device_index=device_index,
+        format=pyaudio.paFloat32, channels=CHANNEL_COUNT, rate=SAMPLE_RATE, input=True, input_device_index=device_index
     )
     stream.start_stream()
@@ -269,7 +385,7 @@ def get_frames_from_device(input_name: str | None, length: float, chunk: int = 1
 def get_frames_from_file(input_name: str, length: float) -> AudioT:
     from sonusai import logger
-    from sonusai.mixture import SAMPLE_RATE
+    from sonusai.constants import SAMPLE_RATE
     from sonusai.mixture import read_audio
     logger.info(f"Capturing from {input_name}")
@@ -281,14 +397,30 @@ def get_frames_from_file(input_name: str, length: float) -> AudioT:
     return frames
+def sov2nov(feature: np.ndarray, step: int) -> np.ndarray:
+    """Convert stride-overlap batch x stride x bins to no overlap frames x 1 x bins"""
+    stride = feature.shape[1]  # stride, tsteps is set to stride in sov mode
+    if stride == 1:
+        return feature  # no reshape if stride is already 1
+    # else:
+    #     hs = feature.shape[1]//2   # half of stride
+    #     nb = feature.shape[0]      # batches
+    nb = feature.shape[0]
+    fout = feature[:, (stride - step) :, :]  # take last
+    fout = np.reshape(fout, [step * nb, 1, feature.shape[2]])
+    return fout  # np.transpose(fout,[1,0,2])
 def save_figure(name: str, audio: np.ndarray, feature: np.ndarray) -> None:
     import matplotlib.pyplot as plt
     from scipy.interpolate import CubicSpline
-    from sonusai.mixture import SAMPLE_RATE
+    from sonusai.constants import SAMPLE_RATE
     from sonusai.utils import unstack_complex
-    spectrum = 20 * np.log(np.abs(np.squeeze(unstack_complex(feature)).transpose()))
+    spectrum = 20 * np.log(np.abs(np.squeeze(unstack_complex(feature)).transpose()) + 1e-7)
     frames = spectrum.shape[1]
     samples = (len(audio) // frames) * frames
     length_in_s = samples / SAMPLE_RATE
@@ -314,4 +446,36 @@ def save_figure(name: str, audio: np.ndarray, feature: np.ndarray) -> None:
 if __name__ == "__main__":
-    main()
+    from sonusai import exception_handler
+    from sonusai.utils import register_keyboard_interrupt
+    register_keyboard_interrupt()
+    try:
+        main()
+    except Exception as e:
+        exception_handler(e)
+# import subprocess
+#
+# # Define the arguments
+# arg1 = "value1"
+# arg2 = "value2"
+#
+# # Construct the command
+# command = ["python", "script.py", arg1, arg2]
+#
+# # Start the process
+# process = subprocess.Popen(command, stdout=subprocess.PIPE, stderr=subprocess.PIPE, text=True)
+#
+# # Optionally, you can communicate with the process later if needed
+# # For example, to wait for the process to finish and get the output
+# stdout, stderr = process.communicate()
+#
+# # Check if the process was successful
+# if process.returncode == 0:
+#     print("Process executed successfully:")
+#     print(stdout)
+# else:
+#     print("Process failed:")
+#     print(stderr)

sonusai 0.20.2__py3-none-any.whl → 1.0.1__py3-none-any.whl

sonusai 0.20.2__py3-none-any.whl → 1.0.1__py3-none-any.whl