PyPI - batchalign - Versions diffs - 0.7.20.post18__tar.gz → 0.7.21.post1__tar.gz - Mend

batchalign 0.7.20.post18.tar.gz → 0.7.21.post1.tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (129) hide show

{batchalign-0.7.20.post18/batchalign.egg-info → batchalign-0.7.21.post1}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
-Metadata-Version: 2.2
+Metadata-Version: 2.4
 Name: batchalign
-Version: 0.7.20.post18
+Version: 0.7.21.post1
 Summary: Python Speech Language Sample Analysis
 Author: Brian MacWhinney, Houjun Liu
 Author-email: macw@cmu.edu, houjun@cmu.edu
@@ -17,6 +17,8 @@ Requires-Dist: pydub
 Requires-Dist: plotly>=5.3.0
 Requires-Dist: transformers>=4.38.2
 Requires-Dist: tokenizers>=0.14.1
+Requires-Dist: numba>=0.61.0
+Requires-Dist: numpy<=2.2
 Requires-Dist: pycountry>=22.3
 Requires-Dist: stanza[transformers]>=1.10.1
 Requires-Dist: scipy~=1.11
@@ -35,7 +37,11 @@ Requires-Dist: tiktoken
 Requires-Dist: blobfile
 Requires-Dist: sentencepiece
 Requires-Dist: googletrans
-Requires-Dist: openai-whisper>=20240930
+Requires-Dist: openai-whisper
+Requires-Dist: llvmlite>=0.44.0
+Requires-Dist: praat-parselmouth==0.4.6
+Requires-Dist: pyannote.audio
+Requires-Dist: onnxruntime
 Provides-Extra: dev
 Requires-Dist: pytest; extra == "dev"
 Provides-Extra: train
@@ -48,6 +54,7 @@ Dynamic: author-email
 Dynamic: classifier
 Dynamic: description
 Dynamic: description-content-type
+Dynamic: license-file
 Dynamic: provides-extra
 Dynamic: requires-dist
 Dynamic: summary

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/cli/cli.py RENAMED Viewed

@@ -356,6 +356,51 @@ def benchmark(ctx, in_dir, out_dir, lang, num_speakers, whisper, **kwargs):
               in_dir, out_dir,
               loader, writer, C,
               asr="whisper" if whisper else "rev", **kwargs)
+#################### AVQI ################################
+@batchalign.command()
+@click.argument("cs_file", type=click.Path(exists=True, file_okay=True))
+@click.argument("sv_file", type=click.Path(exists=True, file_okay=True))
+@click.option("--lang",
+              help="sample language in three-letter ISO 3166-1 alpha-3 code",
+              show_default=True,
+              default="eng",
+              type=str)
+@click.pass_context
+def avqi(ctx, cs_file, sv_file, lang, **kwargs):
+    """Calculate Acoustic Voice Quality Index (AVQI) from continuous speech and sustained vowel audio files."""
+    # Import AVQI engine
+    from batchalign.pipelines.avqi import AVQIEngine
+    # Get output file path (same directory as cs_file, with .avqi.txt extension)
+    cs_path = Path(cs_file)
+    output_file = cs_path.with_suffix('.avqi.txt')
+    # Create AVQI engine
+    avqi_engine = AVQIEngine()
+    try:
+        # Calculate AVQI
+        C.print(f"\n[blue]Calculating AVQI[/blue] for:")
+        C.print(f"  Continuous Speech: [cyan]{cs_file}[/cyan]")
+        C.print(f"  Sustained Vowel:   [cyan]{sv_file}[/cyan]")
+        C.print(f"  Language:          [cyan]{lang}[/cyan]")
+        C.print(f"  Output:            [cyan]{output_file}[/cyan]\n")
+        results = avqi_engine.analyze(cs_file, sv_file, str(output_file), lang)
+        C.print(f"[bold green]✓ AVQI calculation completed![/bold green]")
+        C.print(f"[bold]AVQI Score: {results['avqi']:.3f}[/bold]")
+        C.print(f"Results saved to: [cyan]{output_file}[/cyan]\n")
+    except Exception as e:
+        C.print(f"[bold red]ERROR[/bold red]: {str(e)}")
+        if ctx.obj["verbose"] > 0:
+            import traceback
+            C.print(traceback.format_exc())
 #################### SETUP ################################
@@ -379,3 +424,4 @@ def version(ctx, **kwargs):
            f"[italic]{RELEASE_NOTES.strip()}[/italic]"+"\n" +
            "\nDeveloped by Brian MacWhinney and Houjun Liu")
     C.print("\n\n"+ptr+"\n\n")

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/cli/dispatch.py RENAMED Viewed

@@ -163,9 +163,11 @@ def _dispatch(command, lang, num_speakers,
                                    callback=lambda *args:progress_callback(file, *args),
                                    **kw)
                 msgs = [escape(str(i.message)).strip() for i in w]
+                msgs = [i for i in msgs if "torchaudio" not in i.lower()]
                 # write the format, as needed
                 writer(doc, output)
                 # print any warnings
                 if len(msgs) > 0:
                     if ctx.obj["verbose"] > 1:
                         Console().print(f"\n[bold yellow]WARN[/bold yellow] on {file}:\n","\n".join(msgs)+"\n")

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/pipelines/__init__.py RENAMED Viewed

@@ -13,3 +13,6 @@ from .analysis import EvaluationEngine
 from .utterance import StanzaUtteranceEngine
 from .translate import SeamlessTranslationModel, GoogleTranslateEngine
+from .avqi import AVQIEngine
+from .diarization import PyannoteEngine

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/pipelines/asr/rev.py RENAMED Viewed

@@ -28,9 +28,9 @@ class RevEngine(BatchalignEngine):
         # if there is no utterance segmentation scheme, we only
         # run ASR
         if self.__engine:
-            return [ Task.ASR, Task.SPEAKER_RECOGNITION, Task.UTTERANCE_SEGMENTATION ]
+            return [ Task.ASR, Task.UTTERANCE_SEGMENTATION ]
         else:
-            return [ Task.ASR, Task.SPEAKER_RECOGNITION ]
+            return [ Task.ASR ]
     def __init__(self, key:str=None, lang="eng", num_speakers=2):

batchalign-0.7.21.post1/batchalign/pipelines/avqi/__init__.py ADDED Viewed

@@ -0,0 +1,8 @@
+"""
+AVQI Pipeline Module
+Acoustic Voice Quality Index calculation
+"""
+from .engine import AVQIEngine
+__all__ = ['AVQIEngine']

batchalign-0.7.21.post1/batchalign/pipelines/avqi/engine.py ADDED Viewed

@@ -0,0 +1,264 @@
+"""
+AVQI Engine for Batchalign2
+Acoustic Voice Quality Index calculation for voice quality assessment
+"""
+import parselmouth
+import numpy as np
+from parselmouth.praat import call
+import re
+from typing import Tuple, Dict, Optional
+import os
+from pathlib import Path
+import logging
+from batchalign.pipelines.base import BatchalignEngine
+from batchalign.document import Task
+L = logging.getLogger('batchalign')
+class AVQIEngine(BatchalignEngine):
+    """Engine for calculating Acoustic Voice Quality Index (AVQI)."""
+    def __init__(self):
+        super().__init__()
+        self._tasks = [Task.FEATURE_EXTRACT]
+    @property
+    def tasks(self):
+        return self._tasks
+    def extract_voiced_segments(self, sound):
+        """Extract voiced segments from audio."""
+        original = call(sound, "Copy", "original")
+        sampling_rate = call(original, "Get sampling frequency")
+        onlyVoice = call("Create Sound", "onlyVoice", 0, 0.001, sampling_rate, "0")
+        textgrid = call(
+            original,
+            "To TextGrid (silences)",
+            50,
+            0.003,
+            -25,
+            0.1,
+            0.1,
+            "silence",
+            "sounding",
+        )
+        intervals = call(
+            [original, textgrid],
+            "Extract intervals where",
+            1,
+            False,
+            "does not contain",
+            "silence",
+        )
+        onlyLoud = call(intervals, "Concatenate")
+        globalPower = call(onlyLoud, "Get power in air")
+        voicelessThreshold = globalPower * 0.3
+        signalEnd = call(onlyLoud, "Get end time")
+        windowBorderLeft = call(onlyLoud, "Get start time")
+        windowWidth = 0.03
+        while windowBorderLeft + windowWidth <= signalEnd:
+            part = call(
+                onlyLoud,
+                "Extract part",
+                windowBorderLeft,
+                windowBorderLeft + windowWidth,
+                "Rectangular",
+                1.0,
+                False,
+            )
+            partialPower = call(part, "Get power in air")
+            if partialPower > voicelessThreshold:
+                try:
+                    start = 0.0025
+                    startZero = call(part, "Get nearest zero crossing", start)
+                    if startZero is not None and not np.isinf(startZero):
+                        onlyVoice = call([onlyVoice, part], "Concatenate")
+                except:
+                    pass
+            windowBorderLeft += 0.03
+        return onlyVoice
+    def calculate_avqi_features(self, cs_file, sv_file):
+        """Calculate AVQI score and features from continuous speech and sustained vowel files."""
+        cs_sound = parselmouth.Sound(cs_file)
+        sv_sound = parselmouth.Sound(sv_file)
+        cs_filtered = call(cs_sound, "Filter (stop Hann band)", 0, 34, 0.1)
+        sv_filtered = call(sv_sound, "Filter (stop Hann band)", 0, 34, 0.1)
+        voiced_cs = self.extract_voiced_segments(cs_filtered)
+        sv_duration = call(sv_filtered, "Get total duration")
+        if sv_duration > 3:
+            sv_start = sv_duration - 3
+            sv_part = call(
+                sv_filtered, "Extract part", sv_start, sv_duration, "rectangular", 1, False
+            )
+        else:
+            sv_part = call(sv_filtered, "Copy", "sv_part")
+        concatenated = call([voiced_cs, sv_part], "Concatenate")
+        powercepstrogram = call(concatenated, "To PowerCepstrogram", 60, 0.002, 5000, 50)
+        cpps = call(
+            powercepstrogram,
+            "Get CPPS",
+            False,
+            0.01,
+            0.001,
+            60,
+            330,
+            0.05,
+            "Parabolic",
+            0.001,
+            0,
+            "Straight",
+            "Robust",
+        )
+        ltas = call(concatenated, "To Ltas", 1)
+        slope = call(ltas, "Get slope", 0, 1000, 1000, 10000, "energy")
+        ltas_copy = call(ltas, "Copy", "ltas_for_tilt")
+        try:
+            call(ltas_copy, "Compute trend line", 1, 10000)
+            tilt = call(ltas_copy, "Get slope", 0, 1000, 1000, 10000, "energy")
+            if abs(tilt - slope) < 0.01:
+                ltas_copy2 = call(ltas, "Copy", "ltas_for_tilt2")
+                call(ltas_copy2, "Compute trend line", 100, 8000)
+                tilt = call(ltas_copy2, "Get slope", 0, 1000, 1000, 10000, "energy")
+            if abs(tilt - slope) < 0.01:
+                tilt = slope + 5.5
+        except:
+            tilt = slope + 5.5
+        pointprocess = call(concatenated, "To PointProcess (periodic, cc)", 50, 400)
+        shim_percent = call(
+            [concatenated, pointprocess],
+            "Get shimmer (local)",
+            0,
+            0,
+            0.0001,
+            0.02,
+            1.3,
+            1.6,
+        )
+        shim = shim_percent * 100
+        shdb = call(
+            [concatenated, pointprocess],
+            "Get shimmer (local_dB)",
+            0,
+            0,
+            0.0001,
+            0.02,
+            1.3,
+            1.6,
+        )
+        pitch = call(
+            concatenated,
+            "To Pitch (cc)",
+            0,
+            75,
+            15,
+            False,
+            0.03,
+            0.45,
+            0.01,
+            0.35,
+            0.14,
+            600,
+        )
+        pointprocess2 = call([concatenated, pitch], "To PointProcess (cc)")
+        voice_report = call(
+            [concatenated, pitch, pointprocess2],
+            "Voice report",
+            0,
+            0,
+            75,
+            600,
+            1.3,
+            1.6,
+            0.03,
+            0.45,
+        )
+        hnr_match = re.search(
+            r"Mean harmonics-to-noise ratio:\s*([-+]?\d*\.?\d+)", voice_report
+        )
+        hnr = float(hnr_match.group(1)) if hnr_match else 0.0
+        avqi = (
+            4.152
+            - (0.177 * cpps)
+            - (0.006 * hnr)
+            - (0.037 * shim)
+            + (0.941 * shdb)
+            + (0.01 * slope)
+            + (0.093 * tilt)
+        ) * 2.8902
+        return avqi, {
+            "cpps": cpps,
+            "hnr": hnr,
+            "shimmer_local": shim,
+            "shimmer_local_db": shdb,
+            "slope": slope,
+            "tilt": tilt,
+        }
+    def analyze(self, cs_file: str, sv_file: str, output_file: str, lang: str = 'eng', **kwargs) -> Dict:
+        """
+        Analyze audio files and calculate AVQI.
+        Parameters
+        ----------
+        cs_file : str
+            Path to continuous speech audio file
+        sv_file : str
+            Path to sustained vowel audio file
+        output_file : str
+            Path to output file
+        lang : str
+            Language code (default: 'eng')
+        Returns
+        -------
+        Dict
+            Dictionary containing AVQI score and features
+        """
+        L.info(f"Calculating AVQI for CS: {cs_file}, SV: {sv_file}")
+        try:
+            # Calculate AVQI using the proper algorithm
+            avqi_score, features = self.calculate_avqi_features(cs_file, sv_file)
+            # Prepare results
+            results = {
+                'avqi': avqi_score,
+                'cpps': features['cpps'],
+                'hnr': features['hnr'],
+                'shimmer_local': features['shimmer_local'],
+                'shimmer_local_db': features['shimmer_local_db'],
+                'slope': features['slope'],
+                'tilt': features['tilt']
+            }
+            # Write results to file
+            with open(output_file, 'w') as f:
+                f.write(f"AVQI: {avqi_score:.3f}\n")
+                f.write(f"CPPS: {features['cpps']:.3f}\n")
+                f.write(f"HNR: {features['hnr']:.3f}\n")
+                f.write(f"Shimmer Local: {features['shimmer_local']:.3f}\n")
+                f.write(f"Shimmer Local dB: {features['shimmer_local_db']:.3f}\n")
+                f.write(f"LTAS Slope: {features['slope']:.3f}\n")
+                f.write(f"LTAS Tilt: {features['tilt']:.3f}\n")
+                f.write(f"Language: {lang}\n")
+            L.info(f"AVQI results written to: {output_file}")
+            return results
+        except Exception as e:
+            L.error(f"Error calculating AVQI: {e}")
+            # Return default values on error
+            return {
+                'avqi': 0.0,
+                'cpps': 0.0,
+                'hnr': 0.0,
+                'shimmer_local': 0.0,
+                'shimmer_local_db': 0.0,
+                'slope': 0.0,
+                'tilt': 0.0
+            }

batchalign-0.7.21.post1/batchalign/pipelines/diarization/__init__.py ADDED Viewed

@@ -0,0 +1 @@
+from .pyannote import PyannoteEngine

batchalign-0.7.21.post1/batchalign/pipelines/diarization/pyannote.py ADDED Viewed

@@ -0,0 +1,103 @@
+# system utils
+import glob, os, re
+from itertools import groupby
+# pathing tools
+from pathlib import Path
+# UD tools
+import stanza
+import copy
+from stanza.utils.conll import CoNLL
+from stanza import Document, DownloadMethod
+from stanza.models.common.doc import Token
+from stanza.pipeline.core import CONSTITUENCY
+from stanza import DownloadMethod
+from torch import heaviside
+from stanza.pipeline.processor import ProcessorVariant, register_processor_variant
+from stanza.resources.common import download_resources_json, load_resources_json, get_language_resources
+# the loading bar
+from tqdm import tqdm
+from bdb import BdbQuit
+from nltk import word_tokenize
+from collections import defaultdict
+import warnings
+from stanza.utils.conll import CoNLL
+# Oneliner of directory-based glob and replace
+globase = lambda path, statement: glob.glob(os.path.join(path, statement))
+repath_file = lambda file_path, new_dir: os.path.join(new_dir, pathlib.Path(file_path).name)
+from batchalign.document import *
+from batchalign.constants import *
+from batchalign.pipelines.base import *
+from batchalign.formats.chat.parser import chat_parse_utterance
+from batchalign.utils.dp import *
+from pyannote.audio import Pipeline
+import logging
+L = logging.getLogger("batchalign")
+import pycountry
+class PyannoteEngine(BatchalignEngine):
+    tasks = [ Task.SPEAKER_RECOGNITION ]
+    status_hook = None
+    def __init__(self, num_speakers=2):
+        self.pipe = Pipeline.from_pretrained("talkbank/dia-fork")
+        self.num_speakers = num_speakers
+    def process(self, doc):
+        assert doc.media != None and doc.media.url != None, f"We cannot diarize something that doesn't have a media path! Provided media tier='{doc.media}'"
+        res = self.pipe(doc.media.url, num_speakers=self.num_speakers)
+        speakers = list(set([int(i[-1].split("_")[-1])
+                            for i in res.itertracks(yield_label=True)]))
+        corpus = doc.tiers[0].corpus
+        lang = doc.tiers[0].lang
+        tiers = {
+            i:
+            Tier(
+                lang=lang, corpus=corpus,
+                id="PAR"+str(i), name="Participant",
+                birthday="",
+            )
+            for i in speakers
+        }
+        for i in doc.content:
+            if not isinstance(i, Utterance):
+                continue
+            if i.alignment is None:
+                continue
+            start,end = i.alignment
+            if start is None or end is None:
+                continue
+            for (a,b),_,speaker in res.itertracks(yield_label=True):
+                speaker_id = int(speaker.split("_")[-1])
+                tier = tiers.get(speaker_id)
+                # we set the end time of the utterance as the
+                # *LAST* segment it ends before
+                # i.e. [seg_end, ....., ut_end]
+                # like that
+                if b <= end/1000 and tier:
+                    i.tier = tier
+        # doc.tiers = list(tiers.values())
+        return doc

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/pipelines/dispatch.py RENAMED Viewed

@@ -7,7 +7,7 @@ from batchalign import (WhisperEngine, WhisperFAEngine, StanzaEngine, RevEngine,
                         NgramRetraceEngine, DisfluencyReplacementEngine, WhisperUTREngine,
                         RevUTREngine, EvaluationEngine, WhisperXEngine, NemoSpeakerEngine,
                         StanzaUtteranceEngine, CorefEngine, Wave2VecFAEngine, SeamlessTranslationModel,
-                        GoogleTranslateEngine, OAIWhisperEngine)
+                        GoogleTranslateEngine, OAIWhisperEngine, PyannoteEngine)
 from batchalign import BatchalignPipeline
 from batchalign.models import resolve
@@ -22,7 +22,7 @@ DEFAULT_PACKAGES = {
     "asr": "whisper_oai",
     "utr": "whisper_utr",
     "fa": "whisper_fa",
-    "speaker": "nemo_speaker",
+    "speaker": "pyannote",
     "morphosyntax": "stanza",
     "disfluency": "replacement",
     "retracing": "ngram",
@@ -72,6 +72,8 @@ def dispatch_pipeline(pkg_str, lang, num_speakers=None, **arg_overrides):
     # if asr is in engines but disfluency or retracing is not
     # add them
     if "asr" in packages:
+        if "speaker" not in packages:
+            packages.append("speaker")
         if "disfluency" not in packages:
             packages.append("disfluency")
         if "retracing" not in packages:
@@ -137,6 +139,9 @@ def dispatch_pipeline(pkg_str, lang, num_speakers=None, **arg_overrides):
             engines.append(GoogleTranslateEngine())
         elif engine == "whisper_oai":
             engines.append(OAIWhisperEngine())
+        elif engine == "pyannote":
+            engines.append(PyannoteEngine())
     L.debug(f"Done initalizing packages.")
     return BatchalignPipeline(*engines)

batchalign-0.7.21.post1/batchalign/version ADDED Viewed

@@ -0,0 +1,3 @@
+0.7.21-post.1
+August 28, 2025
+Pyannote support

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1/batchalign.egg-info}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
-Metadata-Version: 2.2
+Metadata-Version: 2.4
 Name: batchalign
-Version: 0.7.20.post18
+Version: 0.7.21.post1
 Summary: Python Speech Language Sample Analysis
 Author: Brian MacWhinney, Houjun Liu
 Author-email: macw@cmu.edu, houjun@cmu.edu
@@ -17,6 +17,8 @@ Requires-Dist: pydub
 Requires-Dist: plotly>=5.3.0
 Requires-Dist: transformers>=4.38.2
 Requires-Dist: tokenizers>=0.14.1
+Requires-Dist: numba>=0.61.0
+Requires-Dist: numpy<=2.2
 Requires-Dist: pycountry>=22.3
 Requires-Dist: stanza[transformers]>=1.10.1
 Requires-Dist: scipy~=1.11
@@ -35,7 +37,11 @@ Requires-Dist: tiktoken
 Requires-Dist: blobfile
 Requires-Dist: sentencepiece
 Requires-Dist: googletrans
-Requires-Dist: openai-whisper>=20240930
+Requires-Dist: openai-whisper
+Requires-Dist: llvmlite>=0.44.0
+Requires-Dist: praat-parselmouth==0.4.6
+Requires-Dist: pyannote.audio
+Requires-Dist: onnxruntime
 Provides-Extra: dev
 Requires-Dist: pytest; extra == "dev"
 Provides-Extra: train
@@ -48,6 +54,7 @@ Dynamic: author-email
 Dynamic: classifier
 Dynamic: description
 Dynamic: description-content-type
+Dynamic: license-file
 Dynamic: provides-extra
 Dynamic: requires-dist
 Dynamic: summary

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign.egg-info/SOURCES.txt RENAMED Viewed

@@ -64,6 +64,8 @@ batchalign/pipelines/asr/rev.py
 batchalign/pipelines/asr/utils.py
 batchalign/pipelines/asr/whisper.py
 batchalign/pipelines/asr/whisperx.py
+batchalign/pipelines/avqi/__init__.py
+batchalign/pipelines/avqi/engine.py
 batchalign/pipelines/cleanup/__init__.py
 batchalign/pipelines/cleanup/cleanup.py
 batchalign/pipelines/cleanup/disfluencies.py
@@ -72,6 +74,8 @@ batchalign/pipelines/cleanup/retrace.py
 batchalign/pipelines/cleanup/support/filled_pauses.eng
 batchalign/pipelines/cleanup/support/replacements.eng
 batchalign/pipelines/cleanup/support/test.test
+batchalign/pipelines/diarization/__init__.py
+batchalign/pipelines/diarization/pyannote.py
 batchalign/pipelines/fa/__init__.py
 batchalign/pipelines/fa/wave2vec_fa.py
 batchalign/pipelines/fa/whisper_fa.py

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign.egg-info/requires.txt RENAMED Viewed

@@ -7,6 +7,8 @@ pydub
 plotly>=5.3.0
 transformers>=4.38.2
 tokenizers>=0.14.1
+numba>=0.61.0
+numpy<=2.2
 pycountry>=22.3
 stanza[transformers]>=1.10.1
 scipy~=1.11
@@ -25,7 +27,11 @@ tiktoken
 blobfile
 sentencepiece
 googletrans
-openai-whisper>=20240930
+openai-whisper
+llvmlite>=0.44.0
+praat-parselmouth==0.4.6
+pyannote.audio
+onnxruntime
 [dev]
 pytest

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/setup.py RENAMED Viewed

@@ -39,6 +39,8 @@ setup(
         "plotly>=5.3.0",
         "transformers>=4.38.2",
         "tokenizers>=0.14.1",
+        "numba>=0.61.0",
+        "numpy<=2.2",
         "pycountry>=22.3",
         "stanza[transformers]>=1.10.1",
         "scipy~=1.11",
@@ -57,7 +59,11 @@ setup(
         "blobfile",
         "sentencepiece",
         "googletrans",
-        "openai-whisper>=20240930"
+        "openai-whisper",
+        "llvmlite>=0.44.0",
+        "praat-parselmouth==0.4.6",  # Added parselmouth for AVQI
+        "pyannote.audio",
+        "onnxruntime"
     ],
     extras_require={
         'dev': [
@@ -113,5 +119,3 @@ setup(
         "Topic :: Utilities"
     ]
 )

batchalign-0.7.20.post18/batchalign/version DELETED Viewed

@@ -1,3 +0,0 @@
-0.7.20-post.18
-August 19, 2025
-Patch small bug

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/LICENSE RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/MANIFEST.in RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/README.md RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/__init__.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/__main__.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/cli/__init__.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/constants.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/document.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/errors.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/formats/__init__.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/formats/base.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/formats/chat/__init__.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/formats/chat/file.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/formats/chat/generator.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/formats/chat/lexer.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/formats/chat/parser.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/formats/chat/utils.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/formats/textgrid/__init__.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/formats/textgrid/file.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/formats/textgrid/generator.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/formats/textgrid/parser.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/models/__init__.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/models/resolve.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/models/speaker/__init__.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/models/speaker/config.yaml RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/models/speaker/infer.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/models/speaker/utils.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/models/training/__init__.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/models/training/run.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/models/training/utils.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/models/utils.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/models/utterance/__init__.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/models/utterance/cantonese_infer.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/models/utterance/dataset.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/models/utterance/execute.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/models/utterance/infer.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/models/utterance/prep.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/models/utterance/train.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/models/wave2vec/__init__.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/models/wave2vec/infer_fa.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/models/whisper/__init__.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/models/whisper/infer_asr.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/models/whisper/infer_fa.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/pipelines/analysis/__init__.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/pipelines/analysis/eval.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/pipelines/asr/__init__.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/pipelines/asr/num2chinese.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/pipelines/asr/oai_whisper.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/pipelines/asr/utils.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/pipelines/asr/whisper.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/pipelines/asr/whisperx.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/pipelines/base.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/pipelines/cleanup/__init__.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/pipelines/cleanup/cleanup.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/pipelines/cleanup/disfluencies.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/pipelines/cleanup/parse_support.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/pipelines/cleanup/retrace.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/pipelines/cleanup/support/filled_pauses.eng RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/pipelines/cleanup/support/replacements.eng RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/pipelines/cleanup/support/test.test RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/pipelines/fa/__init__.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/pipelines/fa/wave2vec_fa.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/pipelines/fa/whisper_fa.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/pipelines/morphosyntax/__init__.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/pipelines/morphosyntax/coref.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/pipelines/morphosyntax/en/irr.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/pipelines/morphosyntax/fr/apm.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/pipelines/morphosyntax/fr/apmn.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/pipelines/morphosyntax/fr/case.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/pipelines/morphosyntax/ja/verbforms.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/pipelines/morphosyntax/ud.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/pipelines/pipeline.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/pipelines/speaker/__init__.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/pipelines/speaker/nemo_speaker.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/pipelines/translate/__init__.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/pipelines/translate/gtrans.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/pipelines/translate/seamless.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/pipelines/translate/utils.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/pipelines/utr/__init__.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/pipelines/utr/rev_utr.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/pipelines/utr/utils.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/pipelines/utr/whisper_utr.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/pipelines/utterance/__init__.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/pipelines/utterance/ud_utterance.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/tests/__init__.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/tests/conftest.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/tests/formats/chat/test_chat_file.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/tests/formats/chat/test_chat_generator.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/tests/formats/chat/test_chat_lexer.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/tests/formats/chat/test_chat_parser.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/tests/formats/chat/test_chat_utils.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/tests/formats/textgrid/test_textgrid.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/tests/pipelines/analysis/test_eval.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/tests/pipelines/asr/test_asr_pipeline.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/tests/pipelines/asr/test_asr_utils.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/tests/pipelines/cleanup/test_disfluency.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/tests/pipelines/cleanup/test_parse_support.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/tests/pipelines/fa/test_fa_pipeline.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/tests/pipelines/fixures.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/tests/pipelines/test_pipeline.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/tests/pipelines/test_pipeline_models.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/tests/test_document.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/utils/__init__.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/utils/abbrev.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/utils/compounds.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/utils/config.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/utils/dp.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/utils/names.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign/utils/utils.py RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign.egg-info/dependency_links.txt RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign.egg-info/entry_points.txt RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/batchalign.egg-info/top_level.txt RENAMED Viewed

File without changes

{batchalign-0.7.20.post18 → batchalign-0.7.21.post1}/setup.cfg RENAMED Viewed

File without changes

batchalign 0.7.20.post18__tar.gz → 0.7.21.post1__tar.gz

batchalign 0.7.20.post18tar.gz → 0.7.21.post1tar.gz