modusa 0.4.30__py3-none-any.whl → 0.4.32__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- modusa/__init__.py +5 -2
- modusa/tools/__init__.py +4 -1
- modusa/tools/audio_stft.py +72 -0
- modusa/tools/synth.py +58 -1
- {modusa-0.4.30.dist-info → modusa-0.4.32.dist-info}/METADATA +1 -1
- {modusa-0.4.30.dist-info → modusa-0.4.32.dist-info}/RECORD +10 -9
- pyproject.toml +1 -1
- {modusa-0.4.30.dist-info → modusa-0.4.32.dist-info}/WHEEL +0 -0
- {modusa-0.4.30.dist-info → modusa-0.4.32.dist-info}/entry_points.txt +0 -0
- {modusa-0.4.30.dist-info → modusa-0.4.32.dist-info}/licenses/LICENSE.md +0 -0
modusa/__init__.py
CHANGED
@@ -9,6 +9,9 @@ from modusa.tools import load_ann, save_ann
|
|
9
9
|
from modusa.tools import dist_plot, hill_plot, plot, fig
|
10
10
|
|
11
11
|
# Synthsizing related
|
12
|
-
from modusa.tools import synth_f0
|
12
|
+
from modusa.tools import synth_f0, synth_clicks
|
13
13
|
|
14
|
-
|
14
|
+
# Audio features related
|
15
|
+
from modusa.tools import stft
|
16
|
+
|
17
|
+
__version__ = "0.4.32" # This is dynamically used by the documentation, and pyproject.toml; Only need to change it here; rest gets taken care of.
|
modusa/tools/__init__.py
CHANGED
@@ -0,0 +1,72 @@
|
|
1
|
+
#!/usr/bin/env python3
|
2
|
+
|
3
|
+
#---------------------------------
|
4
|
+
# Author: Ankit Anand
|
5
|
+
# Date: 23/10/25
|
6
|
+
# Email: ankit0.anand0@gmail.com
|
7
|
+
#---------------------------------
|
8
|
+
|
9
|
+
import numpy as np
|
10
|
+
|
11
|
+
def stft(y, sr, winlen=None, hoplen=None, gamma=None):
|
12
|
+
"""
|
13
|
+
Compute spectrogram with just numpy.
|
14
|
+
|
15
|
+
Parameters
|
16
|
+
----------
|
17
|
+
y: ndarray
|
18
|
+
- Audio signal.
|
19
|
+
sr: int
|
20
|
+
- Sampling rate of the audio signal.
|
21
|
+
winlen: int
|
22
|
+
- Window length in samples.
|
23
|
+
- Default: None => set at 0.064 sec
|
24
|
+
hoplen: int
|
25
|
+
- Hop length in samples.
|
26
|
+
- Default: None => set at one-forth of winlen
|
27
|
+
gamma: int | None
|
28
|
+
- Log compression factor.
|
29
|
+
- Add contrast to the plot.
|
30
|
+
|
31
|
+
Returns
|
32
|
+
-------
|
33
|
+
ndarray:
|
34
|
+
- Spectrogram matrix, complex is gamma is None else real
|
35
|
+
ndarray:
|
36
|
+
- Frequency bins in Hz.
|
37
|
+
ndarray:
|
38
|
+
- Timeframes in sec.
|
39
|
+
"""
|
40
|
+
|
41
|
+
if winlen is None:
|
42
|
+
winlen = 2 ** int(np.log2(0.064 * sr))
|
43
|
+
if hoplen is None:
|
44
|
+
hoplen = int(winlen * 0.25)
|
45
|
+
|
46
|
+
# Estimating the shape of the S matrix
|
47
|
+
M = int(np.ceil(winlen / 2))
|
48
|
+
N = int(np.ceil((y.size - winlen) / hoplen))
|
49
|
+
|
50
|
+
# Initialize the S matrix
|
51
|
+
S = np.empty((M, N), dtype=np.complex64) # M X N => freq bin X time frame
|
52
|
+
|
53
|
+
# We will need a hann window
|
54
|
+
hann = np.hanning(winlen)
|
55
|
+
|
56
|
+
# Get the frames
|
57
|
+
frames = np.lib.stride_tricks.sliding_window_view(y, window_shape=winlen)[::hoplen] # frame X chunk
|
58
|
+
|
59
|
+
# Apply window to the frame
|
60
|
+
frames_windowed = frames * hann # frame X chunk
|
61
|
+
|
62
|
+
# Compute fft for each frame
|
63
|
+
S = np.fft.rfft(frames_windowed, n=winlen, axis=1).T # transpose to match shape (freq_bins, frame)
|
64
|
+
|
65
|
+
# Magnitude spectrogram
|
66
|
+
Sf = np.fft.rfftfreq(winlen, d=1/sr) # Frequency bins (Hz)
|
67
|
+
St = np.arange(N) * hoplen / sr # Time bins (sec)
|
68
|
+
|
69
|
+
if gamma is not None:
|
70
|
+
S = np.log1p(gamma * np.abs(S))
|
71
|
+
|
72
|
+
return S, Sf, St
|
modusa/tools/synth.py
CHANGED
@@ -52,4 +52,61 @@ def synth_f0(f0, f0t, sr, nharm=0):
|
|
52
52
|
# Normalize output to avoid clipping
|
53
53
|
y /= np.max(np.abs(y))
|
54
54
|
|
55
|
-
return y, sr
|
55
|
+
return y, sr
|
56
|
+
|
57
|
+
def synth_clicks(event_times, sr, freq=500, nharm=4, click_duration_ms=5):
|
58
|
+
"""
|
59
|
+
Generate a train of short sine wave clicks with harmonics at specified event times.
|
60
|
+
|
61
|
+
Parameters
|
62
|
+
----------
|
63
|
+
event_times : array-like
|
64
|
+
- Times of events in seconds where clicks should be placed.
|
65
|
+
sr : int
|
66
|
+
- Sampling rate in Hz.
|
67
|
+
freq : float, optional
|
68
|
+
- Fundamental frequency of the sine click in Hz. Default is 500 Hz.
|
69
|
+
nharm : int | None
|
70
|
+
- Number of harmonics to include (including fundamental). Default is 4.
|
71
|
+
click_duration_ms : float | None
|
72
|
+
- Duration of each click in milliseconds. Default is 5 ms.
|
73
|
+
|
74
|
+
Returns
|
75
|
+
-------
|
76
|
+
np.ndarray
|
77
|
+
- Audio signal with sine wave clicks (with harmonics) at event times.
|
78
|
+
int
|
79
|
+
- Sampling rate of the generated click audio.
|
80
|
+
"""
|
81
|
+
|
82
|
+
n_samples = int(np.ceil(sr * event_times[-1]))
|
83
|
+
y = np.zeros(n_samples, dtype=np.float32)
|
84
|
+
|
85
|
+
# Single click length
|
86
|
+
click_len = int(sr * click_duration_ms / 1000)
|
87
|
+
if click_len < 1:
|
88
|
+
click_len = 1
|
89
|
+
|
90
|
+
t = np.arange(click_len) / sr
|
91
|
+
window = np.hanning(click_len)
|
92
|
+
|
93
|
+
# Generate harmonic sine click
|
94
|
+
sine_click = np.zeros(click_len)
|
95
|
+
for n in range(1, nharm+2):
|
96
|
+
sine_click += (1 / n**2) * np.sin(2 * np.pi * freq * n * t)
|
97
|
+
|
98
|
+
# Apply window
|
99
|
+
sine_click = sine_click * window**2
|
100
|
+
|
101
|
+
for event_time in event_times:
|
102
|
+
start_sample = int(event_time * sr)
|
103
|
+
end_sample = start_sample + click_len
|
104
|
+
if end_sample > n_samples:
|
105
|
+
end_sample = n_samples
|
106
|
+
y[start_sample:end_sample] += sine_click[:end_sample - start_sample]
|
107
|
+
|
108
|
+
# Normalize to avoid clipping if clicks overlap
|
109
|
+
y /= np.max(np.abs(y))
|
110
|
+
|
111
|
+
return y, sr
|
112
|
+
|
@@ -1,21 +1,22 @@
|
|
1
1
|
LICENSE.md,sha256=JTaXAjx5awk76VArKCx5dUW8vmLEWsL_ZlR7-umaHbA,1078
|
2
2
|
README.md,sha256=Ybe2rcDecfSCiUpec2n7btQvgyi4R9JG0bfdwSWijWk,981
|
3
|
-
modusa-0.4.
|
4
|
-
modusa-0.4.
|
5
|
-
modusa-0.4.
|
6
|
-
modusa-0.4.
|
7
|
-
modusa/__init__.py,sha256=
|
3
|
+
modusa-0.4.32.dist-info/METADATA,sha256=FpyrNdZ-RNYXR2bP9VBcEjJROVAilRGeeRFQm6DB1AE,1443
|
4
|
+
modusa-0.4.32.dist-info/WHEEL,sha256=9P2ygRxDrTJz3gsagc0Z96ukrxjr-LFBGOgv3AuKlCA,90
|
5
|
+
modusa-0.4.32.dist-info/entry_points.txt,sha256=fmKpleVXj6CdaBVL14WoEy6xx7JQCs85jvzwTi3lePM,73
|
6
|
+
modusa-0.4.32.dist-info/licenses/LICENSE.md,sha256=JTaXAjx5awk76VArKCx5dUW8vmLEWsL_ZlR7-umaHbA,1078
|
7
|
+
modusa/__init__.py,sha256=OBgGLMPzXgtssSpH8N2Thmdcomig7FR17bPLf7UnrQI,520
|
8
8
|
modusa/fonts/NotoSansDevanagari-Regular.ttf,sha256=CEqU2J61Sq-5OgVuFUJcNP2Fn2NCh1Fl0wSDezvPwtI,221084
|
9
9
|
modusa/images/icon.png,sha256=UgGXlL4xjdIYxqO1en3iQfNN1BFsazxpT7NiPZSDu70,13321
|
10
|
-
modusa/tools/__init__.py,sha256=
|
10
|
+
modusa/tools/__init__.py,sha256=1Oryj_Kw1ZgzxMeD4bfzf890sDwgeysGmNJoRxrxfn4,514
|
11
11
|
modusa/tools/ann_loader.py,sha256=m6Qu6jXnQ8LfUhKItoHSaHlGxUyzUJlGEyu4_50qJ8w,3099
|
12
12
|
modusa/tools/ann_saver.py,sha256=rB2gP1rD69PkSnBZrzc_83ylb7eAyqyCMjn9Bh16VaM,650
|
13
13
|
modusa/tools/audio_converter.py,sha256=415qBoPm2sBIuBSI7m1XBKm0AbmVmPydIPPr-uO8D3c,1778
|
14
14
|
modusa/tools/audio_loader.py,sha256=xmeodrJqJV5j9-lrUPk3W9-bdEA4-6RvTAn8pIErUN0,4084
|
15
15
|
modusa/tools/audio_player.py,sha256=kyBUnodkOE9Ox-hKHkfPeGAQ1RPTddbZYXO1ezz6-9w,2494
|
16
16
|
modusa/tools/audio_recorder.py,sha256=cADeeUpPcDIYBIuuVZvWqulDkv7TavkpL3o3SO9QyKc,2787
|
17
|
+
modusa/tools/audio_stft.py,sha256=vy1J-qFUVIkOh5Y1-dyy3zAh26n0IaMtO2D9EMbtITU,1742
|
17
18
|
modusa/tools/plotter.py,sha256=QfF8kCi79nS-J5lQyEuH_BbAmTo-PdfjDbnK9yTAmRE,30863
|
18
|
-
modusa/tools/synth.py,sha256=
|
19
|
+
modusa/tools/synth.py,sha256=qVAxXRz2tK2OBfsYtQJxUHNEFDD-_cCQtzVjb3-bXjA,2795
|
19
20
|
modusa/tools/youtube_downloader.py,sha256=Ij7fipSlRpsf0pFOwRY-j7Yf2PMp0kpWMhyMQchR0e0,1574
|
20
|
-
pyproject.toml,sha256=
|
21
|
-
modusa-0.4.
|
21
|
+
pyproject.toml,sha256=v0k6ker6OK_uwN08B5XX3WplB8CyPWei0Tp9zMbrTyQ,1414
|
22
|
+
modusa-0.4.32.dist-info/RECORD,,
|
pyproject.toml
CHANGED
File without changes
|
File without changes
|
File without changes
|