neverlib 0.2.3__py3-none-any.whl → 0.2.4__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (207) hide show
  1. neverlib/.history/Docs/audio_aug/test_snr_20250806011311.py +0 -0
  2. neverlib/.history/Docs/audio_aug/test_snr_20250806011331.py +75 -0
  3. neverlib/.history/Docs/audio_aug/test_snr_20250806011342.py +57 -0
  4. neverlib/.history/Docs/audio_aug/test_snr_20250806011352.py +57 -0
  5. neverlib/.history/Docs/audio_aug/test_snr_20250806011403.py +57 -0
  6. neverlib/.history/Docs/audio_aug/test_snr_20250806011413.py +57 -0
  7. neverlib/.history/Docs/audio_aug/test_snr_20250806011435.py +55 -0
  8. neverlib/.history/Docs/vad/1_20250810032405.py +0 -0
  9. neverlib/.history/Docs/vad/1_20250810032417.py +39 -0
  10. neverlib/.history/audio_aug/audio_aug_20250806010451.py +125 -0
  11. neverlib/.history/audio_aug/audio_aug_20250806010750.py +138 -0
  12. neverlib/.history/audio_aug/audio_aug_20250806010759.py +140 -0
  13. neverlib/.history/audio_aug/audio_aug_20250806010803.py +140 -0
  14. neverlib/.history/audio_aug/audio_aug_20250806010809.py +140 -0
  15. neverlib/.history/audio_aug/audio_aug_20250806011108.py +140 -0
  16. neverlib/.history/dataAnalyze/__init___20250806204125.py +14 -0
  17. neverlib/.history/dataAnalyze/__init___20250806204139.py +14 -0
  18. neverlib/.history/dataAnalyze/__init___20250806204159.py +14 -0
  19. neverlib/.history/filter/__init___20250820103351.py +70 -0
  20. neverlib/.history/filter/__init___20250821102348.py +70 -0
  21. neverlib/.history/filter/__init___20250821102405.py +14 -0
  22. neverlib/.history/filter/auto_eq/__init___20250819213121.py +36 -0
  23. neverlib/.history/filter/auto_eq/__init___20250821102241.py +36 -0
  24. neverlib/.history/filter/auto_eq/__init___20250821102259.py +36 -0
  25. neverlib/.history/filter/auto_eq/__init___20250821102307.py +36 -0
  26. neverlib/.history/filter/auto_eq/__init___20250821102310.py +36 -0
  27. neverlib/.history/filter/auto_eq/__init___20250821102318.py +36 -0
  28. neverlib/.history/filter/auto_eq/__init___20250821102507.py +36 -0
  29. neverlib/{filter/AudoEQ/auto_eq_de.py → .history/filter/auto_eq/de_eq_20250820103848.py} +1 -1
  30. neverlib/.history/filter/auto_eq/de_eq_20250821102422.py +360 -0
  31. neverlib/.history/filter/auto_eq/freq_eq_20250820140732.py +75 -0
  32. neverlib/.history/filter/auto_eq/freq_eq_20250820140745.py +75 -0
  33. neverlib/.history/filter/auto_eq/freq_eq_20250820140816.py +75 -0
  34. neverlib/.history/filter/auto_eq/freq_eq_20250820140938.py +77 -0
  35. neverlib/.history/filter/auto_eq/freq_eq_20250820141003.py +77 -0
  36. neverlib/.history/filter/auto_eq/freq_eq_20250820141006.py +77 -0
  37. neverlib/.history/filter/auto_eq/freq_eq_20250820141019.py +77 -0
  38. neverlib/.history/filter/auto_eq/freq_eq_20250820141049.py +77 -0
  39. neverlib/.history/filter/auto_eq/freq_eq_20250820141211.py +77 -0
  40. neverlib/.history/filter/auto_eq/freq_eq_20250820141227.py +77 -0
  41. neverlib/.history/filter/auto_eq/freq_eq_20250820141311.py +78 -0
  42. neverlib/.history/filter/auto_eq/freq_eq_20250820141340.py +78 -0
  43. neverlib/.history/filter/auto_eq/freq_eq_20250820141712.py +78 -0
  44. neverlib/.history/filter/auto_eq/freq_eq_20250820141733.py +78 -0
  45. neverlib/.history/filter/auto_eq/freq_eq_20250820141755.py +78 -0
  46. neverlib/.history/filter/auto_eq/freq_eq_20250821102434.py +76 -0
  47. neverlib/.history/filter/auto_eq/freq_eq_20250821102500.py +76 -0
  48. neverlib/.history/filter/auto_eq/freq_eq_20250821102502.py +76 -0
  49. neverlib/{filter/AudoEQ/auto_eq_ga_basic.py → .history/filter/auto_eq/ga_eq_basic_20250820102957.py} +1 -1
  50. neverlib/.history/filter/auto_eq/ga_eq_basic_20250820113054.py +380 -0
  51. neverlib/.history/filter/auto_eq/ga_eq_basic_20250820113150.py +380 -0
  52. neverlib/.history/filter/auto_eq/ga_eq_basic_20250820113520.py +385 -0
  53. neverlib/.history/filter/auto_eq/ga_eq_basic_20250820113525.py +385 -0
  54. neverlib/.history/filter/auto_eq/ga_eq_basic_20250821102212.py +385 -0
  55. neverlib/.history/metrics/dnsmos_20250806001612.py +160 -0
  56. neverlib/.history/metrics/dnsmos_20250815180659.py +160 -0
  57. neverlib/.history/metrics/dnsmos_20250815180701.py +158 -0
  58. neverlib/.history/metrics/dnsmos_20250815181321.py +154 -0
  59. neverlib/.history/metrics/dnsmos_20250815181327.py +154 -0
  60. neverlib/.history/metrics/dnsmos_20250815181331.py +154 -0
  61. neverlib/.history/metrics/dnsmos_20250815181620.py +154 -0
  62. neverlib/.history/metrics/dnsmos_20250815181631.py +154 -0
  63. neverlib/.history/metrics/dnsmos_20250815181742.py +154 -0
  64. neverlib/.history/metrics/dnsmos_20250815181824.py +153 -0
  65. neverlib/.history/metrics/dnsmos_20250815181834.py +153 -0
  66. neverlib/.history/metrics/dnsmos_20250815181922.py +153 -0
  67. neverlib/.history/metrics/dnsmos_20250815182011.py +147 -0
  68. neverlib/.history/metrics/dnsmos_20250815182036.py +144 -0
  69. neverlib/.history/metrics/dnsmos_20250815182936.py +143 -0
  70. neverlib/.history/metrics/dnsmos_20250815182942.py +143 -0
  71. neverlib/.history/metrics/dnsmos_20250815183032.py +137 -0
  72. neverlib/.history/metrics/dnsmos_20250815183101.py +144 -0
  73. neverlib/.history/metrics/dnsmos_20250815183121.py +144 -0
  74. neverlib/.history/metrics/dnsmos_20250815183123.py +143 -0
  75. neverlib/.history/metrics/dnsmos_20250815183214.py +143 -0
  76. neverlib/.history/metrics/dnsmos_20250815183240.py +143 -0
  77. neverlib/.history/metrics/dnsmos_20250815183248.py +144 -0
  78. neverlib/.history/metrics/dnsmos_20250815183407.py +142 -0
  79. neverlib/.history/metrics/dnsmos_20250815183409.py +142 -0
  80. neverlib/.history/metrics/dnsmos_20250815183431.py +142 -0
  81. neverlib/.history/metrics/dnsmos_20250815183507.py +140 -0
  82. neverlib/.history/metrics/dnsmos_20250815183513.py +139 -0
  83. neverlib/.history/metrics/dnsmos_20250815183618.py +139 -0
  84. neverlib/.history/metrics/dnsmos_20250815183709.py +140 -0
  85. neverlib/.history/metrics/dnsmos_20250815183756.py +137 -0
  86. neverlib/.history/metrics/dnsmos_20250815183815.py +128 -0
  87. neverlib/.history/metrics/dnsmos_20250815183827.py +129 -0
  88. neverlib/.history/metrics/dnsmos_20250815183913.py +117 -0
  89. neverlib/.history/metrics/dnsmos_20250815183914.py +117 -0
  90. neverlib/.history/metrics/dnsmos_20250815184003.py +118 -0
  91. neverlib/.history/metrics/dnsmos_20250815184040.py +118 -0
  92. neverlib/.history/metrics/dnsmos_20250815184049.py +118 -0
  93. neverlib/.history/metrics/dnsmos_20250815184104.py +117 -0
  94. neverlib/.history/metrics/dnsmos_20250815184200.py +117 -0
  95. neverlib/.history/metrics/lpc_lsp_metric_20250816015944.py +128 -0
  96. neverlib/.history/metrics/lpc_lsp_metric_20250816020142.py +128 -0
  97. neverlib/.history/metrics/lpc_lsp_metric_20250816020156.py +128 -0
  98. neverlib/.history/metrics/lpc_lsp_metric_20250816020554.py +130 -0
  99. neverlib/.history/metrics/lpc_lsp_metric_20250816020600.py +125 -0
  100. neverlib/.history/metrics/lpc_lsp_metric_20250816020631.py +120 -0
  101. neverlib/.history/metrics/lpc_lsp_metric_20250816020746.py +118 -0
  102. neverlib/.history/metrics/lpc_me_20250816013111.py +0 -0
  103. neverlib/.history/metrics/lpc_me_20250816013129.py +121 -0
  104. neverlib/.history/metrics/lpc_me_20250816015430.py +103 -0
  105. neverlib/.history/metrics/lpc_me_20250816015535.py +96 -0
  106. neverlib/.history/metrics/lpc_me_20250816015542.py +96 -0
  107. neverlib/.history/metrics/lpc_me_20250816015636.py +97 -0
  108. neverlib/.history/metrics/lpc_me_20250816015658.py +104 -0
  109. neverlib/.history/metrics/lpc_me_20250816015703.py +100 -0
  110. neverlib/.history/metrics/lpc_me_20250816015945.py +128 -0
  111. neverlib/.history/metrics/snr_20250806010538.py +177 -0
  112. neverlib/.history/metrics/snr_20250806211634.py +184 -0
  113. neverlib/.history/metrics/spec_20250805234209.py +45 -0
  114. neverlib/.history/metrics/spec_20250816135530.py +11 -0
  115. neverlib/.history/metrics/spec_20250816135654.py +16 -0
  116. neverlib/.history/metrics/spec_20250816135736.py +68 -0
  117. neverlib/.history/metrics/spec_20250816135904.py +75 -0
  118. neverlib/.history/metrics/spec_20250816135921.py +82 -0
  119. neverlib/.history/metrics/spec_20250816140111.py +82 -0
  120. neverlib/.history/metrics/spec_20250816140543.py +136 -0
  121. neverlib/.history/metrics/spec_20250816140559.py +172 -0
  122. neverlib/.history/metrics/spec_20250816140602.py +172 -0
  123. neverlib/.history/metrics/spec_20250816140608.py +172 -0
  124. neverlib/.history/metrics/spec_20250816140654.py +148 -0
  125. neverlib/.history/metrics/spec_20250816140705.py +144 -0
  126. neverlib/.history/metrics/spec_20250816140755.py +138 -0
  127. neverlib/.history/metrics/spec_20250816140823.py +170 -0
  128. neverlib/.history/metrics/spec_20250816140832.py +170 -0
  129. neverlib/.history/metrics/spec_20250816140833.py +170 -0
  130. neverlib/.history/metrics/spec_20250816140922.py +147 -0
  131. neverlib/.history/metrics/spec_20250816141148.py +107 -0
  132. neverlib/.history/metrics/spec_20250816141219.py +123 -0
  133. neverlib/.history/metrics/spec_20250816141732.py +178 -0
  134. neverlib/.history/metrics/spec_20250816141740.py +178 -0
  135. neverlib/.history/metrics/spec_20250816142030.py +178 -0
  136. neverlib/.history/metrics/spec_20250816142107.py +135 -0
  137. neverlib/.history/metrics/spec_20250816142126.py +135 -0
  138. neverlib/.history/metrics/spec_20250816142410.py +135 -0
  139. neverlib/.history/metrics/spec_20250816142415.py +136 -0
  140. neverlib/.history/metrics/spec_metric_20250816135156.py +0 -0
  141. neverlib/.history/metrics/spec_metric_20250816135226.py +5 -0
  142. neverlib/.history/metrics/spec_metric_20250816135227.py +10 -0
  143. neverlib/.history/metrics/spec_metric_20250816135306.py +15 -0
  144. neverlib/.history/metrics/spec_metric_20250816135442.py +31 -0
  145. neverlib/.history/metrics/spec_metric_20250816135448.py +31 -0
  146. neverlib/.history/metrics/spec_metric_20250816135520.py +29 -0
  147. neverlib/.history/metrics/spec_metric_20250816135537.py +63 -0
  148. neverlib/.history/metrics/spec_metric_20250816135653.py +65 -0
  149. neverlib/.history/vad/PreProcess_20250805234211.py +63 -0
  150. neverlib/.history/vad/PreProcess_20250809232455.py +63 -0
  151. neverlib/.history/vad/PreProcess_20250816020725.py +66 -0
  152. neverlib/.history/vad/VAD_Silero_20250805234211.py +50 -0
  153. neverlib/.history/vad/VAD_Silero_20250809232456.py +50 -0
  154. neverlib/.history/vad/VAD_WebRTC_20250805234211.py +61 -0
  155. neverlib/.history/vad/VAD_WebRTC_20250809232456.py +61 -0
  156. neverlib/.history/vad/VAD_funasr_20250805234211.py +54 -0
  157. neverlib/.history/vad/VAD_funasr_20250809232456.py +54 -0
  158. neverlib/.history/vad/VAD_vadlib_20250805234211.py +70 -0
  159. neverlib/.history/vad/VAD_vadlib_20250809232455.py +70 -0
  160. neverlib/.history/vad/VAD_whisper_20250805234211.py +55 -0
  161. neverlib/.history/vad/VAD_whisper_20250809232456.py +55 -0
  162. neverlib/.specstory/.what-is-this.md +69 -0
  163. neverlib/.specstory/history/2025-08-05_17-06Z-/350/277/231/344/270/200/346/255/245/347/232/204/347/233/256/347/232/204/346/230/257/344/273/200/344/271/210.md +424 -0
  164. neverlib/Docs/audio_aug/test_snr.py +55 -0
  165. neverlib/audio_aug/HarmonicDistortion.py +79 -0
  166. neverlib/audio_aug/TFDrop.py +41 -0
  167. neverlib/audio_aug/TFMask.py +56 -0
  168. neverlib/audio_aug/audio_aug.py +16 -1
  169. neverlib/audio_aug/clip_aug.py +41 -0
  170. neverlib/audio_aug/coder_aug.py +209 -0
  171. neverlib/audio_aug/coder_aug2.py +118 -0
  172. neverlib/audio_aug/loss_packet_aug.py +103 -0
  173. neverlib/audio_aug/quant_aug.py +78 -0
  174. neverlib/data_analyze/__init__.py +14 -0
  175. neverlib/filter/auto_eq/__init__.py +36 -0
  176. neverlib/filter/auto_eq/de_eq.py +360 -0
  177. neverlib/filter/auto_eq/freq_eq.py +76 -0
  178. neverlib/filter/{AudoEQ/auto_eq_ga_advanced.py → auto_eq/ga_eq_advanced.py} +1 -1
  179. neverlib/filter/auto_eq/ga_eq_basic.py +385 -0
  180. neverlib/metrics/dnsmos.py +58 -101
  181. neverlib/metrics/lpc_lsp.py +118 -0
  182. neverlib/metrics/snr.py +11 -4
  183. neverlib/metrics/spec.py +136 -45
  184. neverlib/utils/utils.py +17 -14
  185. neverlib/vad/PreProcess.py +5 -2
  186. neverlib/vad/VAD_Silero.py +1 -1
  187. neverlib/vad/VAD_WebRTC.py +1 -1
  188. neverlib/vad/VAD_funasr.py +1 -1
  189. neverlib/vad/VAD_vadlib.py +1 -1
  190. neverlib/vad/VAD_whisper.py +1 -1
  191. {neverlib-0.2.3.dist-info → neverlib-0.2.4.dist-info}/METADATA +1 -1
  192. neverlib-0.2.4.dist-info/RECORD +229 -0
  193. neverlib-0.2.3.dist-info/RECORD +0 -53
  194. /neverlib/{dataAnalyze/__init__.py → .history/dataAnalyze/__init___20250805234204.py} +0 -0
  195. /neverlib/{filter/AudoEQ/auto_eq_spectral_direct.py → .history/filter/auto_eq/freq_eq_20250805234206.py} +0 -0
  196. /neverlib/{dataAnalyze → data_analyze}/README.md +0 -0
  197. /neverlib/{dataAnalyze → data_analyze}/dataset_analyzer.py +0 -0
  198. /neverlib/{dataAnalyze → data_analyze}/quality_metrics.py +0 -0
  199. /neverlib/{dataAnalyze → data_analyze}/rms_distrubution.py +0 -0
  200. /neverlib/{dataAnalyze → data_analyze}/spectral_analysis.py +0 -0
  201. /neverlib/{dataAnalyze → data_analyze}/statistics.py +0 -0
  202. /neverlib/{dataAnalyze → data_analyze}/temporal_features.py +0 -0
  203. /neverlib/{dataAnalyze → data_analyze}/visualization.py +0 -0
  204. /neverlib/filter/{AudoEQ → auto_eq}/README.md +0 -0
  205. {neverlib-0.2.3.dist-info → neverlib-0.2.4.dist-info}/WHEEL +0 -0
  206. {neverlib-0.2.3.dist-info → neverlib-0.2.4.dist-info}/licenses/LICENSE +0 -0
  207. {neverlib-0.2.3.dist-info → neverlib-0.2.4.dist-info}/top_level.txt +0 -0
@@ -0,0 +1,70 @@
1
+ # -*- coding:utf-8 -*-
2
+ # Author:凌逆战 | Never
3
+ # Date: 2024/9/19
4
+ """
5
+ 基于能量的VAD
6
+ """
7
+ import numpy as np
8
+
9
+
10
+ class Vadlib_C():
11
+ def __init__(self, sr=16000, frame_length=20, frame_shift=20,
12
+ energy_threshold=0.05, pre_emphasis=0.95):
13
+ """
14
+ :param sr: 采样率
15
+ :param frame_length: 帧长(ms)
16
+ :param frame_shift: 帧移(ms)
17
+ :param energy_threshold: 能量阈值
18
+ :param pre_emphasis: 预加重系数
19
+ """
20
+ from vad import EnergyVAD
21
+ self.sr = sr
22
+ self.vad = EnergyVAD(
23
+ sample_rate=sr,
24
+ frame_length=frame_length,
25
+ frame_shift=frame_shift,
26
+ energy_threshold=energy_threshold,
27
+ pre_emphasis=pre_emphasis,
28
+ )
29
+ self.frame_length = frame_length
30
+
31
+ def process(self, wav):
32
+ assert wav.ndim == 1, f"wav shape为{wav.shape}, 期望1D"
33
+ # 返回布尔阵列, 指示框架是否是语音
34
+ voice_activity = self.vad(wav) # (115,) [1,1,0,0,1,,1,0,0....]
35
+
36
+ window_len = int(self.frame_length / 1000 * self.sr)
37
+ vad_array = np.zeros_like(wav)
38
+ for i in range(len(voice_activity)):
39
+ if voice_activity[i]:
40
+ vad_array[i * window_len: (i + 1) * window_len] = 1
41
+ return vad_array
42
+
43
+
44
+ if __name__ == "__main__":
45
+ import soundfile as sf
46
+ import matplotlib.pyplot as plt
47
+ from neverlib.vad.PreProcess import HPFilter, volume_norm
48
+
49
+ sr = 16000
50
+ wav_path = "../../data/vad_example.wav"
51
+ wav, wav_sr = sf.read(wav_path, always_2d=False, dtype="float32")
52
+ assert wav_sr == sr, f"音频采样率为{wav_sr}, 期望{sr}"
53
+ wav = HPFilter(wav, sr=sr, order=6, cutoff=100)
54
+ wav = volume_norm(wav)
55
+
56
+ vad = Vadlib_C()
57
+ vad_array = vad.process(wav)
58
+
59
+ plt.figure(figsize=(20, 5))
60
+ plt.plot(wav)
61
+ plt.plot(vad_array)
62
+ plt.grid()
63
+ plt.show()
64
+
65
+ plt.figure(figsize=(20, 5))
66
+ plt.subplot(2, 1, 1)
67
+ plt.specgram(wav, Fs=sr, scale_by_freq=True, sides='default', cmap="jet")
68
+ plt.subplot(2, 1, 2)
69
+ plt.specgram(vad_array, Fs=sr, scale_by_freq=True, sides='default', cmap="jet")
70
+ plt.show()
@@ -0,0 +1,70 @@
1
+ # -*- coding:utf-8 -*-
2
+ # Author:凌逆战 | Never
3
+ # Date: 2024/9/19
4
+ """
5
+ 基于能量的VAD
6
+ """
7
+ import numpy as np
8
+
9
+
10
+ class Vadlib_C():
11
+ def __init__(self, sr=16000, frame_length=20, frame_shift=20,
12
+ energy_threshold=0.05, pre_emphasis=0.95):
13
+ """
14
+ :param sr: 采样率
15
+ :param frame_length: 帧长(ms)
16
+ :param frame_shift: 帧移(ms)
17
+ :param energy_threshold: 能量阈值
18
+ :param pre_emphasis: 预加重系数
19
+ """
20
+ from vad import EnergyVAD
21
+ self.sr = sr
22
+ self.vad = EnergyVAD(
23
+ sample_rate=sr,
24
+ frame_length=frame_length,
25
+ frame_shift=frame_shift,
26
+ energy_threshold=energy_threshold,
27
+ pre_emphasis=pre_emphasis,
28
+ )
29
+ self.frame_length = frame_length
30
+
31
+ def process(self, wav):
32
+ assert wav.ndim == 1, f"wav shape为{wav.shape}, 期望1D"
33
+ # 返回布尔阵列, 指示框架是否是语音
34
+ voice_activity = self.vad(wav) # (115,) [1,1,0,0,1,,1,0,0....]
35
+
36
+ window_len = int(self.frame_length / 1000 * self.sr)
37
+ vad_array = np.zeros_like(wav)
38
+ for i in range(len(voice_activity)):
39
+ if voice_activity[i]:
40
+ vad_array[i * window_len: (i + 1) * window_len] = 1
41
+ return vad_array
42
+
43
+
44
+ if __name__ == "__main__":
45
+ import soundfile as sf
46
+ import matplotlib.pyplot as plt
47
+ from neverlib.vad.PreProcess import HPFilter, volume_norm
48
+
49
+ sr = 16000
50
+ wav_path = "../../data/vad_example.wav"
51
+ wav, wav_sr = sf.read(wav_path, always_2d=False, dtype="float32")
52
+ assert wav_sr == sr, f"音频采样率为{wav_sr}, 期望{sr}"
53
+ wav = HPFilter(wav, sr=sr, order=6, cutoff=100)
54
+ wav = volume_norm(wav)
55
+
56
+ vad = Vadlib_C()
57
+ vad_array = vad.process(wav)
58
+
59
+ plt.figure(figsize=(20, 5))
60
+ plt.plot(wav)
61
+ plt.plot(vad_array)
62
+ plt.grid()
63
+ plt.show()
64
+
65
+ plt.figure(figsize=(20, 5))
66
+ plt.subplot(2, 1, 1)
67
+ plt.specgram(wav, Fs=sr, scale_by_freq=True, sides='default', cmap="jet")
68
+ plt.subplot(2, 1, 2)
69
+ plt.specgram(vad_array, Fs=sr, scale_by_freq=True, sides='default', cmap="jet")
70
+ plt.show()
@@ -0,0 +1,55 @@
1
+ # -*- coding:utf-8 -*-
2
+ # Author:凌逆战 | Never
3
+ # Date: 2024/9/19
4
+ """
5
+
6
+ """
7
+ import numpy as np
8
+
9
+
10
+ class Whisper_VAD_C():
11
+ def __init__(self, sr=16000, mode="base"):
12
+ """
13
+ :param mode: "base"、"large-v3"
14
+ """
15
+ import whisper
16
+ self.sr=16000
17
+ self.model = whisper.load_model(mode)
18
+
19
+ def process(self, wav):
20
+ assert wav.ndim == 1, f"wav shape为{wav.shape}, 期望1D"
21
+ result = self.model.transcribe(wav, word_timestamps=True)
22
+
23
+ timestamps = []
24
+ for segment in result['segments']:
25
+ # print(f"Segment: {segment['text']}")
26
+ # 句级别时间戳
27
+ # start_time, end_time = segment['start'], segment['end']
28
+ # print(f"Start: {start_time:.3f}s, End: {end_time:.3f}s") # Start: 0.00s, End: 2.80s
29
+ # 词级别时间戳
30
+ for word_info in segment['words']:
31
+ # word = word_info['word']
32
+ start_time = word_info['start']
33
+ end_time = word_info['end']
34
+ timestamps.append({"start": int(start_time * self.sr), "end": int(end_time * self.sr)})
35
+ # print(f"Word: {word}, Start: {start_time:.2f}s, End: {end_time:.2f}s")
36
+ return timestamps
37
+
38
+
39
+
40
+ if __name__ == "__main__":
41
+ import soundfile as sf
42
+ import matplotlib.pyplot as plt
43
+ from neverlib.vad.PreProcess import HPFilter, volume_norm
44
+
45
+ sr = 16000
46
+ wav_path = "../../data/vad_example.wav"
47
+ wav, wav_sr = sf.read(wav_path, always_2d=False, dtype="float32")
48
+ assert wav_sr == sr, f"音频采样率为{wav_sr}, 期望{sr}"
49
+ wav = HPFilter(wav, sr=sr, order=6, cutoff=100)
50
+ wav = volume_norm(wav)
51
+
52
+ vad = Whisper_VAD_C()
53
+ timestamps = vad.process(wav)
54
+
55
+
@@ -0,0 +1,55 @@
1
+ # -*- coding:utf-8 -*-
2
+ # Author:凌逆战 | Never
3
+ # Date: 2024/9/19
4
+ """
5
+
6
+ """
7
+ import numpy as np
8
+
9
+
10
+ class Whisper_VAD_C():
11
+ def __init__(self, sr=16000, mode="base"):
12
+ """
13
+ :param mode: "base"、"large-v3"
14
+ """
15
+ import whisper
16
+ self.sr=16000
17
+ self.model = whisper.load_model(mode)
18
+
19
+ def process(self, wav):
20
+ assert wav.ndim == 1, f"wav shape为{wav.shape}, 期望1D"
21
+ result = self.model.transcribe(wav, word_timestamps=True)
22
+
23
+ timestamps = []
24
+ for segment in result['segments']:
25
+ # print(f"Segment: {segment['text']}")
26
+ # 句级别时间戳
27
+ # start_time, end_time = segment['start'], segment['end']
28
+ # print(f"Start: {start_time:.3f}s, End: {end_time:.3f}s") # Start: 0.00s, End: 2.80s
29
+ # 词级别时间戳
30
+ for word_info in segment['words']:
31
+ # word = word_info['word']
32
+ start_time = word_info['start']
33
+ end_time = word_info['end']
34
+ timestamps.append({"start": int(start_time * self.sr), "end": int(end_time * self.sr)})
35
+ # print(f"Word: {word}, Start: {start_time:.2f}s, End: {end_time:.2f}s")
36
+ return timestamps
37
+
38
+
39
+
40
+ if __name__ == "__main__":
41
+ import soundfile as sf
42
+ import matplotlib.pyplot as plt
43
+ from neverlib.vad.PreProcess import HPFilter, volume_norm
44
+
45
+ sr = 16000
46
+ wav_path = "../../data/vad_example.wav"
47
+ wav, wav_sr = sf.read(wav_path, always_2d=False, dtype="float32")
48
+ assert wav_sr == sr, f"音频采样率为{wav_sr}, 期望{sr}"
49
+ wav = HPFilter(wav, sr=sr, order=6, cutoff=100)
50
+ wav = volume_norm(wav)
51
+
52
+ vad = Whisper_VAD_C()
53
+ timestamps = vad.process(wav)
54
+
55
+
@@ -0,0 +1,69 @@
1
+ # SpecStory Artifacts Directory
2
+
3
+ This directory is automatically created and maintained by the SpecStory extension to preserve your AI chat history.
4
+
5
+ ## What's Here?
6
+
7
+ - `.specstory/history`: Contains auto-saved markdown files of your AI coding sessions
8
+ - Each file represents a separate AI chat session
9
+ - If you enable auto-save, files are automatically updated as you work
10
+ - You can enable/disable the auto-save feature in the SpecStory settings, it is disabled by default
11
+ - `.specstory/.project.json`: Contains the persistent project identity for the current workspace
12
+ - This file is only present if you enable AI rules derivation
13
+ - This is used to provide consistent project identity of your project, even as the workspace is moved or renamed
14
+ - `.specstory/ai_rules_backups`: Contains backups of the `.cursor/rules/derived-cursor-rules.mdc` or the `.github/copilot-instructions.md` file
15
+ - Backups are automatically created each time the `.cursor/rules/derived-cursor-rules.mdc` or the `.github/copilot-instructions.md` file is updated
16
+ - You can enable/disable the AI Rules derivation feature in the SpecStory settings, it is disabled by default
17
+ - `.specstory/.gitignore`: Contains directives to exclude non-essential contents of the `.specstory` directory from version control
18
+ - Add `/history` to exclude the auto-saved chat history from version control
19
+
20
+ ## Valuable Uses
21
+
22
+ - Capture: Keep your context window up-to-date when starting new Chat/Composer sessions via @ references
23
+ - Search: For previous prompts and code snippets
24
+ - Learn: Meta-analyze your patterns and learn from your past experiences
25
+ - Derive: Keep the AI on course with your past decisions by automatically deriving rules from your AI interactions
26
+
27
+ ## Version Control
28
+
29
+ We recommend keeping this directory under version control to maintain a history of your AI interactions. However, if you prefer not to version these files, you can exclude them by adding this to your `.gitignore`:
30
+
31
+ ```
32
+ .specstory/**
33
+ ```
34
+
35
+ We recommend __not__ keeping the `.specstory/ai_rules_backups` directory under version control if you are already using git to version your AI rules, and committing regularly. You can exclude it by adding this to your `.gitignore`:
36
+
37
+ ```
38
+ .specstory/ai_rules_backups
39
+ ```
40
+
41
+ ## Searching Your Codebase
42
+
43
+ When searching your codebase, search results may include your previous AI coding interactions. To focus solely on your actual code files, you can exclude the AI interaction history from search results.
44
+
45
+ To exclude AI interaction history:
46
+
47
+ 1. Open the "Find in Files" search in Cursor or VSCode (Cmd/Ctrl + Shift + F)
48
+ 2. Navigate to the "files to exclude" section
49
+ 3. Add the following pattern:
50
+
51
+ ```
52
+ .specstory/*
53
+ ```
54
+
55
+ This will ensure your searches only return results from your working codebase files.
56
+
57
+ ## Notes
58
+
59
+ - Auto-save only works when Cursor or VSCode flushes sqlite database data to disk. This results in a small delay after the AI response is complete before SpecStory can save the history.
60
+
61
+ ## Settings
62
+
63
+ You can control auto-saving behavior in Cursor or VSCode:
64
+
65
+ 1. Open Cursor/Code → Settings → VS Code Settings (Cmd/Ctrl + ,)
66
+ 2. Search for "SpecStory"
67
+ 3. Find "Auto Save" setting to enable/disable
68
+
69
+ Auto-save occurs when changes are detected in the sqlite database, or every 2 minutes as a safety net.