PyPI - neverlib - Versions diffs - 0.2.8__py3-none-any.whl → 0.3.0__py3-none-any.whl - Mend

neverlib 0.2.8 (py3-none-any.whl) → 0.3.0 (py3-none-any.whl)

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (466) hide show

neverlib/Docs/audio_aug/test_volume.ipynb +8 -8
neverlib/Docs/filter/biquad.ipynb +1 -1
neverlib/Docs/filter/filter_family.ipynb +4 -4
neverlib/Docs/vad/VAD_WebRTC.ipynb +4 -4
neverlib/Docs/vad/VAD_whisper.ipynb +2 -2
neverlib/LLM/__init__.py +37 -0
neverlib/LLM/bailian.py +342 -0
neverlib/LLM/image.py +73 -0
neverlib/LLM/text.py +32 -0
neverlib/QA/ImpactNoiseRejection.py +119 -0
neverlib/QA/gen_init.py +13 -16
neverlib/__init__.py +5 -5
neverlib/audio_aug/HarmonicDistortion.py +11 -11
neverlib/audio_aug/README.md +3 -0
neverlib/audio_aug/__init__.py +2 -2
neverlib/audio_aug/audio_aug.py +18 -18
neverlib/audio_aug/coder_aug.py +25 -25
neverlib/audio_aug/coder_aug2.py +10 -10
neverlib/audio_aug/loss_packet_aug.py +16 -16
neverlib/audio_aug/quant_aug.py +7 -7
neverlib/data_analyze/README.md +1 -1
neverlib/data_analyze/__init__.py +2 -2
neverlib/data_analyze/dataset_analyzer.py +2 -2
neverlib/data_analyze/quality_metrics.py +12 -12
neverlib/data_analyze/statistics.py +1 -1
neverlib/data_analyze/visualization.py +1 -1
neverlib/filter/README.md +3 -3
neverlib/filter/__init__.py +2 -2
neverlib/filter/auto_eq/README.md +2 -2
neverlib/filter/auto_eq/__init__.py +2 -2
neverlib/filter/auto_eq/de_eq.py +1 -1
neverlib/filter/auto_eq/ga_eq_advanced.py +2 -2
neverlib/filter/auto_eq/ga_eq_basic.py +1 -1
neverlib/filter/biquad.py +1 -1
neverlib/filter/core.py +8 -5
neverlib/metrics/README.md +35 -0
neverlib/metrics/__init__.py +2 -2
neverlib/metrics/dnsmos.py +2 -2
neverlib/metrics/lpc_lsp.py +8 -8
neverlib/metrics/pesq_c/PESQ +0 -0
neverlib/metrics/snr.py +5 -5
neverlib/metrics/spec.py +23 -23
neverlib/metrics/test_pesq.py +3 -3
neverlib/signal_gen/babble_noise_generate.py +113 -0
neverlib/tests/__init__.py +2 -2
neverlib/tests/test_imports.py +1 -1
neverlib/utils/README.md +29 -0
neverlib/utils/__init__.py +24 -16
neverlib/utils/audio_split.py +21 -21
neverlib/utils/checkGPU.py +52 -79
neverlib/utils/floder.py +115 -0
neverlib/utils/lazy_expose.py +1 -1
neverlib/utils/lazy_module.py +6 -6
neverlib/utils/message.py +2 -3
neverlib/utils/pcm.py +42 -0
neverlib/utils/utils.py +108 -91
neverlib/vad/README.md +5 -5
neverlib/vad/__init__.py +2 -2
neverlib/vad/utils.py +1 -1
{neverlib-0.2.8.dist-info → neverlib-0.3.0.dist-info}/METADATA +17 -3
neverlib-0.3.0.dist-info/RECORD +120 -0
neverlib/.claude/settings.local.json +0 -9
neverlib/.history/Docs/audio_aug/del_20250827162530.py +0 -0
neverlib/.history/Docs/audio_aug/del_20250827162540.py +0 -2
neverlib/.history/Docs/audio_aug/del_20250827162541.py +0 -7
neverlib/.history/Docs/audio_aug/del_20250827162606.py +0 -7
neverlib/.history/Docs/audio_aug/del_20250827162637.py +0 -8
neverlib/.history/Docs/audio_aug/del_20250827162645.py +0 -8
neverlib/.history/Docs/audio_aug/del_20250827162723.py +0 -9
neverlib/.history/Docs/audio_aug/del_20250827162739.py +0 -9
neverlib/.history/Docs/audio_aug/test_snr_20250806011311.py +0 -0
neverlib/.history/Docs/audio_aug/test_snr_20250806011331.py +0 -75
neverlib/.history/Docs/audio_aug/test_snr_20250806011342.py +0 -57
neverlib/.history/Docs/audio_aug/test_snr_20250806011352.py +0 -57
neverlib/.history/Docs/audio_aug/test_snr_20250806011403.py +0 -57
neverlib/.history/Docs/audio_aug/test_snr_20250806011413.py +0 -57
neverlib/.history/Docs/audio_aug/test_snr_20250806011435.py +0 -55
neverlib/.history/Docs/audio_aug/test_snr_20250827161751.py +0 -55
neverlib/.history/Docs/audio_aug/test_snr_20250827161754.py +0 -55
neverlib/.history/Docs/audio_aug/test_snr_20250827161833.py +0 -54
neverlib/.history/Docs/audio_aug/test_snr_20250827162017.py +0 -56
neverlib/.history/Docs/audio_aug/test_snr_20250827162021.py +0 -57
neverlib/.history/Docs/audio_aug/test_snr_20250827162028.py +0 -57
neverlib/.history/Docs/audio_aug/test_snr_20250827162033.py +0 -55
neverlib/.history/Docs/audio_aug_test/del_20250827162738.py +0 -9
neverlib/.history/Docs/audio_aug_test/del_20250827162819.py +0 -9
neverlib/.history/Docs/audio_aug_test/del_20250827162830.py +0 -9
neverlib/.history/Docs/audio_aug_test/del_20250827162846.py +0 -9
neverlib/.history/Docs/audio_aug_test/del_20250827162851.py +0 -9
neverlib/.history/Docs/audio_aug_test/del_20250827162903.py +0 -10
neverlib/.history/Docs/audio_aug_test/del_20250827162921.py +0 -10
neverlib/.history/Docs/audio_aug_test/del_20250827162926.py +0 -10
neverlib/.history/Docs/audio_aug_test/del_20250827163030.py +0 -10
neverlib/.history/Docs/audio_aug_test/del_20250827163032.py +0 -10
neverlib/.history/Docs/vad/1_20250810032405.py +0 -0
neverlib/.history/Docs/vad/1_20250810032417.py +0 -39
neverlib/.history/QA/html2markdown_20250822234112.md +0 -0
neverlib/.history/QA/html2markdown_20250822234140.py +0 -9
neverlib/.history/QA/html2markdown_20250822234141.md +0 -9
neverlib/.history/QA/html2markdown_20250822234159.py +0 -12
neverlib/.history/QA/html2markdown_20250822234200.py +0 -17
neverlib/.history/QA/html2markdown_20250822234236.py +0 -17
neverlib/.history/QA/html2markdown_20250822234340.py +0 -14
neverlib/.history/QA/html2markdown_20250822234522.py +0 -18
neverlib/.history/QA/html2markdown_20250822234601.py +0 -20
neverlib/.history/QA/html2markdown_20250822234615.py +0 -22
neverlib/.history/QA/html2markdown_20250822234715.py +0 -28
neverlib/.history/QA/html2markdown_20250822234720.py +0 -27
neverlib/.history/QA/html2markdown_20250822234903.py +0 -27
neverlib/.history/__init___20250805234212.py +0 -41
neverlib/.history/__init___20250904102635.py +0 -39
neverlib/.history/__init___20250904102836.py +0 -34
neverlib/.history/__init___20250904102838.py +0 -39
neverlib/.history/__init___20250904102851.py +0 -33
neverlib/.history/audio_aug/audio_aug_20250806010451.py +0 -125
neverlib/.history/audio_aug/audio_aug_20250806010750.py +0 -138
neverlib/.history/audio_aug/audio_aug_20250806010759.py +0 -140
neverlib/.history/audio_aug/audio_aug_20250806010803.py +0 -140
neverlib/.history/audio_aug/audio_aug_20250806010809.py +0 -140
neverlib/.history/audio_aug/audio_aug_20250806011108.py +0 -140
neverlib/.history/audio_aug/audio_aug_20250826155913.py +0 -158
neverlib/.history/audio_aug/audio_aug_20250826164159.py +0 -159
neverlib/.history/audio_aug/audio_aug_20250826164217.py +0 -160
neverlib/.history/audio_aug/audio_aug_20250826164408.py +0 -161
neverlib/.history/audio_aug/audio_aug_20250826164423.py +0 -161
neverlib/.history/audio_aug/audio_aug_20250826164529.py +0 -161
neverlib/.history/audio_aug/audio_aug_20250826164824.py +0 -161
neverlib/.history/audio_aug/audio_aug_20250826164932.py +0 -162
neverlib/.history/audio_aug/audio_aug_20250826164947.py +0 -162
neverlib/.history/audio_aug/audio_aug_20250826165403.py +0 -162
neverlib/.history/audio_aug/audio_aug_20250826165421.py +0 -162
neverlib/.history/audio_aug/audio_aug_20250826165509.py +0 -163
neverlib/.history/audio_aug/audio_aug_20250826165702.py +0 -163
neverlib/.history/audio_aug/audio_aug_20250826165732.py +0 -165
neverlib/.history/audio_aug/audio_aug_20250826170041.py +0 -163
neverlib/.history/audio_aug/audio_aug_20250826170105.py +0 -164
neverlib/.history/audio_aug/audio_aug_20250826170154.py +0 -164
neverlib/.history/audio_aug/audio_aug_20250826170220.py +0 -165
neverlib/.history/audio_aug/audio_aug_20250826170221.py +0 -165
neverlib/.history/audio_aug/audio_aug_20250826170228.py +0 -165
neverlib/.history/audio_aug/audio_aug_20250826170231.py +0 -165
neverlib/.history/audio_aug/audio_aug_20250826212001.py +0 -165
neverlib/.history/audio_aug/audio_aug_20250826220038.py +0 -165
neverlib/.history/audio_aug/audio_aug_20250826220133.py +0 -165
neverlib/.history/audio_aug/audio_aug_20250826220148.py +0 -165
neverlib/.history/audio_aug/audio_aug_20250826220154.py +0 -165
neverlib/.history/audio_aug/audio_aug_20250826220156.py +0 -165
neverlib/.history/audio_aug/audio_aug_20250826220314.py +0 -165
neverlib/.history/audio_aug/audio_aug_20250826220343.py +0 -184
neverlib/.history/audio_aug/audio_aug_20250826220345.py +0 -184
neverlib/.history/audio_aug/audio_aug_20250826220349.py +0 -184
neverlib/.history/audio_aug/audio_aug_20250826220429.py +0 -184
neverlib/.history/audio_aug/audio_aug_20250826220447.py +0 -184
neverlib/.history/audio_aug/audio_aug_20250826220601.py +0 -186
neverlib/.history/audio_aug/audio_aug_20250826220638.py +0 -186
neverlib/.history/audio_aug/audio_aug_20250826220641.py +0 -186
neverlib/.history/audio_aug/audio_aug_20250826220647.py +0 -186
neverlib/.history/audio_aug/audio_aug_20250826220653.py +0 -186
neverlib/.history/audio_aug/audio_aug_20250826220655.py +0 -186
neverlib/.history/audio_aug/audio_aug_20250826220731.py +0 -185
neverlib/.history/audio_aug/audio_aug_20250826220739.py +0 -185
neverlib/.history/audio_aug/audio_aug_20250826220747.py +0 -185
neverlib/.history/audio_aug/audio_aug_20250826220801.py +0 -186
neverlib/.history/audio_aug/audio_aug_20250826220822.py +0 -186
neverlib/.history/audio_aug/audio_aug_20250826220901.py +0 -186
neverlib/.history/audio_aug/audio_aug_20250826221107.py +0 -187
neverlib/.history/audio_aug/audio_aug_20250826221310.py +0 -188
neverlib/.history/audio_aug/audio_aug_20250826221353.py +0 -191
neverlib/.history/audio_aug/audio_aug_20250826221821.py +0 -191
neverlib/.history/audio_aug/audio_aug_20250826221838.py +0 -191
neverlib/.history/audio_aug/audio_aug_20250826221906.py +0 -191
neverlib/.history/audio_aug/audio_aug_20250826221930.py +0 -191
neverlib/.history/audio_aug/audio_aug_20250826221939.py +0 -191
neverlib/.history/audio_aug/audio_aug_20250826221955.py +0 -191
neverlib/.history/audio_aug/audio_aug_20250826222008.py +0 -197
neverlib/.history/audio_aug/audio_aug_20250826222017.py +0 -200
neverlib/.history/audio_aug/audio_aug_20250826222046.py +0 -203
neverlib/.history/audio_aug/audio_aug_20250826222105.py +0 -203
neverlib/.history/audio_aug/audio_aug_20250826222206.py +0 -203
neverlib/.history/audio_aug/audio_aug_20250826222302.py +0 -203
neverlib/.history/audio_aug/audio_aug_20250826222336.py +0 -203
neverlib/.history/audio_aug/audio_aug_20250826222455.py +0 -204
neverlib/.history/audio_aug/audio_aug_20250826222526.py +0 -204
neverlib/.history/audio_aug/audio_aug_20250826222541.py +0 -204
neverlib/.history/audio_aug/audio_aug_20250826222624.py +0 -202
neverlib/.history/audio_aug/audio_aug_20250826222714.py +0 -205
neverlib/.history/audio_aug/audio_aug_20250826222820.py +0 -205
neverlib/.history/audio_aug/audio_aug_20250826222827.py +0 -205
neverlib/.history/audio_aug/audio_aug_20250826222927.py +0 -232
neverlib/.history/audio_aug/audio_aug_20250826223009.py +0 -232
neverlib/.history/audio_aug/audio_aug_20250826223054.py +0 -232
neverlib/.history/audio_aug/audio_aug_20250826223225.py +0 -233
neverlib/.history/audio_aug/audio_aug_20250826223344.py +0 -236
neverlib/.history/audio_aug/audio_aug_20250826223356.py +0 -236
neverlib/.history/audio_aug/audio_aug_20250826223955.py +0 -242
neverlib/.history/audio_aug/audio_aug_20250826224210.py +0 -240
neverlib/.history/audio_aug/audio_aug_20250826224250.py +0 -242
neverlib/.history/audio_aug/audio_aug_20250826224323.py +0 -280
neverlib/.history/audio_aug/audio_aug_20250826224452.py +0 -263
neverlib/.history/audio_aug/audio_aug_20250826224455.py +0 -263
neverlib/.history/audio_aug/audio_aug_20250826224502.py +0 -263
neverlib/.history/audio_aug/audio_aug_20250826224528.py +0 -263
neverlib/.history/audio_aug/audio_aug_20250826224658.py +0 -263
neverlib/.history/audio_aug/audio_aug_20250826224833.py +0 -264
neverlib/.history/audio_aug/audio_aug_20250826225013.py +0 -269
neverlib/.history/audio_aug/audio_aug_20250826225050.py +0 -269
neverlib/.history/audio_aug/audio_aug_20250826225241.py +0 -268
neverlib/.history/audio_aug/audio_aug_20250826225315.py +0 -266
neverlib/.history/audio_aug/audio_aug_20250826225404.py +0 -266
neverlib/.history/audio_aug/audio_aug_20250826225502.py +0 -265
neverlib/.history/audio_aug/audio_aug_20250826225950.py +0 -267
neverlib/.history/audio_aug/audio_aug_20250826225959.py +0 -268
neverlib/.history/audio_aug/audio_aug_20250826230222.py +0 -271
neverlib/.history/audio_aug/audio_aug_20250826230248.py +0 -270
neverlib/.history/audio_aug/audio_aug_20250826230638.py +0 -266
neverlib/.history/audio_aug/audio_aug_20250826230755.py +0 -266
neverlib/.history/audio_aug/audio_aug_20250826230941.py +0 -265
neverlib/.history/audio_aug/audio_aug_20250826231054.py +0 -266
neverlib/.history/audio_aug/audio_aug_20250826231117.py +0 -266
neverlib/.history/audio_aug/audio_aug_20250826231219.py +0 -266
neverlib/.history/audio_aug/audio_aug_20250826232330.py +0 -266
neverlib/.history/audio_aug/audio_aug_20250826232352.py +0 -266
neverlib/.history/audio_aug/audio_aug_20250827152748.py +0 -268
neverlib/.history/audio_aug/audio_aug_20250827152806.py +0 -268
neverlib/.history/audio_aug/audio_aug_20250827152808.py +0 -268
neverlib/.history/audio_aug/audio_aug_20250827152917.py +0 -283
neverlib/.history/audio_aug/audio_aug_20250827152929.py +0 -281
neverlib/.history/audio_aug/audio_aug_20250827153100.py +0 -286
neverlib/.history/audio_aug/audio_aug_20250827153102.py +0 -286
neverlib/.history/audio_aug/audio_aug_20250827153301.py +0 -295
neverlib/.history/audio_aug/audio_aug_20250827153331.py +0 -298
neverlib/.history/audio_aug/audio_aug_20250827153525.py +0 -303
neverlib/.history/audio_aug/audio_aug_20250827153533.py +0 -304
neverlib/.history/audio_aug/audio_aug_20250827153541.py +0 -321
neverlib/.history/audio_aug/audio_aug_20250827153805.py +0 -322
neverlib/.history/audio_aug/audio_aug_20250827153832.py +0 -323
neverlib/.history/audio_aug/audio_aug_20250827153836.py +0 -324
neverlib/.history/audio_aug/audio_aug_20250827153846.py +0 -324
neverlib/.history/audio_aug/audio_aug_20250827153859.py +0 -325
neverlib/.history/audio_aug/audio_aug_20250827154453.py +0 -337
neverlib/.history/audio_aug/audio_aug_20250827154513.py +0 -355
neverlib/.history/audio_aug/audio_aug_20250827154538.py +0 -356
neverlib/.history/audio_aug/audio_aug_20250827154541.py +0 -357
neverlib/.history/audio_aug/audio_aug_20250827154612.py +0 -357
neverlib/.history/audio_aug/audio_aug_20250827154657.py +0 -360
neverlib/.history/audio_aug/audio_aug_20250827154708.py +0 -360
neverlib/.history/audio_aug/audio_aug_20250827154728.py +0 -366
neverlib/.history/audio_aug/audio_aug_20250827154755.py +0 -367
neverlib/.history/audio_aug/audio_aug_20250827154800.py +0 -367
neverlib/.history/audio_aug/audio_aug_20250827154917.py +0 -368
neverlib/.history/audio_aug/audio_aug_20250827154928.py +0 -369
neverlib/.history/audio_aug/audio_aug_20250827154932.py +0 -370
neverlib/.history/audio_aug/audio_aug_20250827154947.py +0 -372
neverlib/.history/audio_aug/audio_aug_20250827155015.py +0 -375
neverlib/.history/audio_aug/audio_aug_20250827155106.py +0 -375
neverlib/.history/audio_aug/audio_aug_20250827155114.py +0 -393
neverlib/.history/audio_aug/audio_aug_20250827155207.py +0 -415
neverlib/.history/audio_aug/audio_aug_20250827155300.py +0 -415
neverlib/.history/audio_aug/audio_aug_20250827155321.py +0 -471
neverlib/.history/audio_aug/audio_aug_20250827164703.py +0 -471
neverlib/.history/audio_aug/audio_aug_20250827164749.py +0 -471
neverlib/.history/audio_aug/audio_aug_20250827165252.py +0 -472
neverlib/.history/audio_aug/audio_aug_20250827165334.py +0 -472
neverlib/.history/audio_aug/audio_aug_20250827165404.py +0 -473
neverlib/.history/audio_aug/audio_aug_20250827165610.py +0 -473
neverlib/.history/audio_aug/audio_aug_20250827165805.py +0 -473
neverlib/.history/audio_aug/audio_aug_20250827170056.py +0 -473
neverlib/.history/audio_aug/audio_aug_20250827170106.py +0 -472
neverlib/.history/audio_aug/audio_aug_20250827170143.py +0 -472
neverlib/.history/audio_aug/audio_aug_20250827170216.py +0 -472
neverlib/.history/audio_aug/audio_aug_20250827170218.py +0 -472
neverlib/.history/audio_aug/audio_aug_20250827170314.py +0 -472
neverlib/.history/audio_aug/audio_aug_20250827171500.py +0 -471
neverlib/.history/audio_aug/audio_aug_20250827172347.py +0 -471
neverlib/.history/audio_aug/audio_aug_20250827172558.py +0 -470
neverlib/.history/audio_aug/audio_aug_20250827172559.py +0 -470
neverlib/.history/audio_aug/audio_aug_20250827172801.py +0 -470
neverlib/.history/audio_aug/audio_aug_20250827182522.py +0 -470
neverlib/.history/audio_aug/audio_aug_20250827182526.py +0 -470
neverlib/.history/audio_aug/audio_aug_20250827182626.py +0 -470
neverlib/.history/audio_aug/audio_aug_20250827182715.py +0 -470
neverlib/.history/audio_aug/audio_aug_20250904185444.py +0 -470
neverlib/.history/audio_aug/audio_aug_20250904185538.py +0 -445
neverlib/.history/dataAnalyze/__init___20250805234204.py +0 -87
neverlib/.history/dataAnalyze/__init___20250806204125.py +0 -14
neverlib/.history/dataAnalyze/__init___20250806204139.py +0 -14
neverlib/.history/dataAnalyze/__init___20250806204159.py +0 -14
neverlib/.history/data_analyze/__init___20250806204158.py +0 -14
neverlib/.history/data_analyze/__init___20250827163248.py +0 -14
neverlib/.history/filter/__init___20250820103351.py +0 -70
neverlib/.history/filter/__init___20250821102348.py +0 -70
neverlib/.history/filter/__init___20250821102405.py +0 -14
neverlib/.history/filter/auto_eq/__init___20250819213121.py +0 -36
neverlib/.history/filter/auto_eq/__init___20250821102241.py +0 -36
neverlib/.history/filter/auto_eq/__init___20250821102259.py +0 -36
neverlib/.history/filter/auto_eq/__init___20250821102307.py +0 -36
neverlib/.history/filter/auto_eq/__init___20250821102310.py +0 -36
neverlib/.history/filter/auto_eq/__init___20250821102318.py +0 -36
neverlib/.history/filter/auto_eq/__init___20250821102507.py +0 -36
neverlib/.history/filter/auto_eq/de_eq_20250820103848.py +0 -361
neverlib/.history/filter/auto_eq/de_eq_20250821102422.py +0 -360
neverlib/.history/filter/auto_eq/freq_eq_20250805234206.py +0 -75
neverlib/.history/filter/auto_eq/freq_eq_20250820140732.py +0 -75
neverlib/.history/filter/auto_eq/freq_eq_20250820140745.py +0 -75
neverlib/.history/filter/auto_eq/freq_eq_20250820140816.py +0 -75
neverlib/.history/filter/auto_eq/freq_eq_20250820140938.py +0 -77
neverlib/.history/filter/auto_eq/freq_eq_20250820141003.py +0 -77
neverlib/.history/filter/auto_eq/freq_eq_20250820141006.py +0 -77
neverlib/.history/filter/auto_eq/freq_eq_20250820141019.py +0 -77
neverlib/.history/filter/auto_eq/freq_eq_20250820141049.py +0 -77
neverlib/.history/filter/auto_eq/freq_eq_20250820141211.py +0 -77
neverlib/.history/filter/auto_eq/freq_eq_20250820141227.py +0 -77
neverlib/.history/filter/auto_eq/freq_eq_20250820141311.py +0 -78
neverlib/.history/filter/auto_eq/freq_eq_20250820141340.py +0 -78
neverlib/.history/filter/auto_eq/freq_eq_20250820141712.py +0 -78
neverlib/.history/filter/auto_eq/freq_eq_20250820141733.py +0 -78
neverlib/.history/filter/auto_eq/freq_eq_20250820141755.py +0 -78
neverlib/.history/filter/auto_eq/freq_eq_20250821102434.py +0 -76
neverlib/.history/filter/auto_eq/freq_eq_20250821102500.py +0 -76
neverlib/.history/filter/auto_eq/freq_eq_20250821102502.py +0 -76
neverlib/.history/filter/auto_eq/freq_eq_20250821143140.py +0 -76
neverlib/.history/filter/auto_eq/freq_eq_20250821153208.py +0 -76
neverlib/.history/filter/auto_eq/freq_eq_20250821153214.py +0 -76
neverlib/.history/filter/auto_eq/ga_eq_basic_20250820102957.py +0 -380
neverlib/.history/filter/auto_eq/ga_eq_basic_20250820113054.py +0 -380
neverlib/.history/filter/auto_eq/ga_eq_basic_20250820113150.py +0 -380
neverlib/.history/filter/auto_eq/ga_eq_basic_20250820113520.py +0 -385
neverlib/.history/filter/auto_eq/ga_eq_basic_20250820113525.py +0 -385
neverlib/.history/filter/auto_eq/ga_eq_basic_20250821102212.py +0 -385
neverlib/.history/filter/auto_eq/ga_eq_basic_20250901110521.py +0 -385
neverlib/.history/filter/auto_eq/ga_eq_basic_20250901110652.py +0 -385
neverlib/.history/filter/common_20250806002134.py +0 -37
neverlib/.history/filter/common_20250821120448.py +0 -49
neverlib/.history/filter/common_20250821120453.py +0 -49
neverlib/.history/metrics/dnsmos_20250806001612.py +0 -160
neverlib/.history/metrics/dnsmos_20250815180659.py +0 -160
neverlib/.history/metrics/dnsmos_20250815180701.py +0 -158
neverlib/.history/metrics/dnsmos_20250815181321.py +0 -154
neverlib/.history/metrics/dnsmos_20250815181327.py +0 -154
neverlib/.history/metrics/dnsmos_20250815181331.py +0 -154
neverlib/.history/metrics/dnsmos_20250815181620.py +0 -154
neverlib/.history/metrics/dnsmos_20250815181631.py +0 -154
neverlib/.history/metrics/dnsmos_20250815181742.py +0 -154
neverlib/.history/metrics/dnsmos_20250815181824.py +0 -153
neverlib/.history/metrics/dnsmos_20250815181834.py +0 -153
neverlib/.history/metrics/dnsmos_20250815181922.py +0 -153
neverlib/.history/metrics/dnsmos_20250815182011.py +0 -147
neverlib/.history/metrics/dnsmos_20250815182036.py +0 -144
neverlib/.history/metrics/dnsmos_20250815182936.py +0 -143
neverlib/.history/metrics/dnsmos_20250815182942.py +0 -143
neverlib/.history/metrics/dnsmos_20250815183032.py +0 -137
neverlib/.history/metrics/dnsmos_20250815183101.py +0 -144
neverlib/.history/metrics/dnsmos_20250815183121.py +0 -144
neverlib/.history/metrics/dnsmos_20250815183123.py +0 -143
neverlib/.history/metrics/dnsmos_20250815183214.py +0 -143
neverlib/.history/metrics/dnsmos_20250815183240.py +0 -143
neverlib/.history/metrics/dnsmos_20250815183248.py +0 -144
neverlib/.history/metrics/dnsmos_20250815183407.py +0 -142
neverlib/.history/metrics/dnsmos_20250815183409.py +0 -142
neverlib/.history/metrics/dnsmos_20250815183431.py +0 -142
neverlib/.history/metrics/dnsmos_20250815183507.py +0 -140
neverlib/.history/metrics/dnsmos_20250815183513.py +0 -139
neverlib/.history/metrics/dnsmos_20250815183618.py +0 -139
neverlib/.history/metrics/dnsmos_20250815183709.py +0 -140
neverlib/.history/metrics/dnsmos_20250815183756.py +0 -137
neverlib/.history/metrics/dnsmos_20250815183815.py +0 -128
neverlib/.history/metrics/dnsmos_20250815183827.py +0 -129
neverlib/.history/metrics/dnsmos_20250815183913.py +0 -117
neverlib/.history/metrics/dnsmos_20250815183914.py +0 -117
neverlib/.history/metrics/dnsmos_20250815184003.py +0 -118
neverlib/.history/metrics/dnsmos_20250815184040.py +0 -118
neverlib/.history/metrics/dnsmos_20250815184049.py +0 -118
neverlib/.history/metrics/dnsmos_20250815184104.py +0 -117
neverlib/.history/metrics/dnsmos_20250815184200.py +0 -117
neverlib/.history/metrics/lpc_lsp_metric_20250816015944.py +0 -128
neverlib/.history/metrics/lpc_lsp_metric_20250816020142.py +0 -128
neverlib/.history/metrics/lpc_lsp_metric_20250816020156.py +0 -128
neverlib/.history/metrics/lpc_lsp_metric_20250816020554.py +0 -130
neverlib/.history/metrics/lpc_lsp_metric_20250816020600.py +0 -125
neverlib/.history/metrics/lpc_lsp_metric_20250816020631.py +0 -120
neverlib/.history/metrics/lpc_lsp_metric_20250816020746.py +0 -118
neverlib/.history/metrics/lpc_me_20250816013111.py +0 -0
neverlib/.history/metrics/lpc_me_20250816013129.py +0 -121
neverlib/.history/metrics/lpc_me_20250816015430.py +0 -103
neverlib/.history/metrics/lpc_me_20250816015535.py +0 -96
neverlib/.history/metrics/lpc_me_20250816015542.py +0 -96
neverlib/.history/metrics/lpc_me_20250816015636.py +0 -97
neverlib/.history/metrics/lpc_me_20250816015658.py +0 -104
neverlib/.history/metrics/lpc_me_20250816015703.py +0 -100
neverlib/.history/metrics/lpc_me_20250816015945.py +0 -128
neverlib/.history/metrics/snr_20250806010538.py +0 -177
neverlib/.history/metrics/snr_20250806211634.py +0 -184
neverlib/.history/metrics/snr_20250827224201.py +0 -182
neverlib/.history/metrics/snr_20250827234019.py +0 -186
neverlib/.history/metrics/snr_20250827234028.py +0 -186
neverlib/.history/metrics/snr_20250827234030.py +0 -186
neverlib/.history/metrics/spec_20250805234209.py +0 -45
neverlib/.history/metrics/spec_20250816135530.py +0 -11
neverlib/.history/metrics/spec_20250816135654.py +0 -16
neverlib/.history/metrics/spec_20250816135736.py +0 -68
neverlib/.history/metrics/spec_20250816135904.py +0 -75
neverlib/.history/metrics/spec_20250816135921.py +0 -82
neverlib/.history/metrics/spec_20250816140111.py +0 -82
neverlib/.history/metrics/spec_20250816140543.py +0 -136
neverlib/.history/metrics/spec_20250816140559.py +0 -172
neverlib/.history/metrics/spec_20250816140602.py +0 -172
neverlib/.history/metrics/spec_20250816140608.py +0 -172
neverlib/.history/metrics/spec_20250816140654.py +0 -148
neverlib/.history/metrics/spec_20250816140705.py +0 -144
neverlib/.history/metrics/spec_20250816140755.py +0 -138
neverlib/.history/metrics/spec_20250816140823.py +0 -170
neverlib/.history/metrics/spec_20250816140832.py +0 -170
neverlib/.history/metrics/spec_20250816140833.py +0 -170
neverlib/.history/metrics/spec_20250816140922.py +0 -147
neverlib/.history/metrics/spec_20250816141148.py +0 -107
neverlib/.history/metrics/spec_20250816141219.py +0 -123
neverlib/.history/metrics/spec_20250816141732.py +0 -178
neverlib/.history/metrics/spec_20250816141740.py +0 -178
neverlib/.history/metrics/spec_20250816142030.py +0 -178
neverlib/.history/metrics/spec_20250816142107.py +0 -135
neverlib/.history/metrics/spec_20250816142126.py +0 -135
neverlib/.history/metrics/spec_20250816142410.py +0 -135
neverlib/.history/metrics/spec_20250816142415.py +0 -136
neverlib/.history/metrics/spec_metric_20250816135156.py +0 -0
neverlib/.history/metrics/spec_metric_20250816135226.py +0 -5
neverlib/.history/metrics/spec_metric_20250816135227.py +0 -10
neverlib/.history/metrics/spec_metric_20250816135306.py +0 -15
neverlib/.history/metrics/spec_metric_20250816135442.py +0 -31
neverlib/.history/metrics/spec_metric_20250816135448.py +0 -31
neverlib/.history/metrics/spec_metric_20250816135520.py +0 -29
neverlib/.history/metrics/spec_metric_20250816135537.py +0 -63
neverlib/.history/metrics/spec_metric_20250816135653.py +0 -65
neverlib/.history/utils/audio_split_20250805234209.py +0 -268
neverlib/.history/utils/audio_split_20250904185309.py +0 -268
neverlib/.history/utils/utils_20250813165516.py +0 -330
neverlib/.history/utils/utils_20250904181341.py +0 -328
neverlib/.history/utils/utils_20250904185546.py +0 -352
neverlib/.history/utils/utils_20250904185548.py +0 -353
neverlib/.history/utils/utils_20250904185603.py +0 -353
neverlib/.history/utils/utils_20250904185636.py +0 -353
neverlib/.history/utils/utils_20250904185658.py +0 -358
neverlib/.history/utils/utils_20250904190053.py +0 -359
neverlib/.history/vad/PreProcess_20250805234211.py +0 -63
neverlib/.history/vad/PreProcess_20250809232455.py +0 -63
neverlib/.history/vad/PreProcess_20250816020725.py +0 -66
neverlib/.history/vad/VAD_Silero_20250805234211.py +0 -50
neverlib/.history/vad/VAD_Silero_20250809232456.py +0 -50
neverlib/.history/vad/VAD_WebRTC_20250805234211.py +0 -61
neverlib/.history/vad/VAD_WebRTC_20250809232456.py +0 -61
neverlib/.history/vad/VAD_funasr_20250805234211.py +0 -54
neverlib/.history/vad/VAD_funasr_20250809232456.py +0 -54
neverlib/.history/vad/VAD_vadlib_20250805234211.py +0 -70
neverlib/.history/vad/VAD_vadlib_20250809232455.py +0 -70
neverlib/.history/vad/VAD_whisper_20250805234211.py +0 -55
neverlib/.history/vad/VAD_whisper_20250809232456.py +0 -55
neverlib/.specstory/.what-is-this.md +0 -69
neverlib/.specstory/history/2025-08-05_17-06Z-这一步的目的是什么.md +0 -424
neverlib/.specstory/history/2025-08-22_02-10Z-完善函数的功能和变量名建议.md +0 -247
neverlib/.specstory/history/2025-08-26_11-54Z-oserror-missing-shared-object-file.md +0 -87
neverlib/.specstory/history/2025-08-27_08-07Z-完善测试文档的讨论.md +0 -296
neverlib/.specstory/history/2025-08-27_08-29Z-delete-python-file-command.md +0 -211
neverlib/.specstory/history/2025-08-27_09-05Z-在jupyter中播放音频的代码修改.md +0 -357
neverlib-0.2.8.dist-info/RECORD +0 -510
{neverlib-0.2.8.dist-info → neverlib-0.3.0.dist-info}/WHEEL +0 -0
{neverlib-0.2.8.dist-info → neverlib-0.3.0.dist-info}/licenses/LICENSE +0 -0
{neverlib-0.2.8.dist-info → neverlib-0.3.0.dist-info}/top_level.txt +0 -0

neverlib/.history/metrics/spec_20250816142415.py DELETED Viewed

@@ -1,136 +0,0 @@
-'''
-Author: 凌逆战 | Never
-Date: 2025-08-16 13:51:57
-Description: 音频信号频域客观度量指标计算工具
-主要功能:
-1. SD (Spectral Distance) - 频谱距离
-   - 计算两个音频信号在频域上的差异程度
-   - 适用于音频质量评估和信号相似性分析
-2. LSD (Log-Spectral Distance) - 对数谱距离
-   - 在对数功率谱域计算信号距离
-   - 更符合人耳听觉特性，常用于语音质量评估
-3. MCD (Mel-Cepstral Distance) - 梅尔倒谱距离
-   - 基于MFCC特征的音频相似性度量
-   - 广泛应用于语音合成、语音识别等任务
-'''
-import librosa
-import numpy as np
-import soundfile as sf
-from neverlib.utils import EPS
-def sd(ref_wav, test_wav, n_fft=2048, hop_length=512, win_length=None):
-    """
-    计算两个音频信号之间的频谱距离 (Spectral Distance)。
-    该指标衡量两个信号在频域上的差异程度。
-    Args:
-        ref_wav (np.ndarray): 参考音频信号 (一维数组)
-        test_wav (np.ndarray): 测试音频信号 (一维数组)
-        n_fft (int): FFT点数，决定频率分辨率，默认为2048
-        hop_length (int): 帧移，决定时间分辨率，默认为512
-        win_length (int, optional): 窗长，如果为None则默认为n_fft
-    Returns:
-        float: 频谱距离值，值越小表示两个信号越相似
-    """
-    assert len(ref_wav) == len(test_wav), "输入信号长度必须相同"
-    # 计算短时傅里叶变换
-    ref_spec = librosa.stft(ref_wav, n_fft=n_fft, hop_length=hop_length, win_length=win_length)
-    test_spec = librosa.stft(test_wav, n_fft=n_fft, hop_length=hop_length, win_length=win_length)
-    # 计算频谱距离：均方根误差
-    spec_diff = ref_spec - test_spec
-    squared_diff = np.abs(spec_diff) ** 2
-    mean_squared_diff = np.mean(squared_diff)
-    sd_value = np.sqrt(mean_squared_diff)
-    return sd_value
-def lsd(ref_wav, test_wav, n_fft=2048, hop_length=512, win_length=None):
-    """
-    计算两个一维音频信号之间的对数谱距离 (Log-Spectral Distance, LSD)。
-    该实现遵循标准的LSD定义: 整体均方根误差。
-    Args:
-        ref_wav (np.ndarray): 原始的、干净的参考信号 (一维数组)。
-        test_wav (np.ndarray): 模型估计或处理后的信号 (一维数组)。
-        n_fft (int): FFT点数, 决定了频率分辨率。
-        hop_length (int): 帧移, 决定了时间分辨率。
-        win_length (int, optional): 窗长。如果为None, 则默认为n_fft。
-        epsilon (float): 一个非常小的数值, 用于防止对零取对数, 保证数值稳定性。
-    Returns:
-        float: 对数谱距离值, 单位为分贝 (dB)。
-    """
-    assert ref_wav.ndim == 1 and test_wav.ndim == 1, "输入信号必须是一维数组。"
-    if win_length is None:
-        win_length = n_fft
-    ref_stft = librosa.stft(ref_wav, n_fft=n_fft, hop_length=hop_length, win_length=win_length) # (F,T)
-    test_stft = librosa.stft(test_wav, n_fft=n_fft, hop_length=hop_length, win_length=win_length) # (F,T)
-    ref_power_spec = np.abs(ref_stft) ** 2 # (F,T)
-    test_power_spec = np.abs(test_stft) ** 2 # (F,T)
-    ref_log_power_spec = 10 * np.log10(ref_power_spec + EPS)
-    test_log_power_spec = 10 * np.log10(test_power_spec + EPS)
-    squared_error = (ref_log_power_spec - test_log_power_spec) ** 2
-    lsd_val = np.sqrt(np.mean(squared_error))
-    return lsd_val
-def mcd(ref_wav, test_wav, sr=16000, n_mfcc=13):
-    """
-    计算两个音频信号之间的梅尔倒谱距离 (Mel-Cepstral Distance, MCD)。
-    该指标常用于语音合成质量评估，值越小表示两个信号越相似。
-    Args:
-        ref_wav (np.ndarray): 参考音频信号 (一维数组)
-        test_wav (np.ndarray): 测试音频信号 (一维数组)
-        sr (int): 采样率，默认为16000Hz
-        n_mfcc (int): MFCC系数个数，默认为13
-    Returns:
-        float: 梅尔倒谱距离值，值越小表示两个信号越相似
-    """
-    assert len(ref_wav) == len(test_wav), "输入信号长度必须相同"
-    # 计算MFCC特征
-    ref_mfcc = librosa.feature.mfcc(y=ref_wav, sr=sr, n_mfcc=n_mfcc)
-    test_mfcc = librosa.feature.mfcc(y=test_wav, sr=sr, n_mfcc=n_mfcc)
-    # 计算MCD (跳过0阶系数，因为0阶主要表示能量)
-    diff = ref_mfcc[1:] - test_mfcc[1:]
-    mcd_value = (10.0 / np.log(10)) * np.sqrt(2 * np.mean(np.sum(diff ** 2, axis=0)))
-    return mcd_value
-if __name__ == "__main__":
-    ref_file = "../data/vad_example.wav"   # 参考语音文件路径
-    test_file = "../data/vad_example.wav" # 测试语音文件路径
-    ref_wav, ref_sr = sf.read(ref_file)
-    test_wav, test_sr = sf.read(test_file)
-    assert ref_sr == test_sr == 16000, "采样率必须为16000Hz"
-    assert len(ref_wav) == len(test_wav), "音频长度必须相同"
-    mcd_value = mcd(ref_wav, test_wav)
-    print(f"梅尔倒谱距离: {mcd_value:.2f}")
-    lsd_value = lsd(ref_wav, test_wav)
-    print(f"对数谱距离: {lsd_value:.2f}")
-    sd_value = sd(ref_wav, test_wav)
-    print(f"频谱距离: {sd_value:.2f}")

neverlib/.history/metrics/spec_metric_20250816135156.py DELETED Viewed

File without changes

neverlib/.history/metrics/spec_metric_20250816135226.py DELETED Viewed

@@ -1,5 +0,0 @@
-def mcd(ref_spec, test_spec):
-    #

neverlib/.history/metrics/spec_metric_20250816135227.py DELETED Viewed

@@ -1,10 +0,0 @@
-'''
-Author: 凌逆战 | Never
-Date: 2025-08-16 13:51:57
-Description:
-'''
-def mcd(ref_spec, test_spec):
-    #

neverlib/.history/metrics/spec_metric_20250816135306.py DELETED Viewed

@@ -1,15 +0,0 @@
-'''
-Author: 凌逆战 | Never
-Date: 2025-08-16 13:51:57
-Description:
-'''
-def mcd(ref_spec, test_spec):
-    """
-    梅尔倒谱距离 Mel-Cepstral Distance（MCD）
-    ref_spec: 参考频谱
-    test_spec: 测试频谱
-    """

neverlib/.history/metrics/spec_metric_20250816135442.py DELETED Viewed

@@ -1,31 +0,0 @@
-'''
-Author: 凌逆战 | Never
-Date: 2025-08-16 13:51:57
-Description:
-'''
-import librosa
-import numpy as np
-import soundfile as sf
-def mcd(ref_wav, test_wav, sr=16000):
-    """
-    梅尔倒谱距离 Mel-Cepstral Distance（MCD）
-    ref_spec: 参考频谱
-    test_spec: 测试频谱
-    """
-    ref_wav, ref_sr = sf.read(ref_wav)
-    test_wav, test_sr = sf.read(test_wav)
-    assert ref_sr == test_sr == sr, "采样率必须为16000Hz"
-    assert len(ref_wav) == len(test_wav), "音频长度必须相同"
-    ref_mfc = librosa.feature.mfcc(y=ref_wav, sr=sr)
-    test_mfc = librosa.feature.mfcc(y=test_wav, sr=sr)
-    mcd = np.mean(np.abs(ref_mfc - test_mfc))
-    return mcd

neverlib/.history/metrics/spec_metric_20250816135448.py DELETED Viewed

@@ -1,31 +0,0 @@
-'''
-Author: 凌逆战 | Never
-Date: 2025-08-16 13:51:57
-Description:
-'''
-import librosa
-import numpy as np
-import soundfile as sf
-def mcd(ref_wav, test_wav, sr=16000):
-    """
-    梅尔倒谱距离 Mel-Cepstral Distance（MCD）
-    ref_spec: 参考频谱
-    test_spec: 测试频谱
-    """
-    ref_wav, ref_sr = sf.read(ref_wav)
-    test_wav, test_sr = sf.read(test_wav)
-    assert ref_sr == test_sr == sr, "采样率必须为16000Hz"
-    assert len(ref_wav) == len(test_wav), "音频长度必须相同"
-    ref_mfc = librosa.feature.mfcc(y=ref_wav, sr=sr)
-    test_mfc = librosa.feature.mfcc(y=test_wav, sr=sr)
-    # 计算 MCD (跳过 0 阶)
-    return mcd

neverlib/.history/metrics/spec_metric_20250816135520.py DELETED Viewed

@@ -1,29 +0,0 @@
-'''
-Author: 凌逆战 | Never
-Date: 2025-08-16 13:51:57
-Description:
-'''
-import librosa
-import numpy as np
-import soundfile as sf
-def mcd(ref_wav, test_wav, sr=16000):
-    """
-    梅尔倒谱距离 Mel-Cepstral Distance
-    ref_spec: 参考频谱
-    test_spec: 测试频谱
-    """
-    ref_wav, ref_sr = sf.read(ref_wav)
-    test_wav, test_sr = sf.read(test_wav)
-    assert ref_sr == test_sr == sr, "采样率必须为16000Hz"
-    assert len(ref_wav) == len(test_wav), "音频长度必须相同"
-    ref_mfcc = librosa.feature.mfcc(y=ref_wav, sr=sr)
-    test_mfcc = librosa.feature.mfcc(y=test_wav, sr=sr)
-    # 计算 MCD (跳过 0 阶)
-    diff = ref_mfcc[1:] - test_mfcc[1:]
-    mcd = (10.0 / np.log(10)) * np.sqrt(2 * np.mean(np.sum(diff ** 2, axis=0)))
-    return mcd

neverlib/.history/metrics/spec_metric_20250816135537.py DELETED Viewed

@@ -1,63 +0,0 @@
-'''
-Author: 凌逆战 | Never
-Date: 2025-08-16 13:51:57
-Description:
-'''
-import librosa
-import numpy as np
-import soundfile as sf
-def lsd(reference, estimate, n_fft=2048, hop_length=512, win_length=None):
-    """
-    计算两个一维音频信号之间的对数谱距离 (Log-Spectral Distance, LSD)。
-    该实现遵循标准的LSD定义: 整体均方根误差。
-    Args:
-        reference (np.ndarray): 原始的、干净的参考信号 (一维数组)。
-        estimate (np.ndarray): 模型估计或处理后的信号 (一维数组)。
-        n_fft (int): FFT点数, 决定了频率分辨率。
-        hop_length (int): 帧移, 决定了时间分辨率。
-        win_length (int, optional): 窗长。如果为None, 则默认为n_fft。
-        epsilon (float): 一个非常小的数值, 用于防止对零取对数, 保证数值稳定性。
-    Returns:
-        float: 对数谱距离值, 单位为分贝 (dB)。
-    """
-    assert reference.ndim == 1 and estimate.ndim == 1, "输入信号必须是一维数组。"
-    if win_length is None:
-        win_length = n_fft
-    reference_stft = librosa.stft(reference, n_fft=n_fft, hop_length=hop_length, win_length=win_length) # (F,T)
-    estimate_stft = librosa.stft(estimate, n_fft=n_fft, hop_length=hop_length, win_length=win_length) # (F,T)
-    reference_power_spec = np.abs(reference_stft) ** 2 # (F,T)
-    estimate_power_spec = np.abs(estimate_stft) ** 2 # (F,T)
-    reference_log_power_spec = 10 * np.log10(reference_power_spec + EPS)
-    estimate_log_power_spec = 10 * np.log10(estimate_power_spec + EPS)
-    squared_error = (reference_log_power_spec - estimate_log_power_spec) ** 2
-    lsd_val = np.sqrt(np.mean(squared_error))
-    return lsd_val
-def mcd(ref_wav, test_wav, sr=16000):
-    """
-    梅尔倒谱距离 Mel-Cepstral Distance
-    ref_spec: 参考频谱
-    test_spec: 测试频谱
-    """
-    ref_wav, ref_sr = sf.read(ref_wav)
-    test_wav, test_sr = sf.read(test_wav)
-    assert ref_sr == test_sr == sr, "采样率必须为16000Hz"
-    assert len(ref_wav) == len(test_wav), "音频长度必须相同"
-    ref_mfcc = librosa.feature.mfcc(y=ref_wav, sr=sr)
-    test_mfcc = librosa.feature.mfcc(y=test_wav, sr=sr)
-    # 计算 MCD (跳过 0 阶)
-    diff = ref_mfcc[1:] - test_mfcc[1:]
-    mcd = (10.0 / np.log(10)) * np.sqrt(2 * np.mean(np.sum(diff ** 2, axis=0)))
-    return mcd

neverlib/.history/metrics/spec_metric_20250816135653.py DELETED Viewed

@@ -1,65 +0,0 @@
-'''
-Author: 凌逆战 | Never
-Date: 2025-08-16 13:51:57
-Description:
-'''
-import librosa
-import numpy as np
-import soundfile as sf
-from utils import EPS
-def lsd(ref_wav, test_wav, n_fft=2048, hop_length=512, win_length=None):
-    """
-    计算两个一维音频信号之间的对数谱距离 (Log-Spectral Distance, LSD)。
-    该实现遵循标准的LSD定义: 整体均方根误差。
-    Args:
-        ref_wav (np.ndarray): 原始的、干净的参考信号 (一维数组)。
-        test_wav (np.ndarray): 模型估计或处理后的信号 (一维数组)。
-        n_fft (int): FFT点数, 决定了频率分辨率。
-        hop_length (int): 帧移, 决定了时间分辨率。
-        win_length (int, optional): 窗长。如果为None, 则默认为n_fft。
-        epsilon (float): 一个非常小的数值, 用于防止对零取对数, 保证数值稳定性。
-    Returns:
-        float: 对数谱距离值, 单位为分贝 (dB)。
-    """
-    assert ref_wav.ndim == 1 and test_wav.ndim == 1, "输入信号必须是一维数组。"
-    if win_length is None:
-        win_length = n_fft
-    ref_stft = librosa.stft(ref_wav, n_fft=n_fft, hop_length=hop_length, win_length=win_length) # (F,T)
-    test_stft = librosa.stft(test_wav, n_fft=n_fft, hop_length=hop_length, win_length=win_length) # (F,T)
-    ref_power_spec = np.abs(ref_stft) ** 2 # (F,T)
-    test_power_spec = np.abs(test_stft) ** 2 # (F,T)
-    ref_log_power_spec = 10 * np.log10(ref_power_spec + EPS)
-    test_log_power_spec = 10 * np.log10(test_power_spec + EPS)
-    squared_error = (ref_log_power_spec - test_log_power_spec) ** 2
-    lsd_val = np.sqrt(np.mean(squared_error))
-    return lsd_val
-def mcd(ref_wav, test_wav, sr=16000):
-    """
-    梅尔倒谱距离 Mel-Cepstral Distance
-    ref_spec: 参考频谱
-    test_spec: 测试频谱
-    """
-    ref_wav, ref_sr = sf.read(ref_wav)
-    test_wav, test_sr = sf.read(test_wav)
-    assert ref_sr == test_sr == sr, "采样率必须为16000Hz"
-    assert len(ref_wav) == len(test_wav), "音频长度必须相同"
-    ref_mfcc = librosa.feature.mfcc(y=ref_wav, sr=sr)
-    test_mfcc = librosa.feature.mfcc(y=test_wav, sr=sr)
-    # 计算 MCD (跳过 0 阶)
-    diff = ref_mfcc[1:] - test_mfcc[1:]
-    mcd = (10.0 / np.log(10)) * np.sqrt(2 * np.mean(np.sum(diff ** 2, axis=0)))
-    return mcd

neverlib/.history/utils/audio_split_20250805234209.py DELETED Viewed

@@ -1,268 +0,0 @@
-'''
-Author: 凌逆战 | Never
-Date: 2025-04-10 18:07:03
-Description: 音频切割
-'''
-import os
-import random
-import subprocess
-from tqdm import tqdm
-import soundfile as sf
-import numpy as np
-from .utils import get_path_list
-from pydub import AudioSegment
-def audio_split_ffmpeg(source_path, target_path, sr, channel_num, duration, endwith="*.pcm"):
-    """ 切割音频切不准, 会留点尾巴0.016s
-    使用ffmpeg分割音频, 分割为短音频(单位:秒), 似乎无法非常准确的分割到指定长度
-    :param source_path: 源音频路径
-    :param target_path: 目标音频路径
-    :param sr: 源音频采样率
-    :param channel_num: 源音频声道数
-    :param duration: 分割为时长(短音频)(单位:秒)
-    :param endwith: 音频格式(支持pcm和wav)
-    """
-    wav_path_list = get_path_list(source_path, end=endwith)
-    print("待分割的音频数: ", len(wav_path_list))
-    for wav_path in wav_path_list:
-        wav_folder = wav_path[:-4].replace(source_path, target_path)
-        os.makedirs(wav_folder, exist_ok=True)
-        if endwith == "*.pcm":
-            # 将pcm文件切割成30s的语音, 有括号会报错
-            # ffmpeg -f s16le -ar 16000 -ac 6 -i ./NO.1_A3035_2.pcm -f segment -segment_time 30 -c copy NO.1_A3035_2/%03d.wav
-            command = ["ffmpeg", "-f", "s16le", "-ar", f"{sr}", "-ac", str(channel_num),
-                       "-i", wav_path, "-f", "segment", "-segment_time",
-                       f"{duration}", "-c", "copy", f"{wav_folder}/%03d.wav"]
-            subprocess.run(command, check=True)
-        elif endwith == "*.wav":
-            # ffmpeg -i ./NO.1_A3035_2.wav -f segment -segment_time 30 -c copy NO.1_A3035_2/%03d.wav
-            command = ["ffmpeg", "-i", wav_path, "-f", "segment", "-segment_time",
-                       f"{duration}", "-c", "copy", f"{wav_folder}/%03d.wav"]
-            subprocess.run(command, check=True)
-        else:
-            assert False, "不支持的音频格式"
-    print("分割完毕: done!")
-def audio_split_sox(source_path, target_path, duration, endwith="*.wav"):
-    """
-    使用sox分割音频, 分割为短音频(单位:秒), 可以非常准确的分割到指定长度
-    :param source_path: 源音频路径
-    :param target_path: 目标音频路径
-    :param duration: 分割为时长(短音频)(单位:秒)
-    :param endwith: 音频格式(只支持wav)
-    """
-    wav_path_list = get_path_list(source_path, end=endwith)
-    for wav_path in wav_path_list:
-        wav_folder = wav_path[:-4].replace(source_path, target_path)
-        os.makedirs(wav_folder, exist_ok=True)
-        output_pattern = f"{wav_folder}/%.wav"
-        if endwith == "*.wav":
-            # 对 WAV 文件直接进行分割
-            os.system(f"sox {wav_path} {output_pattern} trim 0 {str(duration)} : newfile : restart")
-        else:
-            assert False, "不支持的音频格式"
-    print("分割完毕: done!")
-def audio_split_np(source_path, target_path, sr, channel_num, duration, endwith="*.pcm"):
-    """
-    使用numpy读取pcm文件并切割保存为wav文件, 保持通道数一致, 保存不足30秒的最后一段音频
-    :param source_path: 源音频路径
-    :param target_path: 目标音频路径
-    :param sr: 采样率
-    :param channel_num: 声道数
-    :param duration: 分割的时长 (秒)
-    :param endwith: 音频格式 (支持 pcm)
-    """
-    assert endwith == "*.pcm", "只支持pcm格式的音频"
-    wav_path_list = get_path_list(source_path, end=endwith)  # 获取音频文件列表
-    print("待分割的音频数: ", len(wav_path_list))
-    segment_length_samples = duration * sr  # 每个切片音频的采样点数
-    for wav_path in wav_path_list:
-        print("正在分割: ", wav_path)
-        wav_folder = wav_path[:-4].replace(source_path, target_path)
-        os.makedirs(wav_folder, exist_ok=True)
-        # 注意读取时使用正确的dtype(例如int16表示16位PCM)
-        pcm_data = np.fromfile(wav_path, dtype=np.int16)
-        pcm_data = pcm_data[:(len(pcm_data) // channel_num) * channel_num]
-        pcm_data = pcm_data.reshape(-1, channel_num)
-        # 计算分割的数量
-        num_segments = len(pcm_data) // segment_length_samples
-        # 切割并保存每段音频
-        for i in tqdm(range(num_segments)):
-            start_idx = i * segment_length_samples
-            end_idx = (i + 1) * segment_length_samples
-            segment = pcm_data[start_idx:end_idx]
-            segment_filename = os.path.join(wav_folder, f"{i + 1:03d}.wav")   # 保存为wav文件
-            sf.write(segment_filename, segment, sr, subtype='PCM_16')
-        # 如果剩余部分少于30秒, 保存最后一段不足30秒的音频
-        remaining_samples = len(pcm_data) % segment_length_samples
-        if remaining_samples > 0:
-            segment = pcm_data[-remaining_samples:]
-            # 保存剩余部分
-            remaining_filename = os.path.join(wav_folder, f"{num_segments + 1:03d}.wav")
-            sf.write(remaining_filename, segment, sr, subtype='PCM_16')
-    print("分割完毕: done!")
-def audio_split_pydub(source_path, target_path, sr, channel_num, duration, endwith="*.pcm", sample_width=2):
-    """
-    使用pydub分割音频, 进行精确的分割
-    :param source_path: 源音频路径
-    :param target_path: 目标音频路径
-    :param sr: 源音频采样率
-    :param channel_num: 源音频声道数
-    :param duration: 分割为时长(短音频)(单位:秒), 必须是1s的整数倍
-    :param endwith: 音频格式(支持pcm和wav)
-    :param sample_width: 音频的样本宽度(字节数), 默认为2, 表示16位音频
-    """
-    assert duration % 1 == 0, "duration必须是1s的整数倍"
-    wav_path_list = get_path_list(source_path, end=endwith)  # 获取音频文件列表
-    print("待分割的音频数: ", len(wav_path_list))
-    for wav_path in wav_path_list:
-        print("正在分割: ", wav_path)
-        wav_folder = wav_path[:-4].replace(source_path, target_path)  # 设置目标文件夹
-        os.makedirs(wav_folder, exist_ok=True)
-        # 使用pydub加载音频
-        if endwith == "*.pcm":
-            # 读取pcm文件, 指定采样率、声道数和样本宽度
-            audio = AudioSegment.from_file(wav_path, format="raw", channels=channel_num, frame_rate=sr, sample_width=sample_width)
-        elif endwith == "*.wav":
-            # 读取wav文件
-            audio = AudioSegment.from_wav(wav_path)
-        else:
-            assert False, "不支持的音频格式"
-        # 计算每段的时长(以毫秒为单位)
-        segment_length = duration * 1000  # 转换为毫秒
-        # 切割音频并保存为多个文件
-        segment_number = 1
-        for i in tqdm(range(0, len(audio), segment_length)):
-            segment = audio[i:i + segment_length]
-            segment_filename = os.path.join(wav_folder, f"{segment_number:03d}.wav")
-            segment.export(segment_filename, format="wav")
-            segment_number += 1
-    print("分割完毕: done!")
-def audio_split_random(source_dir, target_dir, min_duration=3, max_duration=10, sr=16000):
-    """
-    将音频切割成 3 到 10 秒的多个片段并保存。
-    参数:
-    - input_audio_path: 输入音频文件路径
-    - output_dir: 输出音频文件夹路径
-    - min_duration: 最短切割片段长度 (秒), 默认3秒
-    - max_duration: 最长切割片段长度 (秒), 默认10秒
-    - sample_rate: 采样率, 默认16000
-    """
-    wav_path_list = get_path_list(source_dir, "*.wav")
-    for wav_path in wav_path_list:
-        output_dir = wav_path[:-4].replace(source_dir, target_dir)
-        os.makedirs(output_dir, exist_ok=True)
-        wav, wav_sr = sf.read(wav_path, always_2d=True)
-        assert wav_sr == sr, f"音频采样率不匹配: {wav_sr} != {sr}"
-        count = 0
-        while len(wav) > max_duration * sr:
-            segment_len = random.randint(min_duration * sr, max_duration * sr)
-            segment = wav[0: segment_len]
-            wav = wav[segment_len:]
-            count += 1
-            sf.write(os.path.join(output_dir, f"{count}.wav"), segment, sr)
-        sf.write(os.path.join(output_dir, f"{count + 1}.wav"), wav, sr)
-def audio_split_VADfunasr(source_dir, target_dir, sr=16000):
-    """
-    使用funasr的vad模型将音频中的语音分割成短句
-    """
-    from filter import HPFilter
-    from audio_aug import volume_norm
-    from funasr import AutoModel
-    model = AutoModel(model="fsmn-vad", model_revision="v2.0.4")
-    wav_path_list = get_path_list(source_dir, "*.wav")
-    for wav_path in wav_path_list:
-        wav_folder = wav_path[:-4].replace(source_dir, target_dir)
-        os.makedirs(wav_folder, exist_ok=True)
-        wav_orig, wav_sr = sf.read(wav_path, always_2d=True)
-        assert wav_sr == sr, f"音频采样率为{wav_sr}, 期望为{sr}"
-        wav = HPFilter(wav_orig[:, 0], sr=sr, order=6, cutoff=100)
-        wav = volume_norm(wav)
-        res_list = model.generate(input=wav)
-        for res in res_list:
-            for i, value_item in enumerate(res["value"]):
-                start, end = value_item
-                start, end = int(start * wav_sr / 1000), int(end * wav_sr / 1000)
-                # short_wav = wav_orig[start - int(0.5 * sr):end + int(0.5 * sr)]
-                # duration = (end - start) / sr
-                # assert len(short_wav) > sr * 3, f"{end/sr:.2f}-{start/sr:.2f}={duration:.2f}"
-                sf.write(os.path.join(wav_folder, f"{i}.wav"), wav_orig[start:end], sr)
-        # break
-def audio_split_VADsilero(source_dir, target_dir, sr, threshold=0.4,
-                          min_speech_duration_ms=400, min_silence_duration_ms=400,
-                          window_size_samples=512, speech_pad_ms=500):
-    """
-    使用silero的vad模型将音频中的语音分割成短句
-    source_dir: 音频文件目录
-    target_dir: 分割后的音频文件目录
-    sr: 音频采样率
-    threshold: 阈值
-    min_speech_duration_ms: 语音块的最小持续时间 ms
-    min_silence_duration_ms: 语音块之间的最小静音时间 ms
-    window_size_samples: 512\1024\1536
-    """
-    import torch
-    from filter import HPFilter
-    from audio_aug import volume_norm
-    model, utils = torch.hub.load(repo_or_dir='snakers4/silero-vad', model='silero_vad', force_reload=False, onnx=True)
-    (get_speech_timestamps, save_audio, read_audio, VADIterator, collect_chunks) = utils
-    wav_path_list = get_path_list(source_dir, "*.wav")
-    for wav_path in wav_path_list:
-        wav_folder = wav_path[:-4].replace(source_dir, target_dir)
-        os.makedirs(wav_folder, exist_ok=True)
-        wav_orig, wav_sr = sf.read(wav_path, always_2d=True)
-        assert wav_sr == sr, f"音频采样率为{wav_sr}, 期望为{sr}"
-        wav = HPFilter(wav_orig[:, 0], sr=sr, order=6, cutoff=100)
-        wav = volume_norm(wav)
-        speech_timestamps = get_speech_timestamps(wav, model,
-                                                  sampling_rate=sr,
-                                                  threshold=threshold,
-                                                  min_speech_duration_ms=min_speech_duration_ms,  # 语音块的最小持续时间 ms
-                                                  min_silence_duration_ms=min_silence_duration_ms,  # 语音块之间的最小静音时间 ms
-                                                  window_size_samples=window_size_samples,  # 512\1024\1536
-                                                  speech_pad_ms=speech_pad_ms,  # 最后的语音块由两侧的speech_pad_ms填充
-                                                  )
-        for i, timestamp in enumerate(speech_timestamps):
-            wav_vad = wav_orig[timestamp["start"]:timestamp["end"]]
-            sf.write(os.path.join(wav_folder, f"{i}.wav"), wav_vad, sr)

neverlib 0.2.8__py3-none-any.whl → 0.3.0__py3-none-any.whl

neverlib 0.2.8py3-none-any.whl → 0.3.0py3-none-any.whl