neverlib 0.2.4__py3-none-any.whl → 0.2.6__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- neverlib/.history/Docs/audio_aug/del_20250827162530.py +0 -0
- neverlib/.history/Docs/audio_aug/del_20250827162540.py +2 -0
- neverlib/.history/Docs/audio_aug/del_20250827162541.py +7 -0
- neverlib/.history/Docs/audio_aug/del_20250827162606.py +7 -0
- neverlib/.history/Docs/audio_aug/del_20250827162637.py +8 -0
- neverlib/.history/Docs/audio_aug/del_20250827162645.py +8 -0
- neverlib/.history/Docs/audio_aug/del_20250827162723.py +9 -0
- neverlib/.history/Docs/audio_aug/del_20250827162739.py +9 -0
- neverlib/.history/Docs/audio_aug/test_snr_20250827161751.py +55 -0
- neverlib/.history/Docs/audio_aug/test_snr_20250827161754.py +55 -0
- neverlib/.history/Docs/audio_aug/test_snr_20250827161833.py +54 -0
- neverlib/.history/Docs/audio_aug/test_snr_20250827162017.py +56 -0
- neverlib/.history/Docs/audio_aug/test_snr_20250827162021.py +57 -0
- neverlib/.history/Docs/audio_aug/test_snr_20250827162028.py +57 -0
- neverlib/.history/Docs/audio_aug_test/del_20250827162738.py +9 -0
- neverlib/.history/Docs/audio_aug_test/del_20250827162819.py +9 -0
- neverlib/.history/Docs/audio_aug_test/del_20250827162830.py +9 -0
- neverlib/.history/Docs/audio_aug_test/del_20250827162846.py +9 -0
- neverlib/.history/Docs/audio_aug_test/del_20250827162851.py +9 -0
- neverlib/.history/Docs/audio_aug_test/del_20250827162903.py +10 -0
- neverlib/.history/Docs/audio_aug_test/del_20250827162921.py +10 -0
- neverlib/.history/Docs/audio_aug_test/del_20250827162926.py +10 -0
- neverlib/.history/Docs/audio_aug_test/del_20250827163030.py +10 -0
- neverlib/.history/Docs/audio_aug_test/del_20250827163032.py +10 -0
- neverlib/.history/QA/html2markdown_20250822234112.md +0 -0
- neverlib/.history/QA/html2markdown_20250822234140.py +9 -0
- neverlib/.history/QA/html2markdown_20250822234141.md +9 -0
- neverlib/.history/QA/html2markdown_20250822234159.py +12 -0
- neverlib/.history/QA/html2markdown_20250822234200.py +17 -0
- neverlib/.history/QA/html2markdown_20250822234236.py +17 -0
- neverlib/.history/QA/html2markdown_20250822234340.py +14 -0
- neverlib/.history/QA/html2markdown_20250822234522.py +18 -0
- neverlib/.history/QA/html2markdown_20250822234601.py +20 -0
- neverlib/.history/QA/html2markdown_20250822234615.py +22 -0
- neverlib/.history/QA/html2markdown_20250822234715.py +28 -0
- neverlib/.history/QA/html2markdown_20250822234720.py +27 -0
- neverlib/.history/QA/html2markdown_20250822234903.py +27 -0
- neverlib/.history/__init___20250805234212.py +41 -0
- neverlib/.history/__init___20250904102635.py +39 -0
- neverlib/.history/__init___20250904102836.py +34 -0
- neverlib/.history/__init___20250904102838.py +39 -0
- neverlib/.history/__init___20250904102851.py +33 -0
- neverlib/.history/audio_aug/audio_aug_20250826155913.py +158 -0
- neverlib/.history/audio_aug/audio_aug_20250826164159.py +159 -0
- neverlib/.history/audio_aug/audio_aug_20250826164217.py +160 -0
- neverlib/.history/audio_aug/audio_aug_20250826164408.py +161 -0
- neverlib/.history/audio_aug/audio_aug_20250826164423.py +161 -0
- neverlib/.history/audio_aug/audio_aug_20250826164529.py +161 -0
- neverlib/.history/audio_aug/audio_aug_20250826164824.py +161 -0
- neverlib/.history/audio_aug/audio_aug_20250826164932.py +162 -0
- neverlib/.history/audio_aug/audio_aug_20250826164947.py +162 -0
- neverlib/.history/audio_aug/audio_aug_20250826165403.py +162 -0
- neverlib/.history/audio_aug/audio_aug_20250826165421.py +162 -0
- neverlib/.history/audio_aug/audio_aug_20250826165509.py +163 -0
- neverlib/.history/audio_aug/audio_aug_20250826165702.py +163 -0
- neverlib/.history/audio_aug/audio_aug_20250826165732.py +165 -0
- neverlib/.history/audio_aug/audio_aug_20250826170041.py +163 -0
- neverlib/.history/audio_aug/audio_aug_20250826170105.py +164 -0
- neverlib/.history/audio_aug/audio_aug_20250826170154.py +164 -0
- neverlib/.history/audio_aug/audio_aug_20250826170220.py +165 -0
- neverlib/.history/audio_aug/audio_aug_20250826170221.py +165 -0
- neverlib/.history/audio_aug/audio_aug_20250826170228.py +165 -0
- neverlib/.history/audio_aug/audio_aug_20250826170231.py +165 -0
- neverlib/.history/audio_aug/audio_aug_20250826212001.py +165 -0
- neverlib/.history/audio_aug/audio_aug_20250826220038.py +165 -0
- neverlib/.history/audio_aug/audio_aug_20250826220133.py +165 -0
- neverlib/.history/audio_aug/audio_aug_20250826220148.py +165 -0
- neverlib/.history/audio_aug/audio_aug_20250826220154.py +165 -0
- neverlib/.history/audio_aug/audio_aug_20250826220156.py +165 -0
- neverlib/.history/audio_aug/audio_aug_20250826220314.py +165 -0
- neverlib/.history/audio_aug/audio_aug_20250826220343.py +184 -0
- neverlib/.history/audio_aug/audio_aug_20250826220345.py +184 -0
- neverlib/.history/audio_aug/audio_aug_20250826220349.py +184 -0
- neverlib/.history/audio_aug/audio_aug_20250826220429.py +184 -0
- neverlib/.history/audio_aug/audio_aug_20250826220447.py +184 -0
- neverlib/.history/audio_aug/audio_aug_20250826220601.py +186 -0
- neverlib/.history/audio_aug/audio_aug_20250826220638.py +186 -0
- neverlib/.history/audio_aug/audio_aug_20250826220641.py +186 -0
- neverlib/.history/audio_aug/audio_aug_20250826220647.py +186 -0
- neverlib/.history/audio_aug/audio_aug_20250826220653.py +186 -0
- neverlib/.history/audio_aug/audio_aug_20250826220655.py +186 -0
- neverlib/.history/audio_aug/audio_aug_20250826220731.py +185 -0
- neverlib/.history/audio_aug/audio_aug_20250826220739.py +185 -0
- neverlib/.history/audio_aug/audio_aug_20250826220747.py +185 -0
- neverlib/.history/audio_aug/audio_aug_20250826220801.py +186 -0
- neverlib/.history/audio_aug/audio_aug_20250826220822.py +186 -0
- neverlib/.history/audio_aug/audio_aug_20250826220901.py +186 -0
- neverlib/.history/audio_aug/audio_aug_20250826221107.py +187 -0
- neverlib/.history/audio_aug/audio_aug_20250826221310.py +188 -0
- neverlib/.history/audio_aug/audio_aug_20250826221353.py +191 -0
- neverlib/.history/audio_aug/audio_aug_20250826221821.py +191 -0
- neverlib/.history/audio_aug/audio_aug_20250826221838.py +191 -0
- neverlib/.history/audio_aug/audio_aug_20250826221906.py +191 -0
- neverlib/.history/audio_aug/audio_aug_20250826221930.py +191 -0
- neverlib/.history/audio_aug/audio_aug_20250826221939.py +191 -0
- neverlib/.history/audio_aug/audio_aug_20250826221955.py +191 -0
- neverlib/.history/audio_aug/audio_aug_20250826222008.py +197 -0
- neverlib/.history/audio_aug/audio_aug_20250826222017.py +200 -0
- neverlib/.history/audio_aug/audio_aug_20250826222046.py +203 -0
- neverlib/.history/audio_aug/audio_aug_20250826222105.py +203 -0
- neverlib/.history/audio_aug/audio_aug_20250826222206.py +203 -0
- neverlib/.history/audio_aug/audio_aug_20250826222302.py +203 -0
- neverlib/.history/audio_aug/audio_aug_20250826222336.py +203 -0
- neverlib/.history/audio_aug/audio_aug_20250826222455.py +204 -0
- neverlib/.history/audio_aug/audio_aug_20250826222526.py +204 -0
- neverlib/.history/audio_aug/audio_aug_20250826222541.py +204 -0
- neverlib/.history/audio_aug/audio_aug_20250826222624.py +202 -0
- neverlib/.history/audio_aug/audio_aug_20250826222714.py +205 -0
- neverlib/.history/audio_aug/audio_aug_20250826222820.py +205 -0
- neverlib/.history/audio_aug/audio_aug_20250826222827.py +205 -0
- neverlib/.history/audio_aug/audio_aug_20250826222927.py +232 -0
- neverlib/.history/audio_aug/audio_aug_20250826223009.py +232 -0
- neverlib/.history/audio_aug/audio_aug_20250826223054.py +232 -0
- neverlib/.history/audio_aug/audio_aug_20250826223225.py +233 -0
- neverlib/.history/audio_aug/audio_aug_20250826223344.py +236 -0
- neverlib/.history/audio_aug/audio_aug_20250826223356.py +236 -0
- neverlib/.history/audio_aug/audio_aug_20250826223955.py +242 -0
- neverlib/.history/audio_aug/audio_aug_20250826224210.py +240 -0
- neverlib/.history/audio_aug/audio_aug_20250826224250.py +242 -0
- neverlib/.history/audio_aug/audio_aug_20250826224323.py +280 -0
- neverlib/.history/audio_aug/audio_aug_20250826224452.py +263 -0
- neverlib/.history/audio_aug/audio_aug_20250826224455.py +263 -0
- neverlib/.history/audio_aug/audio_aug_20250826224502.py +263 -0
- neverlib/.history/audio_aug/audio_aug_20250826224528.py +263 -0
- neverlib/.history/audio_aug/audio_aug_20250826224658.py +263 -0
- neverlib/.history/audio_aug/audio_aug_20250826224833.py +264 -0
- neverlib/.history/audio_aug/audio_aug_20250826225013.py +269 -0
- neverlib/.history/audio_aug/audio_aug_20250826225050.py +269 -0
- neverlib/.history/audio_aug/audio_aug_20250826225241.py +268 -0
- neverlib/.history/audio_aug/audio_aug_20250826225315.py +266 -0
- neverlib/.history/audio_aug/audio_aug_20250826225404.py +266 -0
- neverlib/.history/audio_aug/audio_aug_20250826225502.py +265 -0
- neverlib/.history/audio_aug/audio_aug_20250826225950.py +267 -0
- neverlib/.history/audio_aug/audio_aug_20250826225959.py +268 -0
- neverlib/.history/audio_aug/audio_aug_20250826230222.py +271 -0
- neverlib/.history/audio_aug/audio_aug_20250826230248.py +270 -0
- neverlib/.history/audio_aug/audio_aug_20250826230638.py +266 -0
- neverlib/.history/audio_aug/audio_aug_20250826230755.py +266 -0
- neverlib/.history/audio_aug/audio_aug_20250826230941.py +265 -0
- neverlib/.history/audio_aug/audio_aug_20250826231054.py +266 -0
- neverlib/.history/audio_aug/audio_aug_20250826231117.py +266 -0
- neverlib/.history/audio_aug/audio_aug_20250826231219.py +266 -0
- neverlib/.history/audio_aug/audio_aug_20250826232330.py +266 -0
- neverlib/.history/audio_aug/audio_aug_20250826232352.py +266 -0
- neverlib/.history/audio_aug/audio_aug_20250827152748.py +268 -0
- neverlib/.history/audio_aug/audio_aug_20250827152806.py +268 -0
- neverlib/.history/audio_aug/audio_aug_20250827152808.py +268 -0
- neverlib/.history/audio_aug/audio_aug_20250827152917.py +283 -0
- neverlib/.history/audio_aug/audio_aug_20250827152929.py +281 -0
- neverlib/.history/audio_aug/audio_aug_20250827153100.py +286 -0
- neverlib/.history/audio_aug/audio_aug_20250827153102.py +286 -0
- neverlib/.history/audio_aug/audio_aug_20250827153301.py +295 -0
- neverlib/.history/audio_aug/audio_aug_20250827153331.py +298 -0
- neverlib/.history/audio_aug/audio_aug_20250827153525.py +303 -0
- neverlib/.history/audio_aug/audio_aug_20250827153533.py +304 -0
- neverlib/.history/audio_aug/audio_aug_20250827153541.py +321 -0
- neverlib/.history/audio_aug/audio_aug_20250827153805.py +322 -0
- neverlib/.history/audio_aug/audio_aug_20250827153832.py +323 -0
- neverlib/.history/audio_aug/audio_aug_20250827153836.py +324 -0
- neverlib/.history/audio_aug/audio_aug_20250827153846.py +324 -0
- neverlib/.history/audio_aug/audio_aug_20250827153859.py +325 -0
- neverlib/.history/audio_aug/audio_aug_20250827154453.py +337 -0
- neverlib/.history/audio_aug/audio_aug_20250827154513.py +355 -0
- neverlib/.history/audio_aug/audio_aug_20250827154538.py +356 -0
- neverlib/.history/audio_aug/audio_aug_20250827154541.py +357 -0
- neverlib/.history/audio_aug/audio_aug_20250827154612.py +357 -0
- neverlib/.history/audio_aug/audio_aug_20250827154657.py +360 -0
- neverlib/.history/audio_aug/audio_aug_20250827154708.py +360 -0
- neverlib/.history/audio_aug/audio_aug_20250827154728.py +366 -0
- neverlib/.history/audio_aug/audio_aug_20250827154755.py +367 -0
- neverlib/.history/audio_aug/audio_aug_20250827154800.py +367 -0
- neverlib/.history/audio_aug/audio_aug_20250827154917.py +368 -0
- neverlib/.history/audio_aug/audio_aug_20250827154928.py +369 -0
- neverlib/.history/audio_aug/audio_aug_20250827154932.py +370 -0
- neverlib/.history/audio_aug/audio_aug_20250827154947.py +372 -0
- neverlib/.history/audio_aug/audio_aug_20250827155015.py +375 -0
- neverlib/.history/audio_aug/audio_aug_20250827155106.py +375 -0
- neverlib/.history/audio_aug/audio_aug_20250827155114.py +393 -0
- neverlib/.history/audio_aug/audio_aug_20250827155207.py +415 -0
- neverlib/.history/audio_aug/audio_aug_20250827155300.py +415 -0
- neverlib/.history/audio_aug/audio_aug_20250827155321.py +471 -0
- neverlib/.history/audio_aug/audio_aug_20250827164703.py +471 -0
- neverlib/.history/audio_aug/audio_aug_20250827164749.py +471 -0
- neverlib/.history/audio_aug/audio_aug_20250827165252.py +472 -0
- neverlib/.history/audio_aug/audio_aug_20250827165334.py +472 -0
- neverlib/.history/audio_aug/audio_aug_20250827165404.py +473 -0
- neverlib/.history/audio_aug/audio_aug_20250827165610.py +473 -0
- neverlib/.history/audio_aug/audio_aug_20250827165805.py +473 -0
- neverlib/.history/audio_aug/audio_aug_20250827170056.py +473 -0
- neverlib/.history/audio_aug/audio_aug_20250827170106.py +472 -0
- neverlib/.history/audio_aug/audio_aug_20250827170143.py +472 -0
- neverlib/.history/audio_aug/audio_aug_20250827170216.py +472 -0
- neverlib/.history/audio_aug/audio_aug_20250827170218.py +472 -0
- neverlib/.history/audio_aug/audio_aug_20250827170314.py +472 -0
- neverlib/.history/audio_aug/audio_aug_20250827171500.py +471 -0
- neverlib/.history/audio_aug/audio_aug_20250827172347.py +471 -0
- neverlib/.history/audio_aug/audio_aug_20250827172558.py +470 -0
- neverlib/.history/audio_aug/audio_aug_20250827172559.py +470 -0
- neverlib/.history/audio_aug/audio_aug_20250827172801.py +470 -0
- neverlib/.history/audio_aug/audio_aug_20250827182522.py +470 -0
- neverlib/.history/audio_aug/audio_aug_20250827182526.py +470 -0
- neverlib/.history/audio_aug/audio_aug_20250827182626.py +470 -0
- neverlib/.history/audio_aug/audio_aug_20250827182715.py +470 -0
- neverlib/.history/audio_aug/audio_aug_20250904185444.py +470 -0
- neverlib/.history/audio_aug/audio_aug_20250904185538.py +445 -0
- neverlib/.history/data_analyze/__init___20250806204158.py +14 -0
- neverlib/.history/data_analyze/__init___20250827163248.py +14 -0
- neverlib/.history/filter/auto_eq/freq_eq_20250821143140.py +76 -0
- neverlib/.history/filter/auto_eq/freq_eq_20250821153208.py +76 -0
- neverlib/.history/filter/auto_eq/freq_eq_20250821153214.py +76 -0
- neverlib/.history/filter/auto_eq/ga_eq_basic_20250901110521.py +385 -0
- neverlib/.history/filter/auto_eq/ga_eq_basic_20250901110652.py +385 -0
- neverlib/.history/filter/common_20250806002134.py +37 -0
- neverlib/.history/filter/common_20250821120448.py +49 -0
- neverlib/.history/filter/common_20250821120453.py +49 -0
- neverlib/.history/metrics/snr_20250827224201.py +182 -0
- neverlib/.history/metrics/snr_20250827234019.py +186 -0
- neverlib/.history/metrics/snr_20250827234028.py +186 -0
- neverlib/.history/metrics/snr_20250827234030.py +186 -0
- neverlib/.history/utils/audio_split_20250805234209.py +268 -0
- neverlib/.history/utils/audio_split_20250904185309.py +268 -0
- neverlib/.history/utils/utils_20250813165516.py +330 -0
- neverlib/.history/utils/utils_20250904181341.py +328 -0
- neverlib/.history/utils/utils_20250904185546.py +352 -0
- neverlib/.history/utils/utils_20250904185548.py +353 -0
- neverlib/.history/utils/utils_20250904185603.py +353 -0
- neverlib/.history/utils/utils_20250904185636.py +353 -0
- neverlib/.history/utils/utils_20250904185658.py +358 -0
- neverlib/.history/utils/utils_20250904190053.py +359 -0
- neverlib/.specstory/history/2025-08-22_02-10Z-/345/256/214/345/226/204/345/207/275/346/225/260/347/232/204/345/212/237/350/203/275/345/222/214/345/217/230/351/207/217/345/220/215/345/273/272/350/256/256.md +247 -0
- neverlib/.specstory/history/2025-08-26_11-54Z-oserror-missing-shared-object-file.md +87 -0
- neverlib/.specstory/history/2025-08-27_08-07Z-/345/256/214/345/226/204/346/265/213/350/257/225/346/226/207/346/241/243/347/232/204/350/256/250/350/256/272.md +296 -0
- neverlib/.specstory/history/2025-08-27_08-29Z-delete-python-file-command.md +211 -0
- neverlib/.specstory/history/2025-08-27_09-05Z-/345/234/250jupyter/344/270/255/346/222/255/346/224/276/351/237/263/351/242/221/347/232/204/344/273/243/347/240/201/344/277/256/346/224/271.md +357 -0
- neverlib/Docs/audio_aug_test/test_snr.py +55 -0
- neverlib/Docs/audio_aug_test/test_volume.py +0 -0
- neverlib/QA/html2markdown.py +27 -0
- neverlib/__init__.py +10 -20
- neverlib/audio_aug/__init__.py +6 -1
- neverlib/audio_aug/audio_aug.py +360 -55
- neverlib/data_analyze/__init__.py +8 -2
- neverlib/data_analyze/temporal_features.py +1 -1
- neverlib/filter/__init__.py +9 -3
- neverlib/filter/auto_eq/freq_eq.py +1 -1
- neverlib/filter/auto_eq/ga_eq_basic.py +3 -3
- neverlib/filter/common.py +12 -0
- neverlib/metrics/snr.py +5 -3
- neverlib/utils/__init__.py +14 -7
- neverlib/utils/lazy_module.py +81 -0
- neverlib/utils/message.py +3 -8
- neverlib/utils/utils.py +32 -3
- neverlib/vad/__init__.py +16 -9
- neverlib/vad/utils.py +20 -6
- {neverlib-0.2.4.dist-info → neverlib-0.2.6.dist-info}/METADATA +21 -17
- neverlib-0.2.6.dist-info/RECORD +467 -0
- neverlib-0.2.4.dist-info/RECORD +0 -229
- /neverlib/{Docs/audio_aug/test_snr.py → .history/Docs/audio_aug/test_snr_20250827162033.py} +0 -0
- {neverlib-0.2.4.dist-info → neverlib-0.2.6.dist-info}/WHEEL +0 -0
- {neverlib-0.2.4.dist-info → neverlib-0.2.6.dist-info}/licenses/LICENSE +0 -0
- {neverlib-0.2.4.dist-info → neverlib-0.2.6.dist-info}/top_level.txt +0 -0
|
@@ -0,0 +1,358 @@
|
|
|
1
|
+
# -*- coding:utf-8 -*-
|
|
2
|
+
# Author:凌逆战 | Never
|
|
3
|
+
# Date: 2023/9/25
|
|
4
|
+
"""
|
|
5
|
+
folder处理
|
|
6
|
+
"""
|
|
7
|
+
import os
|
|
8
|
+
import random
|
|
9
|
+
import shutil
|
|
10
|
+
import fnmatch
|
|
11
|
+
from tqdm import tqdm
|
|
12
|
+
from datetime import datetime
|
|
13
|
+
import soundfile as sf
|
|
14
|
+
import numpy as np
|
|
15
|
+
EPS = np.finfo(float).eps
|
|
16
|
+
|
|
17
|
+
|
|
18
|
+
def get_path_list(source_path, end="*.wav", shuffle=False):
    """Recursively collect the files under ``source_path`` whose names match ``end``.

    Args:
        source_path: Root directory that is traversed with ``os.walk``.
        end: ``fnmatch``-style file-name pattern; defaults to ``"*.wav"``.
        shuffle: When true, the collected list is shuffled in place with
            ``random.shuffle`` before being returned.

    Returns:
        A list with one path per matching file, each built by joining the
        file name onto the directory it was found in.
    """
    matched_paths = []
    for folder, _subdirs, names in os.walk(source_path):
        # fnmatch.filter keeps only the names matching the pattern.
        matched_paths.extend(os.path.join(folder, name) for name in fnmatch.filter(names, end))

    # The count is printed only when LOCAL_RANK is "0" or not set at all.
    if os.environ.get("LOCAL_RANK", "0") == "0":
        print(source_path, len(matched_paths))

    if shuffle:
        random.shuffle(matched_paths)
    return matched_paths
|
|
29
|
+
|
|
30
|
+
|
|
31
|
+
def get_audio_segments(wav_len, wav_path_list, sr=16000, insert_silence=None):
    """Assemble a clip of ``wav_len`` samples from randomly chosen audio files.

    Files are drawn at random (with replacement) from ``wav_path_list`` and
    appended until at least ``wav_len`` samples have been gathered. If more
    than ``wav_len`` samples were gathered, a random window of exactly
    ``wav_len`` samples is cut out of the concatenation.

    Args:
        wav_len: Number of samples (rows) the returned audio should have.
        wav_path_list: List of audio file paths to draw from.
        sr: Sample rate every file is required to have.
        insert_silence: When not ``None``, a block of zeros whose length is a
            random integer in ``[0, insert_silence]`` is appended after every
            file. The silence counts towards the gathered length.

    Returns:
        A float32 array with one row per sample and one column per channel
        (files are read with ``always_2d=True``).

    Raises:
        AssertionError: If a file's sample rate differs from ``sr``.
    """
    gathered_len = 0
    pieces = []
    while gathered_len < wav_len:
        audio_path = random.choice(wav_path_list)
        wav, wav_sr = sf.read(audio_path, always_2d=True, dtype='float32')
        assert wav_sr == sr, f"音频采样率是{wav_sr}, 期望{sr}"
        gathered_len += len(wav)
        pieces.append(wav)
        if insert_silence is not None:
            silence_len = random.randint(0, insert_silence)
            # The silence must be 2-D with the same channel count as the audio
            # just read, otherwise np.concatenate below cannot join the pieces.
            silence = np.zeros((silence_len, wav.shape[1]), dtype=np.float32)
            gathered_len += silence_len
            pieces.append(silence)

    wav = np.concatenate(pieces, axis=0)
    if len(wav) > wav_len:
        # Cut a random window of exactly wav_len samples.
        start = random.randint(0, len(wav) - wav_len)
        wav = wav[start:start + wav_len, :]
    return wav
|
|
59
|
+
|
|
60
|
+
|
|
61
|
+
def rename_files_and_folders(directory, replace='_-', replacement='_'):
    """Replace a substring in every file and folder name below ``directory``.

    Args:
        directory: Root of the tree to process. The root itself is not renamed.
        replace: Substring to look for in each file or folder name.
        replacement: Text substituted for every occurrence of ``replace``.

    Each rename is reported with ``print``.
    """
    # Walk bottom-up: a folder is renamed only after everything inside it has
    # been handled. A top-down walk would rename the folder first and then be
    # unable to descend into its old name, skipping the whole subtree.
    for root, dirs, files in os.walk(directory, topdown=False):
        for kind, names in (("file", files), ("folder", dirs)):
            for name in names:
                if replace not in name:
                    continue
                old_path = os.path.join(root, name)
                new_path = os.path.join(root, name.replace(replace, replacement))
                os.rename(old_path, new_path)
                print(f'Renamed {kind}: {old_path} -> {new_path}')
|
|
79
|
+
|
|
80
|
+
|
|
81
|
+
def get_file_time(file_path):
    """Return the last-modification time of ``file_path``.

    The modification timestamp from ``os.path.getmtime`` is converted with
    ``datetime.fromtimestamp`` and returned as a ``datetime`` object.
    """
    return datetime.fromtimestamp(os.path.getmtime(file_path))
|
|
91
|
+
|
|
92
|
+
|
|
93
|
+
def TrainValSplit(dataset_dir, train_dir, val_dir, percentage=0.9):
    """Split a dataset of wav files into a training set and a validation set.

    All ``*.wav`` files under ``dataset_dir`` are listed in shuffled order, the
    first ``int(total * percentage)`` of them are copied below ``train_dir`` and
    the rest below ``val_dir``. The sub-directory layout is kept.

    :param dataset_dir: source dataset directory
    :param train_dir: destination directory of the training set
    :param val_dir: destination directory of the validation set
    :param percentage: fraction of the files that goes to the training set
    """
    wav_path_list = get_path_list(dataset_dir, end="*.wav", shuffle=True)
    # Index separating the training part from the validation part.
    split_idx = int(len(wav_path_list) * percentage)

    copy_plan = (
        (wav_path_list[:split_idx], train_dir, "Copying train wav"),
        (wav_path_list[split_idx:], val_dir, "Copying val wav"),
    )
    for paths, target_root, desc in copy_plan:
        for wav_path in tqdm(paths, desc=desc):
            # Swap only the leading dataset_dir prefix; without the count a
            # later occurrence of the same text in the path would be rewritten too.
            target_path = wav_path.replace(dataset_dir, target_root, 1)
            os.makedirs(os.path.dirname(target_path), exist_ok=True)
            shutil.copy(wav_path, target_path)

    print("Done!")
|
|
119
|
+
|
|
120
|
+
|
|
121
|
+
def TrainValTestSplit(dataset_dir, train_dir, val_dir, test_dir, percentage=[0.8, 0.1, 0.1]):
    """Split a dataset of wav files into training, validation and test sets.

    The ``*.wav`` files under ``dataset_dir`` are sorted and then shuffled after
    seeding the global ``random`` generator with 10086. The files are copied
    below the three destination directories, keeping the sub-directory layout.

    :param dataset_dir: source dataset directory
    :param train_dir: destination directory of the training set
    :param val_dir: destination directory of the validation set
    :param test_dir: destination directory of the test set
    :param percentage: ``[train, val, test]`` fractions; must sum to 1.0.
        The default list is only read, never modified.
    :raises AssertionError: if the fractions do not sum to 1.0
    """
    import math  # function-scope import: used only for the tolerance check

    # Compare with a tolerance: sums of decimal fractions are not always
    # exactly 1.0 in binary floating point.
    assert math.isclose(sum(percentage), 1.0), "百分比总和必须等于1.0"

    wav_path_list = sorted(get_path_list(dataset_dir, end="*.wav"))
    random.seed(10086)
    random.shuffle(wav_path_list)  # shuffle the list order
    total_wav_num = len(wav_path_list)

    # Split points between train / val / test.
    train_split_idx = int(total_wav_num * percentage[0])
    val_split_idx = train_split_idx + int(total_wav_num * percentage[1])

    train_path_list = wav_path_list[:train_split_idx]
    val_path_list = wav_path_list[train_split_idx:val_split_idx]
    test_path_list = wav_path_list[val_split_idx:]

    copy_plan = (
        (train_path_list, train_dir, "复制训练集音频"),
        (val_path_list, val_dir, "复制验证集音频"),
        (test_path_list, test_dir, "复制测试集音频"),
    )
    for paths, target_root, desc in copy_plan:
        for wav_path in tqdm(paths, desc=desc):
            # Swap only the leading dataset_dir prefix of the path.
            target_path = wav_path.replace(dataset_dir, target_root, 1)
            os.makedirs(os.path.dirname(target_path), exist_ok=True)
            shutil.copy(wav_path, target_path)

    print(f"完成! 训练集: {len(train_path_list)}个文件, 验证集: {len(val_path_list)}个文件, 测试集: {len(test_path_list)}个文件")
|
|
163
|
+
|
|
164
|
+
|
|
165
|
+
def get_leaf_folders(directory):
    """Return the bottom-level folders of ``directory``.

    A folder is reported when ``os.walk`` lists no sub-folders for it; this
    includes ``directory`` itself when it has none.
    """
    return [folder for folder, subdirs, _files in os.walk(directory) if not subdirs]
|
|
172
|
+
|
|
173
|
+
|
|
174
|
+
def del_empty_folders(path):
    """Recursively delete empty folders, children before their parent.

    Nothing happens when ``path`` is not a directory. Otherwise every
    sub-folder is processed first; ``path`` itself is removed afterwards if it
    has no entries left, and the removal is reported with ``print``.
    """
    if os.path.isdir(path):
        # Collect the sub-folders up front, then recurse into each of them.
        children = []
        for entry in os.listdir(path):
            candidate = os.path.join(path, entry)
            if os.path.isdir(candidate):
                children.append(candidate)
        for child in children:
            del_empty_folders(child)

        # List again: the recursion above may have emptied this folder.
        if len(os.listdir(path)) == 0:
            os.rmdir(path)
            print(f"删除空文件夹: {path}")
|
|
190
|
+
|
|
191
|
+
|
|
192
|
+
def DatasetSubfloderSplit(source_dir, split_dirs, percentage=None):
    """Split a dataset into train/val(/test) sets by its bottom-level folders.

    The bottom-level folders of ``source_dir`` are sorted, shuffled after
    seeding the global ``random`` generator with 10086, divided according to
    ``percentage`` and copied with ``shutil.copytree`` below the matching entry
    of ``split_dirs``.

    Args:
        source_dir (str): Source dataset directory.
        split_dirs (list): Destination directories, either
            ``[train_dir, val_dir]`` or ``[train_dir, val_dir, test_dir]``.
        percentage (list, optional): Split ratios, e.g. ``[0.9, 0.1]`` or
            ``[0.8, 0.1, 0.1]``. When ``None``:
            - a two-way split defaults to ``[0.9, 0.1]``
            - otherwise ``[0.8, 0.1, 0.1]`` is used

    Raises:
        ValueError: If ``split_dirs`` does not have 2 or 3 entries, if
            ``percentage`` has a different length than ``split_dirs``, or if
            the ratios do not sum to 1.0.

    Example:
        # Two-way split
        DatasetSubfloderSplit(
            source_dir=source_dataset_path,
            split_dirs=[target_train_path, target_val_path],
            percentage=[0.9, 0.1]
        )

        # Three-way split
        DatasetSubfloderSplit(
            source_dir=source_dataset_path,
            split_dirs=[target_train_path, target_val_path, target_test_path],
            percentage=[0.8, 0.1, 0.1]
        )

        # Two-way split with the default ratios
        DatasetSubfloderSplit(
            source_dir=source_dataset_path,
            split_dirs=[target_train_path, target_val_path]
        )
    """
    import math  # function-scope import: used only for the tolerance check

    if percentage is None:
        percentage = [0.9, 0.1] if len(split_dirs) == 2 else [0.8, 0.1, 0.1]

    # Validate the arguments.
    if len(split_dirs) not in [2, 3]:
        raise ValueError("只支持2路或3路分割(训练集/验证集 或 训练集/验证集/测试集)")
    if len(percentage) != len(split_dirs):
        raise ValueError("分割比例数量必须与目标目录数量相同")
    # Compare with a tolerance: sums of decimal fractions are not always
    # exactly 1.0 in binary floating point.
    if not math.isclose(sum(percentage), 1.0):
        raise ValueError("分割比例之和必须等于1.0")

    # Collect and shuffle the folder list.
    leaf_folder_list = sorted(get_leaf_folders(source_dir))
    random.seed(10086)
    random.shuffle(leaf_folder_list)
    total_folder_num = len(leaf_folder_list)

    # Cumulative split points; the last ratio needs none.
    split_indices = []
    acc_percentage = 0
    for p in percentage[:-1]:
        acc_percentage += p
        split_indices.append(int(total_folder_num * acc_percentage))

    # Cut the folder list at the split points.
    split_folder_lists = []
    start_idx = 0
    for end_idx in split_indices:
        split_folder_lists.append(leaf_folder_list[start_idx:end_idx])
        start_idx = end_idx
    split_folder_lists.append(leaf_folder_list[start_idx:])  # remaining part

    # Copy the folders.
    split_names = ['train', 'val', 'test'][:len(split_dirs)]
    for folders, target_dir, split_name in zip(split_folder_lists, split_dirs, split_names):
        for folder in tqdm(folders, desc=f"Copying {split_name} folders"):
            # Swap only the leading source_dir prefix of the path.
            target_folder = folder.replace(source_dir, target_dir, 1)
            os.makedirs(os.path.dirname(target_folder), exist_ok=True)
            shutil.copytree(folder, target_folder)

    # Print the statistics.
    print(f"Total folders: {total_folder_num}")
    for folders, split_name in zip(split_folder_lists, split_names):
        print(f"{split_name.capitalize()} folders: {len(folders)}")
|
|
266
|
+
|
|
267
|
+
|
|
268
|
+
def pcm2wav(pcm_path, wav_path, sr=16000, channels=1, subtype='PCM_16'):
    """
    Convert a raw PCM file into a wav file.

    The PCM file is read as a flat sequence of ``int16`` values and reshaped to
    ``channels`` columns before it is written.

    :param pcm_path: path of the input pcm file
    :param wav_path: path of the output wav file
    :param sr: sample rate written to the wav file
    :param channels: number of channels
    :param subtype: subtype passed on to ``sf.write``
    """
    samples = np.fromfile(pcm_path, dtype=np.int16)
    frames = samples.reshape(-1, channels)  # one column per channel
    sf.write(wav_path, frames, sr, subtype=subtype)
|
|
280
|
+
|
|
281
|
+
|
|
282
|
+
def wav2pcm(wav_path, pcm_path):
    """
    Convert a wav file into a raw PCM file.

    The audio is read as ``int16`` and the array is dumped to ``pcm_path``
    with ``tofile``; the sample rate returned by the reader is not used.

    :param wav_path: path of the input wav file
    :param pcm_path: path of the output pcm file
    """
    samples = sf.read(wav_path, dtype='int16')[0]
    samples.tofile(pcm_path)
|
|
290
|
+
|
|
291
|
+
|
|
292
|
+
def _save_histogram_figure(plt, title, values, out_path, bins):
    """Draw one histogram of ``values`` with a statistics label and save it to ``out_path``."""
    # Statistics label; each line after the first begins with a single space.
    stats_label = "\n ".join((
        f"max: {values.max():.2f}",
        f"min: {values.min():.2f}",
        f"mean: {values.mean():.2f}",
        f"std: {values.std():.2f}",
    ))
    # Use a dedicated figure so a figure the caller already has open is
    # neither drawn on nor closed.
    fig, ax = plt.subplots()
    try:
        ax.set_title(title)
        ax.set_xlabel("value")
        ax.set_ylabel("count")
        ax.grid(alpha=0.5)
        # Statistics go in the top-right corner (axes coordinates).
        ax.text(1, 1, stats_label, ha='right', va='top', transform=ax.transAxes)
        ax.hist(values, bins=bins)
        fig.savefig(out_path)
    finally:
        # Always release the figure, even when drawing or saving fails.
        plt.close(fig)


def save_weight_histogram(model, save_dir, mode=["params", "buffers"], ignore_name=["scale", "bias"], bins=100):
    """
    Save histograms of a model's weight distributions as PNG files.

    One image per tensor is written to ``save_dir/param`` (parameters) and
    ``save_dir/buffer`` (buffers). An existing ``save_dir`` is deleted first.

    Args:
        model: Object providing ``named_parameters()`` and ``named_buffers()``
            (a PyTorch model).
        save_dir: Output directory; removed and recreated on every call.
        mode: Which groups to plot; may contain "params" and/or "buffers".
            The default list is only read, never modified.
        ignore_name: Parameters whose name contains any of these substrings
            are skipped. Applies to parameters only. The default list is only
            read, never modified.
        bins: Number of histogram bins.
    """
    # Imported before save_dir is touched, so a missing matplotlib fails
    # without deleting anything.
    import matplotlib.pyplot as plt

    # Start from a clean output directory.
    if os.path.exists(save_dir):
        shutil.rmtree(save_dir)

    if "params" in mode:
        param_dir = os.path.join(save_dir, "param")
        os.makedirs(param_dir, exist_ok=True)
        for name, param in model.named_parameters():
            if any(ignore in name for ignore in ignore_name):
                continue
            values = param.cpu().data.flatten().numpy()
            _save_histogram_figure(plt, name, values, os.path.join(param_dir, f"{name}.png"), bins)

    if "buffers" in mode:
        buffer_dir = os.path.join(save_dir, "buffer")
        os.makedirs(buffer_dir, exist_ok=True)
        for name, buffer in model.named_buffers():
            # Only buffers named like running statistics are plotted.
            if "running_mean" not in name and "running_var" not in name:
                continue
            values = buffer.cpu().data.flatten().numpy()
            _save_histogram_figure(plt, name, values, os.path.join(buffer_dir, f"{name}.png"), bins)
|