pec-dss 0.1.0__tar.gz → 0.1.1__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {pec_dss-0.1.0/pec_dss.egg-info → pec_dss-0.1.1}/PKG-INFO +53 -1
- {pec_dss-0.1.0 → pec_dss-0.1.1}/README.md +52 -0
- {pec_dss-0.1.0 → pec_dss-0.1.1}/pec_dss/__init__.py +1 -1
- {pec_dss-0.1.0 → pec_dss-0.1.1/pec_dss.egg-info}/PKG-INFO +53 -1
- {pec_dss-0.1.0 → pec_dss-0.1.1}/pyproject.toml +1 -1
- {pec_dss-0.1.0 → pec_dss-0.1.1}/LICENSE +0 -0
- {pec_dss-0.1.0 → pec_dss-0.1.1}/MANIFEST.in +0 -0
- {pec_dss-0.1.0 → pec_dss-0.1.1}/docs/api/index.md +0 -0
- {pec_dss-0.1.0 → pec_dss-0.1.1}/docs/contributing.md +0 -0
- {pec_dss-0.1.0 → pec_dss-0.1.1}/docs/examples/basic_processor.md +0 -0
- {pec_dss-0.1.0 → pec_dss-0.1.1}/docs/examples/index.md +0 -0
- {pec_dss-0.1.0 → pec_dss-0.1.1}/docs/index.md +0 -0
- {pec_dss-0.1.0 → pec_dss-0.1.1}/docs/installation.md +0 -0
- {pec_dss-0.1.0 → pec_dss-0.1.1}/docs/usage.md +0 -0
- {pec_dss-0.1.0 → pec_dss-0.1.1}/examples/advanced_usage.py +0 -0
- {pec_dss-0.1.0 → pec_dss-0.1.1}/examples/basic_usage.py +0 -0
- {pec_dss-0.1.0 → pec_dss-0.1.1}/i18n/README_jp.md +0 -0
- {pec_dss-0.1.0 → pec_dss-0.1.1}/i18n/README_ko.md +0 -0
- {pec_dss-0.1.0 → pec_dss-0.1.1}/i18n/README_zh.md +0 -0
- {pec_dss-0.1.0 → pec_dss-0.1.1}/pec_dss/__main__.py +0 -0
- {pec_dss-0.1.0 → pec_dss-0.1.1}/pec_dss/cli.py +0 -0
- {pec_dss-0.1.0 → pec_dss-0.1.1}/pec_dss.egg-info/SOURCES.txt +0 -0
- {pec_dss-0.1.0 → pec_dss-0.1.1}/pec_dss.egg-info/dependency_links.txt +0 -0
- {pec_dss-0.1.0 → pec_dss-0.1.1}/pec_dss.egg-info/entry_points.txt +0 -0
- {pec_dss-0.1.0 → pec_dss-0.1.1}/pec_dss.egg-info/requires.txt +0 -0
- {pec_dss-0.1.0 → pec_dss-0.1.1}/pec_dss.egg-info/top_level.txt +0 -0
- {pec_dss-0.1.0 → pec_dss-0.1.1}/requirements-dev.txt +0 -0
- {pec_dss-0.1.0 → pec_dss-0.1.1}/requirements.txt +0 -0
- {pec_dss-0.1.0 → pec_dss-0.1.1}/setup.cfg +0 -0
- {pec_dss-0.1.0 → pec_dss-0.1.1}/setup.py +0 -0
- {pec_dss-0.1.0 → pec_dss-0.1.1}/tests/test_core.py +0 -0
@@ -1,6 +1,6 @@
|
|
1
1
|
Metadata-Version: 2.4
|
2
2
|
Name: pec-dss
|
3
|
-
Version: 0.1.0
|
3
|
+
Version: 0.1.1
|
4
4
|
Summary: Paralinguistic Event Classification from Diarized Speaker Segments
|
5
5
|
Author-email: Hyunwoo Kim <hwk06023@gmail.com>
|
6
6
|
License: GPL-3.0-only
|
@@ -118,6 +118,56 @@ for speaker, events in results.items():
|
|
118
118
|
print(f"Speaker {speaker} has {len(events)} attributed events")
|
119
119
|
```
|
120
120
|
|
121
|
+
### CLI Usage
|
122
|
+
|
123
|
+
```bash
|
124
|
+
pec-dss --speakers-dir ./speakers --unidentified-dir ./events --output-dir ./results
|
125
|
+
```
|
126
|
+
|
127
|
+
## 📁 Directory Structure
|
128
|
+
|
129
|
+
PEC-DSS expects a specific directory structure for processing audio files:
|
130
|
+
|
131
|
+
### Speaker Reference Structure
|
132
|
+
|
133
|
+
```
|
134
|
+
speakers_directory/
|
135
|
+
├── speaker_A/ # Each speaker's name becomes their ID
|
136
|
+
│ ├── audio1.wav # Reference voice samples for this speaker
|
137
|
+
│ ├── audio2.wav
|
138
|
+
│ └── ...
|
139
|
+
├── speaker_B/
|
140
|
+
│ ├── audio1.wav
|
141
|
+
│ └── ...
|
142
|
+
└── speaker_C/
|
143
|
+
├── audio1.wav
|
144
|
+
└── ...
|
145
|
+
```
|
146
|
+
|
147
|
+
### Unidentified Audio Structure
|
148
|
+
|
149
|
+
```
|
150
|
+
unidentified_directory/
|
151
|
+
├── laugh1.wav # Non-linguistic vocal events to be attributed to a speaker
|
152
|
+
├── giggle1.wav
|
153
|
+
└── ...
|
154
|
+
```
|
155
|
+
|
156
|
+
### Output Structure (After Processing)
|
157
|
+
|
158
|
+
```
|
159
|
+
output_directory/
|
160
|
+
├── results.json # JSON file with all results
|
161
|
+
├── speaker_A/ # Files assigned to each speaker
|
162
|
+
│ ├── 0_laugh1.wav
|
163
|
+
│ └── ...
|
164
|
+
├── speaker_B/
|
165
|
+
│ ├── 0_giggle1.wav
|
166
|
+
│ └── ...
|
167
|
+
└── unknown/ # Files below similarity threshold (if any)
|
168
|
+
└── ...
|
169
|
+
```
|
170
|
+
|
121
171
|
## 🧩 System Architecture
|
122
172
|
|
123
173
|
PEC-DSS consists of the following components:
|
@@ -138,6 +188,8 @@ The system can identify various paralinguistic events including:
|
|
138
188
|
* Coughing
|
139
189
|
* Other non-verbal vocal expressions
|
140
190
|
|
191
|
+
**Note:** PEC-DSS does not automatically classify these event types. It only determines which speaker produced the audio event.
|
192
|
+
|
141
193
|
## 🚀 Future Developments
|
142
194
|
|
143
195
|
* 🧠 Integration with more audio encoder models
|
@@ -77,6 +77,56 @@ for speaker, events in results.items():
|
|
77
77
|
print(f"Speaker {speaker} has {len(events)} attributed events")
|
78
78
|
```
|
79
79
|
|
80
|
+
### CLI Usage
|
81
|
+
|
82
|
+
```bash
|
83
|
+
pec-dss --speakers-dir ./speakers --unidentified-dir ./events --output-dir ./results
|
84
|
+
```
|
85
|
+
|
86
|
+
## 📁 Directory Structure
|
87
|
+
|
88
|
+
PEC-DSS expects a specific directory structure for processing audio files:
|
89
|
+
|
90
|
+
### Speaker Reference Structure
|
91
|
+
|
92
|
+
```
|
93
|
+
speakers_directory/
|
94
|
+
├── speaker_A/ # Each speaker's name becomes their ID
|
95
|
+
│ ├── audio1.wav # Reference voice samples for this speaker
|
96
|
+
│ ├── audio2.wav
|
97
|
+
│ └── ...
|
98
|
+
├── speaker_B/
|
99
|
+
│ ├── audio1.wav
|
100
|
+
│ └── ...
|
101
|
+
└── speaker_C/
|
102
|
+
├── audio1.wav
|
103
|
+
└── ...
|
104
|
+
```
|
105
|
+
|
106
|
+
### Unidentified Audio Structure
|
107
|
+
|
108
|
+
```
|
109
|
+
unidentified_directory/
|
110
|
+
├── laugh1.wav # Non-linguistic vocal events to be attributed to a speaker
|
111
|
+
├── giggle1.wav
|
112
|
+
└── ...
|
113
|
+
```
|
114
|
+
|
115
|
+
### Output Structure (After Processing)
|
116
|
+
|
117
|
+
```
|
118
|
+
output_directory/
|
119
|
+
├── results.json # JSON file with all results
|
120
|
+
├── speaker_A/ # Files assigned to each speaker
|
121
|
+
│ ├── 0_laugh1.wav
|
122
|
+
│ └── ...
|
123
|
+
├── speaker_B/
|
124
|
+
│ ├── 0_giggle1.wav
|
125
|
+
│ └── ...
|
126
|
+
└── unknown/ # Files below similarity threshold (if any)
|
127
|
+
└── ...
|
128
|
+
```
|
129
|
+
|
80
130
|
## 🧩 System Architecture
|
81
131
|
|
82
132
|
PEC-DSS consists of the following components:
|
@@ -97,6 +147,8 @@ The system can identify various paralinguistic events including:
|
|
97
147
|
* Coughing
|
98
148
|
* Other non-verbal vocal expressions
|
99
149
|
|
150
|
+
**Note:** PEC-DSS does not automatically classify these event types. It only determines which speaker produced the audio event.
|
151
|
+
|
100
152
|
## 🚀 Future Developments
|
101
153
|
|
102
154
|
* 🧠 Integration with more audio encoder models
|
@@ -1,6 +1,6 @@
|
|
1
1
|
Metadata-Version: 2.4
|
2
2
|
Name: pec-dss
|
3
|
-
Version: 0.1.0
|
3
|
+
Version: 0.1.1
|
4
4
|
Summary: Paralinguistic Event Classification from Diarized Speaker Segments
|
5
5
|
Author-email: Hyunwoo Kim <hwk06023@gmail.com>
|
6
6
|
License: GPL-3.0-only
|
@@ -118,6 +118,56 @@ for speaker, events in results.items():
|
|
118
118
|
print(f"Speaker {speaker} has {len(events)} attributed events")
|
119
119
|
```
|
120
120
|
|
121
|
+
### CLI Usage
|
122
|
+
|
123
|
+
```bash
|
124
|
+
pec-dss --speakers-dir ./speakers --unidentified-dir ./events --output-dir ./results
|
125
|
+
```
|
126
|
+
|
127
|
+
## 📁 Directory Structure
|
128
|
+
|
129
|
+
PEC-DSS expects a specific directory structure for processing audio files:
|
130
|
+
|
131
|
+
### Speaker Reference Structure
|
132
|
+
|
133
|
+
```
|
134
|
+
speakers_directory/
|
135
|
+
├── speaker_A/ # Each speaker's name becomes their ID
|
136
|
+
│ ├── audio1.wav # Reference voice samples for this speaker
|
137
|
+
│ ├── audio2.wav
|
138
|
+
│ └── ...
|
139
|
+
├── speaker_B/
|
140
|
+
│ ├── audio1.wav
|
141
|
+
│ └── ...
|
142
|
+
└── speaker_C/
|
143
|
+
├── audio1.wav
|
144
|
+
└── ...
|
145
|
+
```
|
146
|
+
|
147
|
+
### Unidentified Audio Structure
|
148
|
+
|
149
|
+
```
|
150
|
+
unidentified_directory/
|
151
|
+
├── laugh1.wav # Non-linguistic vocal events to be attributed to a speaker
|
152
|
+
├── giggle1.wav
|
153
|
+
└── ...
|
154
|
+
```
|
155
|
+
|
156
|
+
### Output Structure (After Processing)
|
157
|
+
|
158
|
+
```
|
159
|
+
output_directory/
|
160
|
+
├── results.json # JSON file with all results
|
161
|
+
├── speaker_A/ # Files assigned to each speaker
|
162
|
+
│ ├── 0_laugh1.wav
|
163
|
+
│ └── ...
|
164
|
+
├── speaker_B/
|
165
|
+
│ ├── 0_giggle1.wav
|
166
|
+
│ └── ...
|
167
|
+
└── unknown/ # Files below similarity threshold (if any)
|
168
|
+
└── ...
|
169
|
+
```
|
170
|
+
|
121
171
|
## 🧩 System Architecture
|
122
172
|
|
123
173
|
PEC-DSS consists of the following components:
|
@@ -138,6 +188,8 @@ The system can identify various paralinguistic events including:
|
|
138
188
|
* Coughing
|
139
189
|
* Other non-verbal vocal expressions
|
140
190
|
|
191
|
+
**Note:** PEC-DSS does not automatically classify these event types. It only determines which speaker produced the audio event.
|
192
|
+
|
141
193
|
## 🚀 Future Developments
|
142
194
|
|
143
195
|
* 🧠 Integration with more audio encoder models
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|