cc-transcript 0.3.0__tar.gz → 0.4.0__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {cc_transcript-0.3.0 → cc_transcript-0.4.0}/Cargo.lock +447 -4
- {cc_transcript-0.3.0 → cc_transcript-0.4.0}/PKG-INFO +10 -7
- {cc_transcript-0.3.0 → cc_transcript-0.4.0}/README.md +9 -6
- cc_transcript-0.4.0/cc_transcript/__init__.py +60 -0
- cc_transcript-0.4.0/cc_transcript/_parser_rs.pyi +37 -0
- {cc_transcript-0.3.0 → cc_transcript-0.4.0}/cc_transcript/backend.py +0 -3
- cc_transcript-0.4.0/cc_transcript/builders.py +108 -0
- {cc_transcript-0.3.0 → cc_transcript-0.4.0}/cc_transcript/discovery.py +0 -3
- {cc_transcript-0.3.0 → cc_transcript-0.4.0}/cc_transcript/filters.py +0 -14
- {cc_transcript-0.3.0 → cc_transcript-0.4.0}/cc_transcript/filterspec.py +25 -85
- {cc_transcript-0.3.0 → cc_transcript-0.4.0}/cc_transcript/models.py +0 -20
- {cc_transcript-0.3.0 → cc_transcript-0.4.0}/cc_transcript/parser.py +0 -11
- {cc_transcript-0.3.0 → cc_transcript-0.4.0}/cc_transcript/rust.py +0 -3
- cc_transcript-0.4.0/cc_transcript/sentiment/__init__.py +40 -0
- {cc_transcript-0.3.0 → cc_transcript-0.4.0}/cc_transcript/sentiment/buckets.py +0 -13
- cc_transcript-0.4.0/cc_transcript/sentiment/engine.py +105 -0
- {cc_transcript-0.3.0 → cc_transcript-0.4.0}/cc_transcript/sentiment/lexicon.py +69 -14
- {cc_transcript-0.3.0 → cc_transcript-0.4.0}/cc_transcript/sentiment/messages.py +0 -3
- cc_transcript-0.4.0/cc_transcript/sentiment/scorespec.py +213 -0
- {cc_transcript-0.3.0 → cc_transcript-0.4.0}/cc_transcript/store.py +0 -3
- {cc_transcript-0.3.0 → cc_transcript-0.4.0}/pyproject.toml +4 -1
- {cc_transcript-0.3.0 → cc_transcript-0.4.0}/rust/Cargo.toml +3 -1
- cc_transcript-0.4.0/rust/data/afinn-en-165.tsv +3352 -0
- cc_transcript-0.4.0/rust/data/domain_overrides.tsv +38 -0
- {cc_transcript-0.3.0 → cc_transcript-0.4.0}/rust/src/filter.rs +8 -6
- cc_transcript-0.4.0/rust/src/lexicon.rs +108 -0
- {cc_transcript-0.3.0 → cc_transcript-0.4.0}/rust/src/lib.rs +38 -0
- cc_transcript-0.4.0/rust/src/score.rs +171 -0
- cc_transcript-0.3.0/cc_transcript/__init__.py +0 -127
- cc_transcript-0.3.0/cc_transcript/_parser_rs.pyi +0 -21
- cc_transcript-0.3.0/cc_transcript/sentiment/__init__.py +0 -62
- cc_transcript-0.3.0/cc_transcript/sentiment/engine.py +0 -79
- cc_transcript-0.3.0/cc_transcript/sentiment/scorefilters.py +0 -149
- {cc_transcript-0.3.0 → cc_transcript-0.4.0}/Cargo.toml +0 -0
- {cc_transcript-0.3.0 → cc_transcript-0.4.0}/LICENSE +0 -0
- {cc_transcript-0.3.0 → cc_transcript-0.4.0}/cc_transcript/py.typed +0 -0
- {cc_transcript-0.3.0 → cc_transcript-0.4.0}/rust/src/event.rs +0 -0
- {cc_transcript-0.3.0 → cc_transcript-0.4.0}/rust/src/model.rs +0 -0
- {cc_transcript-0.3.0 → cc_transcript-0.4.0}/rust/src/value.rs +0 -0
|
@@ -2,6 +2,12 @@
|
|
|
2
2
|
# It is not intended for manual editing.
|
|
3
3
|
version = 4
|
|
4
4
|
|
|
5
|
+
[[package]]
|
|
6
|
+
name = "adler2"
|
|
7
|
+
version = "2.0.1"
|
|
8
|
+
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
9
|
+
checksum = "320119579fcad9c21884f5c4861d16174d0e06250625266f50fe6898340abefa"
|
|
10
|
+
|
|
5
11
|
[[package]]
|
|
6
12
|
name = "ahash"
|
|
7
13
|
version = "0.8.12"
|
|
@@ -9,7 +15,7 @@ source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
|
9
15
|
checksum = "5a15f179cd60c4584b8a8c596927aadc462e27f2ca70c04e0071964a73ba7a75"
|
|
10
16
|
dependencies = [
|
|
11
17
|
"cfg-if",
|
|
12
|
-
"getrandom",
|
|
18
|
+
"getrandom 0.3.4",
|
|
13
19
|
"once_cell",
|
|
14
20
|
"version_check",
|
|
15
21
|
"zerocopy",
|
|
@@ -30,6 +36,12 @@ version = "1.5.1"
|
|
|
30
36
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
31
37
|
checksum = "f2032f911046de80f0a198e0901378627c33f59ea0ac00e363d481118bd70a53"
|
|
32
38
|
|
|
39
|
+
[[package]]
|
|
40
|
+
name = "base64"
|
|
41
|
+
version = "0.22.1"
|
|
42
|
+
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
43
|
+
checksum = "72b3254f16251a8381aa12e40e3c4d2f0199f8c6508fbecb9d91f575e0fbb8c6"
|
|
44
|
+
|
|
33
45
|
[[package]]
|
|
34
46
|
name = "bumpalo"
|
|
35
47
|
version = "3.20.3"
|
|
@@ -42,12 +54,23 @@ version = "1.11.1"
|
|
|
42
54
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
43
55
|
checksum = "1e748733b7cbc798e1434b6ac524f0c1ff2ab456fe201501e6497c8417a4fc33"
|
|
44
56
|
|
|
57
|
+
[[package]]
|
|
58
|
+
name = "cc"
|
|
59
|
+
version = "1.2.63"
|
|
60
|
+
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
61
|
+
checksum = "556e016178bb5662a08681bbe0f00f8e17631781a4dfc8c45e466e4b185ec27f"
|
|
62
|
+
dependencies = [
|
|
63
|
+
"find-msvc-tools",
|
|
64
|
+
"shlex",
|
|
65
|
+
]
|
|
66
|
+
|
|
45
67
|
[[package]]
|
|
46
68
|
name = "cc_transcript_parser"
|
|
47
|
-
version = "0.3.0"
|
|
69
|
+
version = "0.4.0"
|
|
48
70
|
dependencies = [
|
|
49
71
|
"chrono",
|
|
50
72
|
"crossbeam-channel",
|
|
73
|
+
"dirs",
|
|
51
74
|
"memchr",
|
|
52
75
|
"num_cpus",
|
|
53
76
|
"once_cell",
|
|
@@ -56,6 +79,7 @@ dependencies = [
|
|
|
56
79
|
"regex",
|
|
57
80
|
"serde",
|
|
58
81
|
"sonic-rs",
|
|
82
|
+
"udpipe-rs",
|
|
59
83
|
]
|
|
60
84
|
|
|
61
85
|
[[package]]
|
|
@@ -73,6 +97,15 @@ dependencies = [
|
|
|
73
97
|
"num-traits",
|
|
74
98
|
]
|
|
75
99
|
|
|
100
|
+
[[package]]
|
|
101
|
+
name = "crc32fast"
|
|
102
|
+
version = "1.5.0"
|
|
103
|
+
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
104
|
+
checksum = "9481c1c90cbf2ac953f07c8d4a58aa3945c425b7185c9154d67a65e4230da511"
|
|
105
|
+
dependencies = [
|
|
106
|
+
"cfg-if",
|
|
107
|
+
]
|
|
108
|
+
|
|
76
109
|
[[package]]
|
|
77
110
|
name = "crossbeam-channel"
|
|
78
111
|
version = "0.5.15"
|
|
@@ -107,6 +140,27 @@ version = "0.8.21"
|
|
|
107
140
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
108
141
|
checksum = "d0a5c400df2834b80a4c3327b3aad3a4c4cd4de0629063962b03235697506a28"
|
|
109
142
|
|
|
143
|
+
[[package]]
|
|
144
|
+
name = "dirs"
|
|
145
|
+
version = "5.0.1"
|
|
146
|
+
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
147
|
+
checksum = "44c45a9d03d6676652bcb5e724c7e988de1acad23a711b5217ab9cbecbec2225"
|
|
148
|
+
dependencies = [
|
|
149
|
+
"dirs-sys",
|
|
150
|
+
]
|
|
151
|
+
|
|
152
|
+
[[package]]
|
|
153
|
+
name = "dirs-sys"
|
|
154
|
+
version = "0.4.1"
|
|
155
|
+
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
156
|
+
checksum = "520f05a5cbd335fae5a99ff7a6ab8627577660ee5cfd6a94a6a929b52ff0321c"
|
|
157
|
+
dependencies = [
|
|
158
|
+
"libc",
|
|
159
|
+
"option-ext",
|
|
160
|
+
"redox_users",
|
|
161
|
+
"windows-sys 0.48.0",
|
|
162
|
+
]
|
|
163
|
+
|
|
110
164
|
[[package]]
|
|
111
165
|
name = "either"
|
|
112
166
|
version = "1.16.0"
|
|
@@ -131,6 +185,22 @@ dependencies = [
|
|
|
131
185
|
"simdutf8",
|
|
132
186
|
]
|
|
133
187
|
|
|
188
|
+
[[package]]
|
|
189
|
+
name = "find-msvc-tools"
|
|
190
|
+
version = "0.1.9"
|
|
191
|
+
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
192
|
+
checksum = "5baebc0774151f905a1a2cc41989300b1e6fbb29aff0ceffa1064fdd3088d582"
|
|
193
|
+
|
|
194
|
+
[[package]]
|
|
195
|
+
name = "flate2"
|
|
196
|
+
version = "1.1.9"
|
|
197
|
+
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
198
|
+
checksum = "843fba2746e448b37e26a819579957415c8cef339bf08564fe8b7ddbd959573c"
|
|
199
|
+
dependencies = [
|
|
200
|
+
"crc32fast",
|
|
201
|
+
"miniz_oxide",
|
|
202
|
+
]
|
|
203
|
+
|
|
134
204
|
[[package]]
|
|
135
205
|
name = "futures-core"
|
|
136
206
|
version = "0.3.32"
|
|
@@ -155,6 +225,17 @@ dependencies = [
|
|
|
155
225
|
"slab",
|
|
156
226
|
]
|
|
157
227
|
|
|
228
|
+
[[package]]
|
|
229
|
+
name = "getrandom"
|
|
230
|
+
version = "0.2.17"
|
|
231
|
+
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
232
|
+
checksum = "ff2abc00be7fca6ebc474524697ae276ad847ad0a6b3faa4bcb027e9a4614ad0"
|
|
233
|
+
dependencies = [
|
|
234
|
+
"cfg-if",
|
|
235
|
+
"libc",
|
|
236
|
+
"wasi",
|
|
237
|
+
]
|
|
238
|
+
|
|
158
239
|
[[package]]
|
|
159
240
|
name = "getrandom"
|
|
160
241
|
version = "0.3.4"
|
|
@@ -185,6 +266,22 @@ version = "0.5.2"
|
|
|
185
266
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
186
267
|
checksum = "fc0fef456e4baa96da950455cd02c081ca953b141298e41db3fc7e36b1da849c"
|
|
187
268
|
|
|
269
|
+
[[package]]
|
|
270
|
+
name = "http"
|
|
271
|
+
version = "1.4.2"
|
|
272
|
+
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
273
|
+
checksum = "6970f50e31d6fc17d3fa27329444bfa74e196cf62e95052a3f6fee181dba6425"
|
|
274
|
+
dependencies = [
|
|
275
|
+
"bytes",
|
|
276
|
+
"itoa",
|
|
277
|
+
]
|
|
278
|
+
|
|
279
|
+
[[package]]
|
|
280
|
+
name = "httparse"
|
|
281
|
+
version = "1.10.1"
|
|
282
|
+
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
283
|
+
checksum = "6dbf3de79e51f3d586ab4cb9d5c3e2c14aa28ed23d180cf89b4df0454a69cc87"
|
|
284
|
+
|
|
188
285
|
[[package]]
|
|
189
286
|
name = "indexmap"
|
|
190
287
|
version = "2.14.0"
|
|
@@ -219,12 +316,37 @@ version = "0.2.186"
|
|
|
219
316
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
220
317
|
checksum = "68ab91017fe16c622486840e4c83c9a37afeff978bd239b5293d61ece587de66"
|
|
221
318
|
|
|
319
|
+
[[package]]
|
|
320
|
+
name = "libredox"
|
|
321
|
+
version = "0.1.17"
|
|
322
|
+
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
323
|
+
checksum = "f02ab6bace2054fb888a3c16f990117b579d14a3088e472d63c6011fa185c9d3"
|
|
324
|
+
dependencies = [
|
|
325
|
+
"libc",
|
|
326
|
+
]
|
|
327
|
+
|
|
328
|
+
[[package]]
|
|
329
|
+
name = "log"
|
|
330
|
+
version = "0.4.32"
|
|
331
|
+
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
332
|
+
checksum = "953f07c43838f8e6f9758cab68bf5bed85465e7587ebe0b823f1bcd81978ad3a"
|
|
333
|
+
|
|
222
334
|
[[package]]
|
|
223
335
|
name = "memchr"
|
|
224
336
|
version = "2.8.1"
|
|
225
337
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
226
338
|
checksum = "6b947ae49db0d222b1dbc6b113ce7248a3fc3a6ca21b696717bfc000ba4484d8"
|
|
227
339
|
|
|
340
|
+
[[package]]
|
|
341
|
+
name = "miniz_oxide"
|
|
342
|
+
version = "0.8.9"
|
|
343
|
+
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
344
|
+
checksum = "1fa76a2c86f704bdb222d66965fb3d63269ce38518b83cb0575fca855ebb6316"
|
|
345
|
+
dependencies = [
|
|
346
|
+
"adler2",
|
|
347
|
+
"simd-adler32",
|
|
348
|
+
]
|
|
349
|
+
|
|
228
350
|
[[package]]
|
|
229
351
|
name = "munge"
|
|
230
352
|
version = "0.4.7"
|
|
@@ -270,6 +392,18 @@ version = "1.21.4"
|
|
|
270
392
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
271
393
|
checksum = "9f7c3e4beb33f85d45ae3e3a1792185706c8e16d043238c593331cc7cd313b50"
|
|
272
394
|
|
|
395
|
+
[[package]]
|
|
396
|
+
name = "option-ext"
|
|
397
|
+
version = "0.2.0"
|
|
398
|
+
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
399
|
+
checksum = "04744f49eae99ab78e0d5c0b603ab218f515ea8cfe5a456d7629ad883a3b6e7d"
|
|
400
|
+
|
|
401
|
+
[[package]]
|
|
402
|
+
name = "percent-encoding"
|
|
403
|
+
version = "2.3.2"
|
|
404
|
+
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
405
|
+
checksum = "9b4f627cb1b25917193a259e49bdad08f671f8d9708acfd5fe0a8c1455d87220"
|
|
406
|
+
|
|
273
407
|
[[package]]
|
|
274
408
|
name = "pin-project-lite"
|
|
275
409
|
version = "0.2.17"
|
|
@@ -414,6 +548,17 @@ dependencies = [
|
|
|
414
548
|
"crossbeam-utils",
|
|
415
549
|
]
|
|
416
550
|
|
|
551
|
+
[[package]]
|
|
552
|
+
name = "redox_users"
|
|
553
|
+
version = "0.4.6"
|
|
554
|
+
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
555
|
+
checksum = "ba009ff324d1fc1b900bd1fdb31564febe58a8ccc8a6fdbb93b543d33b13ca43"
|
|
556
|
+
dependencies = [
|
|
557
|
+
"getrandom 0.2.17",
|
|
558
|
+
"libredox",
|
|
559
|
+
"thiserror 1.0.69",
|
|
560
|
+
]
|
|
561
|
+
|
|
417
562
|
[[package]]
|
|
418
563
|
name = "ref-cast"
|
|
419
564
|
version = "1.0.25"
|
|
@@ -469,6 +614,20 @@ version = "0.5.3"
|
|
|
469
614
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
470
615
|
checksum = "cadadef317c2f20755a64d7fdc48f9e7178ee6b0e1f7fce33fa60f1d68a276e6"
|
|
471
616
|
|
|
617
|
+
[[package]]
|
|
618
|
+
name = "ring"
|
|
619
|
+
version = "0.17.14"
|
|
620
|
+
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
621
|
+
checksum = "a4689e6c2294d81e88dc6261c768b63bc4fcdb852be6d1352498b114f61383b7"
|
|
622
|
+
dependencies = [
|
|
623
|
+
"cc",
|
|
624
|
+
"cfg-if",
|
|
625
|
+
"getrandom 0.2.17",
|
|
626
|
+
"libc",
|
|
627
|
+
"untrusted",
|
|
628
|
+
"windows-sys 0.52.0",
|
|
629
|
+
]
|
|
630
|
+
|
|
472
631
|
[[package]]
|
|
473
632
|
name = "rkyv"
|
|
474
633
|
version = "0.8.16"
|
|
@@ -498,6 +657,41 @@ dependencies = [
|
|
|
498
657
|
"syn",
|
|
499
658
|
]
|
|
500
659
|
|
|
660
|
+
[[package]]
|
|
661
|
+
name = "rustls"
|
|
662
|
+
version = "0.23.40"
|
|
663
|
+
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
664
|
+
checksum = "ef86cd5876211988985292b91c96a8f2d298df24e75989a43a3c73f2d4d8168b"
|
|
665
|
+
dependencies = [
|
|
666
|
+
"log",
|
|
667
|
+
"once_cell",
|
|
668
|
+
"ring",
|
|
669
|
+
"rustls-pki-types",
|
|
670
|
+
"rustls-webpki",
|
|
671
|
+
"subtle",
|
|
672
|
+
"zeroize",
|
|
673
|
+
]
|
|
674
|
+
|
|
675
|
+
[[package]]
|
|
676
|
+
name = "rustls-pki-types"
|
|
677
|
+
version = "1.14.1"
|
|
678
|
+
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
679
|
+
checksum = "30a7197ae7eb376e574fe940d068c30fe0462554a3ddbe4eca7838e049c937a9"
|
|
680
|
+
dependencies = [
|
|
681
|
+
"zeroize",
|
|
682
|
+
]
|
|
683
|
+
|
|
684
|
+
[[package]]
|
|
685
|
+
name = "rustls-webpki"
|
|
686
|
+
version = "0.103.13"
|
|
687
|
+
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
688
|
+
checksum = "61c429a8649f110dddef65e2a5ad240f747e85f7758a6bccc7e5777bd33f756e"
|
|
689
|
+
dependencies = [
|
|
690
|
+
"ring",
|
|
691
|
+
"rustls-pki-types",
|
|
692
|
+
"untrusted",
|
|
693
|
+
]
|
|
694
|
+
|
|
501
695
|
[[package]]
|
|
502
696
|
name = "rustversion"
|
|
503
697
|
version = "1.0.22"
|
|
@@ -534,6 +728,18 @@ dependencies = [
|
|
|
534
728
|
"syn",
|
|
535
729
|
]
|
|
536
730
|
|
|
731
|
+
[[package]]
|
|
732
|
+
name = "shlex"
|
|
733
|
+
version = "2.0.1"
|
|
734
|
+
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
735
|
+
checksum = "f8fadd59c855ef2080decdef8ff161eb6661b86933c9d82e5ba29dc602a55aba"
|
|
736
|
+
|
|
737
|
+
[[package]]
|
|
738
|
+
name = "simd-adler32"
|
|
739
|
+
version = "0.3.9"
|
|
740
|
+
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
741
|
+
checksum = "703d5c7ef118737c72f1af64ad2f6f8c5e1921f818cdcb97b8fe6fc69bf66214"
|
|
742
|
+
|
|
537
743
|
[[package]]
|
|
538
744
|
name = "simdutf8"
|
|
539
745
|
version = "0.1.5"
|
|
@@ -572,7 +778,7 @@ dependencies = [
|
|
|
572
778
|
"simdutf8",
|
|
573
779
|
"sonic-number",
|
|
574
780
|
"sonic-simd",
|
|
575
|
-
"thiserror",
|
|
781
|
+
"thiserror 2.0.18",
|
|
576
782
|
"zmij",
|
|
577
783
|
]
|
|
578
784
|
|
|
@@ -585,6 +791,12 @@ dependencies = [
|
|
|
585
791
|
"cfg-if",
|
|
586
792
|
]
|
|
587
793
|
|
|
794
|
+
[[package]]
|
|
795
|
+
name = "subtle"
|
|
796
|
+
version = "2.6.1"
|
|
797
|
+
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
798
|
+
checksum = "13c2bddecc57b384dee18652358fb23172facb8a2c51ccc10d74c157bdea3292"
|
|
799
|
+
|
|
588
800
|
[[package]]
|
|
589
801
|
name = "syn"
|
|
590
802
|
version = "2.0.117"
|
|
@@ -602,13 +814,33 @@ version = "0.13.5"
|
|
|
602
814
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
603
815
|
checksum = "adb6935a6f5c20170eeceb1a3835a49e12e19d792f6dd344ccc76a985ca5a6ca"
|
|
604
816
|
|
|
817
|
+
[[package]]
|
|
818
|
+
name = "thiserror"
|
|
819
|
+
version = "1.0.69"
|
|
820
|
+
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
821
|
+
checksum = "b6aaf5339b578ea85b50e080feb250a3e8ae8cfcdff9a461c9ec2904bc923f52"
|
|
822
|
+
dependencies = [
|
|
823
|
+
"thiserror-impl 1.0.69",
|
|
824
|
+
]
|
|
825
|
+
|
|
605
826
|
[[package]]
|
|
606
827
|
name = "thiserror"
|
|
607
828
|
version = "2.0.18"
|
|
608
829
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
609
830
|
checksum = "4288b5bcbc7920c07a1149a35cf9590a2aa808e0bc1eafaade0b80947865fbc4"
|
|
610
831
|
dependencies = [
|
|
611
|
-
"thiserror-impl",
|
|
832
|
+
"thiserror-impl 2.0.18",
|
|
833
|
+
]
|
|
834
|
+
|
|
835
|
+
[[package]]
|
|
836
|
+
name = "thiserror-impl"
|
|
837
|
+
version = "1.0.69"
|
|
838
|
+
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
839
|
+
checksum = "4fee6c4efc90059e10f81e6d42c60a18f76588c3d74cb83a0b242a2b6c7504c1"
|
|
840
|
+
dependencies = [
|
|
841
|
+
"proc-macro2",
|
|
842
|
+
"quote",
|
|
843
|
+
"syn",
|
|
612
844
|
]
|
|
613
845
|
|
|
614
846
|
[[package]]
|
|
@@ -637,12 +869,63 @@ version = "0.1.1"
|
|
|
637
869
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
638
870
|
checksum = "1f3ccbac311fea05f86f61904b462b55fb3df8837a366dfc601a0161d0532f20"
|
|
639
871
|
|
|
872
|
+
[[package]]
|
|
873
|
+
name = "udpipe-rs"
|
|
874
|
+
version = "0.2.0"
|
|
875
|
+
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
876
|
+
checksum = "9a8f34a036b145a2d253613c2742c836f79c9d5f9c2220f03931762224d23452"
|
|
877
|
+
dependencies = [
|
|
878
|
+
"cc",
|
|
879
|
+
"ureq",
|
|
880
|
+
]
|
|
881
|
+
|
|
640
882
|
[[package]]
|
|
641
883
|
name = "unicode-ident"
|
|
642
884
|
version = "1.0.24"
|
|
643
885
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
644
886
|
checksum = "e6e4313cd5fcd3dad5cafa179702e2b244f760991f45397d14d4ebf38247da75"
|
|
645
887
|
|
|
888
|
+
[[package]]
|
|
889
|
+
name = "untrusted"
|
|
890
|
+
version = "0.9.0"
|
|
891
|
+
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
892
|
+
checksum = "8ecb6da28b8a351d773b68d5825ac39017e680750f980f3a1a85cd8dd28a47c1"
|
|
893
|
+
|
|
894
|
+
[[package]]
|
|
895
|
+
name = "ureq"
|
|
896
|
+
version = "3.3.0"
|
|
897
|
+
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
898
|
+
checksum = "dea7109cdcd5864d4eeb1b58a1648dc9bf520360d7af16ec26d0a9354bafcfc0"
|
|
899
|
+
dependencies = [
|
|
900
|
+
"base64",
|
|
901
|
+
"flate2",
|
|
902
|
+
"log",
|
|
903
|
+
"percent-encoding",
|
|
904
|
+
"rustls",
|
|
905
|
+
"rustls-pki-types",
|
|
906
|
+
"ureq-proto",
|
|
907
|
+
"utf8-zero",
|
|
908
|
+
"webpki-roots",
|
|
909
|
+
]
|
|
910
|
+
|
|
911
|
+
[[package]]
|
|
912
|
+
name = "ureq-proto"
|
|
913
|
+
version = "0.6.0"
|
|
914
|
+
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
915
|
+
checksum = "e994ba84b0bd1b1b0cf92878b7ef898a5c1760108fe7b6010327e274917a808c"
|
|
916
|
+
dependencies = [
|
|
917
|
+
"base64",
|
|
918
|
+
"http",
|
|
919
|
+
"httparse",
|
|
920
|
+
"log",
|
|
921
|
+
]
|
|
922
|
+
|
|
923
|
+
[[package]]
|
|
924
|
+
name = "utf8-zero"
|
|
925
|
+
version = "0.8.1"
|
|
926
|
+
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
927
|
+
checksum = "b8c0a043c9540bae7c578c88f91dda8bd82e59ae27c21baca69c8b191aaf5a6e"
|
|
928
|
+
|
|
646
929
|
[[package]]
|
|
647
930
|
name = "uuid"
|
|
648
931
|
version = "1.23.2"
|
|
@@ -659,6 +942,12 @@ version = "0.9.5"
|
|
|
659
942
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
660
943
|
checksum = "0b928f33d975fc6ad9f86c8f283853ad26bdd5b10b7f1542aa2fa15e2289105a"
|
|
661
944
|
|
|
945
|
+
[[package]]
|
|
946
|
+
name = "wasi"
|
|
947
|
+
version = "0.11.1+wasi-snapshot-preview1"
|
|
948
|
+
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
949
|
+
checksum = "ccf3ec651a847eb01de73ccad15eb7d99f80485de043efb2f370cd654f4ea44b"
|
|
950
|
+
|
|
662
951
|
[[package]]
|
|
663
952
|
name = "wasip2"
|
|
664
953
|
version = "1.0.3+wasi-0.2.9"
|
|
@@ -713,6 +1002,154 @@ dependencies = [
|
|
|
713
1002
|
"unicode-ident",
|
|
714
1003
|
]
|
|
715
1004
|
|
|
1005
|
+
[[package]]
|
|
1006
|
+
name = "webpki-roots"
|
|
1007
|
+
version = "1.0.7"
|
|
1008
|
+
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
1009
|
+
checksum = "52f5ee44c96cf55f1b349600768e3ece3a8f26010c05265ab73f945bb1a2eb9d"
|
|
1010
|
+
dependencies = [
|
|
1011
|
+
"rustls-pki-types",
|
|
1012
|
+
]
|
|
1013
|
+
|
|
1014
|
+
[[package]]
|
|
1015
|
+
name = "windows-sys"
|
|
1016
|
+
version = "0.48.0"
|
|
1017
|
+
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
1018
|
+
checksum = "677d2418bec65e3338edb076e806bc1ec15693c5d0104683f2efe857f61056a9"
|
|
1019
|
+
dependencies = [
|
|
1020
|
+
"windows-targets 0.48.5",
|
|
1021
|
+
]
|
|
1022
|
+
|
|
1023
|
+
[[package]]
|
|
1024
|
+
name = "windows-sys"
|
|
1025
|
+
version = "0.52.0"
|
|
1026
|
+
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
1027
|
+
checksum = "282be5f36a8ce781fad8c8ae18fa3f9beff57ec1b52cb3de0789201425d9a33d"
|
|
1028
|
+
dependencies = [
|
|
1029
|
+
"windows-targets 0.52.6",
|
|
1030
|
+
]
|
|
1031
|
+
|
|
1032
|
+
[[package]]
|
|
1033
|
+
name = "windows-targets"
|
|
1034
|
+
version = "0.48.5"
|
|
1035
|
+
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
1036
|
+
checksum = "9a2fa6e2155d7247be68c096456083145c183cbbbc2764150dda45a87197940c"
|
|
1037
|
+
dependencies = [
|
|
1038
|
+
"windows_aarch64_gnullvm 0.48.5",
|
|
1039
|
+
"windows_aarch64_msvc 0.48.5",
|
|
1040
|
+
"windows_i686_gnu 0.48.5",
|
|
1041
|
+
"windows_i686_msvc 0.48.5",
|
|
1042
|
+
"windows_x86_64_gnu 0.48.5",
|
|
1043
|
+
"windows_x86_64_gnullvm 0.48.5",
|
|
1044
|
+
"windows_x86_64_msvc 0.48.5",
|
|
1045
|
+
]
|
|
1046
|
+
|
|
1047
|
+
[[package]]
|
|
1048
|
+
name = "windows-targets"
|
|
1049
|
+
version = "0.52.6"
|
|
1050
|
+
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
1051
|
+
checksum = "9b724f72796e036ab90c1021d4780d4d3d648aca59e491e6b98e725b84e99973"
|
|
1052
|
+
dependencies = [
|
|
1053
|
+
"windows_aarch64_gnullvm 0.52.6",
|
|
1054
|
+
"windows_aarch64_msvc 0.52.6",
|
|
1055
|
+
"windows_i686_gnu 0.52.6",
|
|
1056
|
+
"windows_i686_gnullvm",
|
|
1057
|
+
"windows_i686_msvc 0.52.6",
|
|
1058
|
+
"windows_x86_64_gnu 0.52.6",
|
|
1059
|
+
"windows_x86_64_gnullvm 0.52.6",
|
|
1060
|
+
"windows_x86_64_msvc 0.52.6",
|
|
1061
|
+
]
|
|
1062
|
+
|
|
1063
|
+
[[package]]
|
|
1064
|
+
name = "windows_aarch64_gnullvm"
|
|
1065
|
+
version = "0.48.5"
|
|
1066
|
+
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
1067
|
+
checksum = "2b38e32f0abccf9987a4e3079dfb67dcd799fb61361e53e2882c3cbaf0d905d8"
|
|
1068
|
+
|
|
1069
|
+
[[package]]
|
|
1070
|
+
name = "windows_aarch64_gnullvm"
|
|
1071
|
+
version = "0.52.6"
|
|
1072
|
+
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
1073
|
+
checksum = "32a4622180e7a0ec044bb555404c800bc9fd9ec262ec147edd5989ccd0c02cd3"
|
|
1074
|
+
|
|
1075
|
+
[[package]]
|
|
1076
|
+
name = "windows_aarch64_msvc"
|
|
1077
|
+
version = "0.48.5"
|
|
1078
|
+
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
1079
|
+
checksum = "dc35310971f3b2dbbf3f0690a219f40e2d9afcf64f9ab7cc1be722937c26b4bc"
|
|
1080
|
+
|
|
1081
|
+
[[package]]
|
|
1082
|
+
name = "windows_aarch64_msvc"
|
|
1083
|
+
version = "0.52.6"
|
|
1084
|
+
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
1085
|
+
checksum = "09ec2a7bb152e2252b53fa7803150007879548bc709c039df7627cabbd05d469"
|
|
1086
|
+
|
|
1087
|
+
[[package]]
|
|
1088
|
+
name = "windows_i686_gnu"
|
|
1089
|
+
version = "0.48.5"
|
|
1090
|
+
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
1091
|
+
checksum = "a75915e7def60c94dcef72200b9a8e58e5091744960da64ec734a6c6e9b3743e"
|
|
1092
|
+
|
|
1093
|
+
[[package]]
|
|
1094
|
+
name = "windows_i686_gnu"
|
|
1095
|
+
version = "0.52.6"
|
|
1096
|
+
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
1097
|
+
checksum = "8e9b5ad5ab802e97eb8e295ac6720e509ee4c243f69d781394014ebfe8bbfa0b"
|
|
1098
|
+
|
|
1099
|
+
[[package]]
|
|
1100
|
+
name = "windows_i686_gnullvm"
|
|
1101
|
+
version = "0.52.6"
|
|
1102
|
+
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
1103
|
+
checksum = "0eee52d38c090b3caa76c563b86c3a4bd71ef1a819287c19d586d7334ae8ed66"
|
|
1104
|
+
|
|
1105
|
+
[[package]]
|
|
1106
|
+
name = "windows_i686_msvc"
|
|
1107
|
+
version = "0.48.5"
|
|
1108
|
+
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
1109
|
+
checksum = "8f55c233f70c4b27f66c523580f78f1004e8b5a8b659e05a4eb49d4166cca406"
|
|
1110
|
+
|
|
1111
|
+
[[package]]
|
|
1112
|
+
name = "windows_i686_msvc"
|
|
1113
|
+
version = "0.52.6"
|
|
1114
|
+
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
1115
|
+
checksum = "240948bc05c5e7c6dabba28bf89d89ffce3e303022809e73deaefe4f6ec56c66"
|
|
1116
|
+
|
|
1117
|
+
[[package]]
|
|
1118
|
+
name = "windows_x86_64_gnu"
|
|
1119
|
+
version = "0.48.5"
|
|
1120
|
+
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
1121
|
+
checksum = "53d40abd2583d23e4718fddf1ebec84dbff8381c07cae67ff7768bbf19c6718e"
|
|
1122
|
+
|
|
1123
|
+
[[package]]
|
|
1124
|
+
name = "windows_x86_64_gnu"
|
|
1125
|
+
version = "0.52.6"
|
|
1126
|
+
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
1127
|
+
checksum = "147a5c80aabfbf0c7d901cb5895d1de30ef2907eb21fbbab29ca94c5b08b1a78"
|
|
1128
|
+
|
|
1129
|
+
[[package]]
|
|
1130
|
+
name = "windows_x86_64_gnullvm"
|
|
1131
|
+
version = "0.48.5"
|
|
1132
|
+
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
1133
|
+
checksum = "0b7b52767868a23d5bab768e390dc5f5c55825b6d30b86c844ff2dc7414044cc"
|
|
1134
|
+
|
|
1135
|
+
[[package]]
|
|
1136
|
+
name = "windows_x86_64_gnullvm"
|
|
1137
|
+
version = "0.52.6"
|
|
1138
|
+
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
1139
|
+
checksum = "24d5b23dc417412679681396f2b49f3de8c1473deb516bd34410872eff51ed0d"
|
|
1140
|
+
|
|
1141
|
+
[[package]]
|
|
1142
|
+
name = "windows_x86_64_msvc"
|
|
1143
|
+
version = "0.48.5"
|
|
1144
|
+
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
1145
|
+
checksum = "ed94fce61571a4006852b7389a063ab983c02eb1bb37b47f8272ce92d06d9538"
|
|
1146
|
+
|
|
1147
|
+
[[package]]
|
|
1148
|
+
name = "windows_x86_64_msvc"
|
|
1149
|
+
version = "0.52.6"
|
|
1150
|
+
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
1151
|
+
checksum = "589f6da84c646204747d1270a2a5661ea66ed1cced2631d546fdfb155959f9ec"
|
|
1152
|
+
|
|
716
1153
|
[[package]]
|
|
717
1154
|
name = "wit-bindgen"
|
|
718
1155
|
version = "0.57.1"
|
|
@@ -739,6 +1176,12 @@ dependencies = [
|
|
|
739
1176
|
"syn",
|
|
740
1177
|
]
|
|
741
1178
|
|
|
1179
|
+
[[package]]
|
|
1180
|
+
name = "zeroize"
|
|
1181
|
+
version = "1.8.2"
|
|
1182
|
+
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
1183
|
+
checksum = "b97154e67e32c85465826e8bcc1c59429aaaf107c1e4a9e53c8d8ccd5eff88d0"
|
|
1184
|
+
|
|
742
1185
|
[[package]]
|
|
743
1186
|
name = "zmij"
|
|
744
1187
|
version = "1.0.21"
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: cc-transcript
|
|
3
|
-
Version: 0.3.0
|
|
3
|
+
Version: 0.4.0
|
|
4
4
|
Classifier: Development Status :: 3 - Alpha
|
|
5
5
|
Classifier: Intended Audience :: Developers
|
|
6
6
|
Classifier: Operating System :: OS Independent
|
|
@@ -63,21 +63,24 @@ for event in events:
|
|
|
63
63
|
print(f"assistant ({model}):", text[:80])
|
|
64
64
|
```
|
|
65
65
|
|
|
66
|
-
|
|
67
|
-
|
|
66
|
+
Compose a filter from small building blocks and apply it. The builders return clauses,
|
|
67
|
+
`build_spec` assembles them into a spec, and `apply_spec` yields the survivors:
|
|
68
68
|
|
|
69
69
|
```python
|
|
70
|
-
from cc_transcript import
|
|
70
|
+
from cc_transcript import apply_spec, build_spec, keep_only, drop_junk, drop_short
|
|
71
71
|
|
|
72
|
-
|
|
72
|
+
spec = build_spec(keep_only("user", "assistant"), drop_junk("structural"), drop_short(2))
|
|
73
|
+
clean = list(apply_spec(events, spec))
|
|
73
74
|
```
|
|
74
75
|
|
|
75
|
-
|
|
76
|
+
`NOISE_SPEC` is a ready-made spec for the universal structural noise (system reminders,
|
|
77
|
+
local-command output, skill banners). For flag-style filtering, `FilterConfig` is also
|
|
78
|
+
available — every rule is off by default, so a bare `FilterConfig()` passes everything through.
|
|
76
79
|
|
|
77
80
|
## What problems does this solve?
|
|
78
81
|
|
|
79
82
|
- **One faithful parse.** Anything reading Claude Code transcripts re-implements the same JSONL quirks (str-or-list content, tool results nested two ways, envelope-less mode markers). This is that parser, written once and typed strictly.
|
|
80
|
-
- **Non-lossy by design.** The event model is a superset: sidechains, `<synthetic>` turns, thinking blocks, and unrecognized entry types all survive parsing. You decide what to drop, via `FilterConfig`.
|
|
83
|
+
- **Non-lossy by design.** The event model is a superset: sidechains, `<synthetic>` turns, thinking blocks, and unrecognized entry types all survive parsing. You decide what to drop, via composable filter specs (`build_spec`) or `FilterConfig`.
|
|
81
84
|
- **Incremental ingestion.** `FileStateStore` tracks per-file mtimes in SQLite (WAL, thread-safe) so re-runs only reparse changed files, and you compose your own writes in the same transaction.
|
|
82
85
|
- **Pluggable backends.** A Rust backend (PyO3 + rayon) is the default fast path, with a pure-Python reference parser behind the same `Backend` protocol as the fallback — both at full event parity.
|
|
83
86
|
|
|
@@ -32,21 +32,24 @@ for event in events:
|
|
|
32
32
|
print(f"assistant ({model}):", text[:80])
|
|
33
33
|
```
|
|
34
34
|
|
|
35
|
-
|
|
36
|
-
|
|
35
|
+
Compose a filter from small building blocks and apply it. The builders return clauses,
|
|
36
|
+
`build_spec` assembles them into a spec, and `apply_spec` yields the survivors:
|
|
37
37
|
|
|
38
38
|
```python
|
|
39
|
-
from cc_transcript import
|
|
39
|
+
from cc_transcript import apply_spec, build_spec, keep_only, drop_junk, drop_short
|
|
40
40
|
|
|
41
|
-
|
|
41
|
+
spec = build_spec(keep_only("user", "assistant"), drop_junk("structural"), drop_short(2))
|
|
42
|
+
clean = list(apply_spec(events, spec))
|
|
42
43
|
```
|
|
43
44
|
|
|
44
|
-
|
|
45
|
+
`NOISE_SPEC` is a ready-made spec for the universal structural noise (system reminders,
|
|
46
|
+
local-command output, skill banners). For flag-style filtering, `FilterConfig` is also
|
|
47
|
+
available — every rule is off by default, so a bare `FilterConfig()` passes everything through.
|
|
45
48
|
|
|
46
49
|
## What problems does this solve?
|
|
47
50
|
|
|
48
51
|
- **One faithful parse.** Anything reading Claude Code transcripts re-implements the same JSONL quirks (str-or-list content, tool results nested two ways, envelope-less mode markers). This is that parser, written once and typed strictly.
|
|
49
|
-
- **Non-lossy by design.** The event model is a superset: sidechains, `<synthetic>` turns, thinking blocks, and unrecognized entry types all survive parsing. You decide what to drop, via `FilterConfig`.
|
|
52
|
+
- **Non-lossy by design.** The event model is a superset: sidechains, `<synthetic>` turns, thinking blocks, and unrecognized entry types all survive parsing. You decide what to drop, via composable filter specs (`build_spec`) or `FilterConfig`.
|
|
50
53
|
- **Incremental ingestion.** `FileStateStore` tracks per-file mtimes in SQLite (WAL, thread-safe) so re-runs only reparse changed files, and you compose your own writes in the same transaction.
|
|
51
54
|
- **Pluggable backends.** A Rust backend (PyO3 + rayon) is the default fast path, with a pure-Python reference parser behind the same `Backend` protocol as the fallback — both at full event parity.
|
|
52
55
|
|