jpreprocess 0.1.0__tar.gz → 0.1.1__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/Cargo.lock +1 -1
- jpreprocess-0.1.1/PKG-INFO +81 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/bindings/python/Cargo.toml +1 -1
- jpreprocess-0.1.1/bindings/python/README.md +57 -0
- jpreprocess-0.1.0/PKG-INFO +0 -37
- jpreprocess-0.1.0/bindings/python/README.md +0 -13
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/Cargo.toml +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/bindings/python/.gitignore +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/bindings/python/jpreprocess/__init__.py +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/bindings/python/jpreprocess/dictionary.py +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/bindings/python/jpreprocess/jpreprocess.pyi +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/bindings/python/jpreprocess/py.typed +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/bindings/python/pytests/test_simple.py +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/bindings/python/src/binding.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/bindings/python/src/dictionary.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/bindings/python/src/lib.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/bindings/python/src/structs.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess/Cargo.toml +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess/README.md +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess/src/bin/dict_tools/dict_query.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess/src/bin/dict_tools/main.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess/src/bin/jpreprocess.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess/src/dictionary/kind.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess/src/dictionary/mod.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess/src/lib.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess/src/normalize_text.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess/tests/.gitignore +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess/tests/min-dict/char_def.bin +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess/tests/min-dict/dict.da +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess/tests/min-dict/dict.vals +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess/tests/min-dict/dict.words +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess/tests/min-dict/dict.wordsidx +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess/tests/min-dict/matrix.mtx +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess/tests/min-dict/unk.bin +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess/tests/open_jtalk.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess/tests/user_dictionary.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-core/Cargo.toml +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-core/README.md +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-core/src/accent_rule.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-core/src/cform.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-core/src/ctype/five.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-core/src/ctype/four.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-core/src/ctype/ka_irregular.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-core/src/ctype/keiyoushi.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-core/src/ctype/lower_two.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-core/src/ctype/mod.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-core/src/ctype/old.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-core/src/ctype/one.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-core/src/ctype/sa_irregular.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-core/src/ctype/special.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-core/src/ctype/upper_two.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-core/src/error.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-core/src/lib.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-core/src/pos/doushi.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-core/src/pos/fukushi.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-core/src/pos/joshi.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-core/src/pos/keiyoushi.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-core/src/pos/kigou.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-core/src/pos/meishi.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-core/src/pos/mod.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-core/src/pos/settoushi.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-core/src/pronunciation/mod.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-core/src/pronunciation/mora.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-core/src/pronunciation/mora_dict.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-core/src/pronunciation/mora_enum.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-core/src/pronunciation/phoneme.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-core/src/word_details.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-core/src/word_entry.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-dictionary/Cargo.toml +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-dictionary/README.md +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-dictionary/src/default.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-dictionary/src/lib.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-dictionary/src/serializer/jpreprocess/current.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-dictionary/src/serializer/jpreprocess/mod.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-dictionary/src/serializer/lindera.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-dictionary/src/serializer/mod.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-dictionary/src/store.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-dictionary-builder/Cargo.toml +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-dictionary-builder/NOTICE.txt +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-dictionary-builder/README.md +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-dictionary-builder/src/build_dict.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-dictionary-builder/src/ipadic_builder.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-dictionary-builder/src/lib.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-dictionary-builder/src/to_csv/da.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-dictionary-builder/src/to_csv/mod.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-jpcommon/Cargo.toml +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-jpcommon/README.md +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-jpcommon/src/feature/builder.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-jpcommon/src/feature/limit.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-jpcommon/src/feature/mod.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-jpcommon/src/label/accent_phrase.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-jpcommon/src/label/breath_group.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-jpcommon/src/label/mod.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-jpcommon/src/label/utterance.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-jpcommon/src/label/word.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-jpcommon/src/lib.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-jpcommon/src/word_attr/cform.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-jpcommon/src/word_attr/ctype.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-jpcommon/src/word_attr/mod.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-jpcommon/src/word_attr/pos.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-naist-jdic/Cargo.toml +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-naist-jdic/NOTICE.txt +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-naist-jdic/README.md +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-naist-jdic/build.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-naist-jdic/src/lib.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-naist-jdic/src/lindera.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-njd/Cargo.toml +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-njd/README.md +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-njd/src/lib.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-njd/src/njd_set/accent_phrase/mod.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-njd/src/njd_set/accent_type/mod.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-njd/src/njd_set/digit/digit_sequence/builder.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-njd/src/njd_set/digit/digit_sequence/mod.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-njd/src/njd_set/digit/digit_sequence/score.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-njd/src/njd_set/digit/lut/class1.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-njd/src/njd_set/digit/lut/class2.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-njd/src/njd_set/digit/lut/class3.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-njd/src/njd_set/digit/lut/mod.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-njd/src/njd_set/digit/lut/numeral.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-njd/src/njd_set/digit/lut/others.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-njd/src/njd_set/digit/mod.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-njd/src/njd_set/digit/symbols.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-njd/src/njd_set/long_vowel/mod.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-njd/src/njd_set/mod.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-njd/src/njd_set/pronunciation/mod.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-njd/src/njd_set/unvoiced_vowel/mod.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-njd/src/node.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-window/Cargo.toml +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-window/README.md +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-window/src/lib.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-window/src/structures.rs +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/jpreprocess/__init__.py +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/jpreprocess/dictionary.py +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/jpreprocess/jpreprocess.pyi +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/jpreprocess/py.typed +0 -0
- {jpreprocess-0.1.0 → jpreprocess-0.1.1}/pyproject.toml +0 -0
|
@@ -0,0 +1,81 @@
|
|
|
1
|
+
Metadata-Version: 2.1
|
|
2
|
+
Name: jpreprocess
|
|
3
|
+
Version: 0.1.1
|
|
4
|
+
Classifier: Programming Language :: Rust
|
|
5
|
+
Classifier: Programming Language :: Python :: Implementation :: CPython
|
|
6
|
+
Classifier: Programming Language :: Python :: Implementation :: PyPy
|
|
7
|
+
Classifier: License :: OSI Approved :: BSD License
|
|
8
|
+
Classifier: Topic :: Scientific/Engineering
|
|
9
|
+
Classifier: Topic :: Software Development
|
|
10
|
+
Classifier: Intended Audience :: Science/Research
|
|
11
|
+
Classifier: Intended Audience :: Developers
|
|
12
|
+
Requires-Dist: importlib_resources ; python_version < '3.9'
|
|
13
|
+
Requires-Dist: tqdm ; extra == 'progress'
|
|
14
|
+
Requires-Dist: pytest >=8.0.1 ; extra == 'dev'
|
|
15
|
+
Provides-Extra: progress
|
|
16
|
+
Provides-Extra: dev
|
|
17
|
+
Summary: Japanese text preprocessor for Text-to-Speech application (OpenJTalk rewrite in rust language).
|
|
18
|
+
Keywords: tts,openjtalk,library
|
|
19
|
+
License: BSD-3-Clause
|
|
20
|
+
Requires-Python: >=3.8, <=3.12
|
|
21
|
+
Description-Content-Type: text/markdown; charset=UTF-8; variant=GFM
|
|
22
|
+
Project-URL: Source Code, https://github.com/jpreprocess/jpreprocess
|
|
23
|
+
|
|
24
|
+
# jpreprocess (python binding)
|
|
25
|
+
|
|
26
|
+
Japanese text preprocessor for Text-to-Speech application.
|
|
27
|
+
|
|
28
|
+
This is a python binding of jpreprocess, which is written in Rust.
|
|
29
|
+
The Rust library is published on [crates.io](https://crates.io/crates/jpreprocess).
|
|
30
|
+
|
|
31
|
+
JPreprocess (the base code written in Rust) is a rewrite of [OpenJTalk](http://open-jtalk.sourceforge.net/).
|
|
32
|
+
|
|
33
|
+
## Usage
|
|
34
|
+
|
|
35
|
+
Unlike [pyopenjtalk](https://pypi.org/project/pyopenjtalk/), this package does not include support for marine or TTS.
|
|
36
|
+
|
|
37
|
+
Currently, this package is for text processing only.
|
|
38
|
+
|
|
39
|
+
### Run text processing frontend
|
|
40
|
+
|
|
41
|
+
```python
|
|
42
|
+
import jpreprocess
|
|
43
|
+
|
|
44
|
+
j = jpreprocess.jpreprocess()
|
|
45
|
+
njd_features = j.run_frontend("本日は晴天なり")
|
|
46
|
+
|
|
47
|
+
assert njd_features[0].get("string") == "本日"
|
|
48
|
+
assert njd_features[0].get("pos") == "名詞"
|
|
49
|
+
```
|
|
50
|
+
|
|
51
|
+
### Extract full-context label
|
|
52
|
+
|
|
53
|
+
```python
|
|
54
|
+
import jpreprocess
|
|
55
|
+
|
|
56
|
+
j = jpreprocess.jpreprocess()
|
|
57
|
+
fullcontext = j.extract_fullcontext("本日は晴天なり")
|
|
58
|
+
|
|
59
|
+
assert len(fullcontext) == 21
|
|
60
|
+
assert fullcontext[0] == r"xx^xx-sil+h=o/A:xx+xx+xx/B:xx-xx_xx/C:xx_xx+xx/D:xx+xx_xx/E:xx_xx!xx_xx-xx/F:xx_xx#xx_xx@xx_xx|xx_xx/G:5_1%0_xx_xx/H:xx_xx/I:xx-xx@xx+xx&xx-xx|xx+xx/J:2_11/K:1+2-11"
|
|
61
|
+
```
|
|
62
|
+
|
|
63
|
+
### Grapheme-to-phoneme (G2P)
|
|
64
|
+
|
|
65
|
+
```python
|
|
66
|
+
import jpreprocess
|
|
67
|
+
|
|
68
|
+
j = jpreprocess.jpreprocess()
|
|
69
|
+
|
|
70
|
+
assert j.g2p("おはようございます") == "o h a y o o g o z a i m a s U"
|
|
71
|
+
assert j.g2p("おはようございます", kana=True) == "オハヨーゴザイマス"
|
|
72
|
+
```
|
|
73
|
+
|
|
74
|
+
## Copyrights
|
|
75
|
+
|
|
76
|
+
Please see [README.md](https://github.com/jpreprocess/jpreprocess/blob/main/README.md).
|
|
77
|
+
|
|
78
|
+
## License
|
|
79
|
+
|
|
80
|
+
BSD-3-Clause
|
|
81
|
+
|
|
@@ -0,0 +1,57 @@
|
|
|
1
|
+
# jpreprocess (python binding)
|
|
2
|
+
|
|
3
|
+
Japanese text preprocessor for Text-to-Speech application.
|
|
4
|
+
|
|
5
|
+
This is a python binding of jpreprocess, which is written in Rust.
|
|
6
|
+
The Rust library is published on [crates.io](https://crates.io/crates/jpreprocess).
|
|
7
|
+
|
|
8
|
+
JPreprocess (the base code written in Rust) is a rewrite of [OpenJTalk](http://open-jtalk.sourceforge.net/).
|
|
9
|
+
|
|
10
|
+
## Usage
|
|
11
|
+
|
|
12
|
+
Unlike [pyopenjtalk](https://pypi.org/project/pyopenjtalk/), this package does not include support for marine or TTS.
|
|
13
|
+
|
|
14
|
+
Currently, this package is for text processing only.
|
|
15
|
+
|
|
16
|
+
### Run text processing frontend
|
|
17
|
+
|
|
18
|
+
```python
|
|
19
|
+
import jpreprocess
|
|
20
|
+
|
|
21
|
+
j = jpreprocess.jpreprocess()
|
|
22
|
+
njd_features = j.run_frontend("本日は晴天なり")
|
|
23
|
+
|
|
24
|
+
assert njd_features[0].get("string") == "本日"
|
|
25
|
+
assert njd_features[0].get("pos") == "名詞"
|
|
26
|
+
```
|
|
27
|
+
|
|
28
|
+
### Extract full-context label
|
|
29
|
+
|
|
30
|
+
```python
|
|
31
|
+
import jpreprocess
|
|
32
|
+
|
|
33
|
+
j = jpreprocess.jpreprocess()
|
|
34
|
+
fullcontext = j.extract_fullcontext("本日は晴天なり")
|
|
35
|
+
|
|
36
|
+
assert len(fullcontext) == 21
|
|
37
|
+
assert fullcontext[0] == r"xx^xx-sil+h=o/A:xx+xx+xx/B:xx-xx_xx/C:xx_xx+xx/D:xx+xx_xx/E:xx_xx!xx_xx-xx/F:xx_xx#xx_xx@xx_xx|xx_xx/G:5_1%0_xx_xx/H:xx_xx/I:xx-xx@xx+xx&xx-xx|xx+xx/J:2_11/K:1+2-11"
|
|
38
|
+
```
|
|
39
|
+
|
|
40
|
+
### Grapheme-to-phoneme (G2P)
|
|
41
|
+
|
|
42
|
+
```python
|
|
43
|
+
import jpreprocess
|
|
44
|
+
|
|
45
|
+
j = jpreprocess.jpreprocess()
|
|
46
|
+
|
|
47
|
+
assert j.g2p("おはようございます") == "o h a y o o g o z a i m a s U"
|
|
48
|
+
assert j.g2p("おはようございます", kana=True) == "オハヨーゴザイマス"
|
|
49
|
+
```
|
|
50
|
+
|
|
51
|
+
## Copyrights
|
|
52
|
+
|
|
53
|
+
Please see [README.md](https://github.com/jpreprocess/jpreprocess/blob/main/README.md).
|
|
54
|
+
|
|
55
|
+
## License
|
|
56
|
+
|
|
57
|
+
BSD-3-Clause
|
jpreprocess-0.1.0/PKG-INFO
DELETED
|
@@ -1,37 +0,0 @@
|
|
|
1
|
-
Metadata-Version: 2.1
|
|
2
|
-
Name: jpreprocess
|
|
3
|
-
Version: 0.1.0
|
|
4
|
-
Classifier: Programming Language :: Rust
|
|
5
|
-
Classifier: Programming Language :: Python :: Implementation :: CPython
|
|
6
|
-
Classifier: Programming Language :: Python :: Implementation :: PyPy
|
|
7
|
-
Classifier: License :: OSI Approved :: BSD License
|
|
8
|
-
Classifier: Topic :: Scientific/Engineering
|
|
9
|
-
Classifier: Topic :: Software Development
|
|
10
|
-
Classifier: Intended Audience :: Science/Research
|
|
11
|
-
Classifier: Intended Audience :: Developers
|
|
12
|
-
Requires-Dist: importlib_resources ; python_version < '3.9'
|
|
13
|
-
Requires-Dist: tqdm ; extra == 'progress'
|
|
14
|
-
Requires-Dist: pytest >=8.0.1 ; extra == 'dev'
|
|
15
|
-
Provides-Extra: progress
|
|
16
|
-
Provides-Extra: dev
|
|
17
|
-
Summary: Japanese text preprocessor for Text-to-Speech application (OpenJTalk rewrite in rust language).
|
|
18
|
-
Keywords: tts,openjtalk,library
|
|
19
|
-
License: BSD-3-Clause
|
|
20
|
-
Requires-Python: >=3.8, <=3.12
|
|
21
|
-
Description-Content-Type: text/markdown; charset=UTF-8; variant=GFM
|
|
22
|
-
Project-URL: Source Code, https://github.com/jpreprocess/jpreprocess
|
|
23
|
-
|
|
24
|
-
# python binding
|
|
25
|
-
|
|
26
|
-
## Example
|
|
27
|
-
|
|
28
|
-
```python
|
|
29
|
-
import jpreprocess
|
|
30
|
-
|
|
31
|
-
j=jpreprocess.jpreprocess()
|
|
32
|
-
njd_features=j.run_frontend("本日は晴天なり")
|
|
33
|
-
|
|
34
|
-
assert njd_features[0].get("string") == "本日"
|
|
35
|
-
assert njd_features[0].get("pos") == "名詞"
|
|
36
|
-
```
|
|
37
|
-
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-core/src/pronunciation/mora_dict.rs
RENAMED
|
File without changes
|
{jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-core/src/pronunciation/mora_enum.rs
RENAMED
|
File without changes
|
{jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-core/src/pronunciation/phoneme.rs
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-dictionary/src/serializer/lindera.rs
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-dictionary-builder/src/build_dict.rs
RENAMED
|
File without changes
|
{jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-dictionary-builder/src/ipadic_builder.rs
RENAMED
|
File without changes
|
|
File without changes
|
{jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-dictionary-builder/src/to_csv/da.rs
RENAMED
|
File without changes
|
{jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-dictionary-builder/src/to_csv/mod.rs
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-jpcommon/src/label/accent_phrase.rs
RENAMED
|
File without changes
|
{jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-jpcommon/src/label/breath_group.rs
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-njd/src/njd_set/accent_phrase/mod.rs
RENAMED
|
File without changes
|
{jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-njd/src/njd_set/accent_type/mod.rs
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-njd/src/njd_set/digit/lut/class1.rs
RENAMED
|
File without changes
|
{jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-njd/src/njd_set/digit/lut/class2.rs
RENAMED
|
File without changes
|
{jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-njd/src/njd_set/digit/lut/class3.rs
RENAMED
|
File without changes
|
|
File without changes
|
{jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-njd/src/njd_set/digit/lut/numeral.rs
RENAMED
|
File without changes
|
{jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-njd/src/njd_set/digit/lut/others.rs
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
{jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-njd/src/njd_set/long_vowel/mod.rs
RENAMED
|
File without changes
|
|
File without changes
|
{jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-njd/src/njd_set/pronunciation/mod.rs
RENAMED
|
File without changes
|
{jpreprocess-0.1.0 → jpreprocess-0.1.1}/crates/jpreprocess-njd/src/njd_set/unvoiced_vowel/mod.rs
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|