@lokascript/semantic 1.2.1 → 1.3.0
This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
- package/dist/languages/bn.d.ts +33 -0
- package/dist/languages/bn.js +1101 -0
- package/dist/languages/bn.js.map +1 -0
- package/dist/languages/es-MX.d.ts +23 -0
- package/dist/languages/es-MX.js +1676 -0
- package/dist/languages/es-MX.js.map +1 -0
- package/dist/languages/es.d.ts +3 -42
- package/dist/languages/he.d.ts +70 -0
- package/dist/languages/he.js +1331 -0
- package/dist/languages/he.js.map +1 -0
- package/dist/languages/hi.d.ts +36 -0
- package/dist/languages/hi.js +1162 -0
- package/dist/languages/hi.js.map +1 -0
- package/dist/languages/it.d.ts +53 -0
- package/dist/languages/it.js +1600 -0
- package/dist/languages/it.js.map +1 -0
- package/dist/languages/ms.d.ts +32 -0
- package/dist/languages/ms.js +1043 -0
- package/dist/languages/ms.js.map +1 -0
- package/dist/languages/pl.d.ts +37 -0
- package/dist/languages/pl.js +1331 -0
- package/dist/languages/pl.js.map +1 -0
- package/dist/languages/ru.d.ts +37 -0
- package/dist/languages/ru.js +1356 -0
- package/dist/languages/ru.js.map +1 -0
- package/dist/languages/th.d.ts +35 -0
- package/dist/languages/th.js +1076 -0
- package/dist/languages/th.js.map +1 -0
- package/dist/languages/tl.d.ts +32 -0
- package/dist/languages/tl.js +1034 -0
- package/dist/languages/tl.js.map +1 -0
- package/dist/languages/uk.d.ts +37 -0
- package/dist/languages/uk.js +1356 -0
- package/dist/languages/uk.js.map +1 -0
- package/dist/languages/vi.d.ts +59 -0
- package/dist/languages/vi.js +1220 -0
- package/dist/languages/vi.js.map +1 -0
- package/dist/spanish-BedpM-NU.d.ts +43 -0
- package/package.json +49 -1
|
@@ -0,0 +1,33 @@
|
|
|
1
|
+
import { B as BaseTokenizer, T as TokenStream, a as TokenKind, L as LanguageProfile } from '../types-BY3Id07j.js';
|
|
2
|
+
|
|
3
|
+
/**
|
|
4
|
+
* Bengali Tokenizer
|
|
5
|
+
*
|
|
6
|
+
* Tokenizes Bengali hyperscript input.
|
|
7
|
+
* Bengali is an agglutinative SOV language with:
|
|
8
|
+
* - Bengali script (U+0980-U+09FF)
|
|
9
|
+
* - Postposition markers (কে, তে, থেকে, etc.)
|
|
10
|
+
* - Similar grammatical structure to Hindi
|
|
11
|
+
* - CSS selectors are embedded ASCII
|
|
12
|
+
*/
|
|
13
|
+
|
|
14
|
+
declare class BengaliTokenizer extends BaseTokenizer {
|
|
15
|
+
readonly language = "bn";
|
|
16
|
+
readonly direction: "ltr";
|
|
17
|
+
constructor();
|
|
18
|
+
tokenize(input: string): TokenStream;
|
|
19
|
+
classifyToken(value: string): TokenKind;
|
|
20
|
+
private extractNumber;
|
|
21
|
+
}
|
|
22
|
+
declare const bengaliTokenizer: BengaliTokenizer;
|
|
23
|
+
|
|
24
|
+
/**
|
|
25
|
+
* Bengali Language Profile
|
|
26
|
+
*
|
|
27
|
+
* SOV word order, postpositions (কে, তে, থেকে, etc.), Bengali script.
|
|
28
|
+
* Agglutinative language similar to Hindi.
|
|
29
|
+
*/
|
|
30
|
+
|
|
31
|
+
declare const bengaliProfile: LanguageProfile;
|
|
32
|
+
|
|
33
|
+
export { bengaliProfile, bengaliTokenizer };
|