dwani 0.1.5__py3-none-any.whl → 0.1.7__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- dwani/__init__.py +27 -1
- dwani/asr.py +36 -3
- dwani/chat.py +41 -3
- dwani/client.py +27 -19
- dwani/docs.py +150 -23
- dwani/translate.py +42 -8
- dwani/vision.py +41 -3
- {dwani-0.1.5.dist-info → dwani-0.1.7.dist-info}/METADATA +31 -8
- dwani-0.1.7.dist-info/RECORD +14 -0
- {dwani-0.1.5.dist-info → dwani-0.1.7.dist-info}/WHEEL +1 -1
- dwani-0.1.5.dist-info/RECORD +0 -14
- {dwani-0.1.5.dist-info → dwani-0.1.7.dist-info}/licenses/LICENSE +0 -0
- {dwani-0.1.5.dist-info → dwani-0.1.7.dist-info}/top_level.txt +0 -0
dwani/__init__.py
CHANGED
@@ -3,9 +3,11 @@ from .chat import Chat
|
|
3
3
|
from .audio import Audio
|
4
4
|
from .vision import Vision
|
5
5
|
from .asr import ASR
|
6
|
+
from .translate import Translate
|
6
7
|
from .exceptions import DhwaniAPIError
|
8
|
+
from .docs import Documents
|
7
9
|
|
8
|
-
__all__ = ["DhwaniClient", "Chat", "Audio", "Vision", "ASR", "DhwaniAPIError"]
|
10
|
+
__all__ = ["DhwaniClient", "Chat", "Audio", "Vision", "ASR", "DhwaniAPIError", "Translate", "Documents"]
|
9
11
|
|
10
12
|
# Optionally, instantiate a default client for convenience
|
11
13
|
api_key = None
|
@@ -37,3 +39,27 @@ class asr:
|
|
37
39
|
@staticmethod
|
38
40
|
def transcribe(*args, **kwargs):
|
39
41
|
return _get_client().transcribe(*args, **kwargs)
|
42
|
+
|
43
|
+
|
44
|
+
class translate:
|
45
|
+
@staticmethod
|
46
|
+
def run_translate(*args, **kwargs):
|
47
|
+
return _get_client().translate(*args, **kwargs)
|
48
|
+
|
49
|
+
|
50
|
+
class document:
|
51
|
+
@staticmethod
|
52
|
+
def run_ocr(*args, **kwargs):
|
53
|
+
return _get_client().ocr(*args, **kwargs)
|
54
|
+
@staticmethod
|
55
|
+
def run_summarize(*args, **kwargs):
|
56
|
+
return _get_client().summarize(*args, **kwargs)
|
57
|
+
@staticmethod
|
58
|
+
def run_extract(*args, **kwargs):
|
59
|
+
return _get_client().extract(*args, **kwargs)
|
60
|
+
@staticmethod
|
61
|
+
def run_doc_query(*args, **kwargs):
|
62
|
+
return _get_client().doc_query(*args, **kwargs)
|
63
|
+
@staticmethod
|
64
|
+
def run_doc_query_kannada(*args, **kwargs):
|
65
|
+
return _get_client().doc_query_kannada(*args, **kwargs)
|
dwani/asr.py
CHANGED
@@ -1,10 +1,44 @@
|
|
1
1
|
from .exceptions import DhwaniAPIError
|
2
2
|
import requests
|
3
|
+
|
4
|
+
# Allowed languages, stored in canonical display casing; input is matched case-insensitively
|
5
|
+
ALLOWED_LANGUAGES = [
|
6
|
+
"Assamese",
|
7
|
+
"Bengali",
|
8
|
+
"Gujarati",
|
9
|
+
"Hindi",
|
10
|
+
"Kannada",
|
11
|
+
"Malayalam",
|
12
|
+
"Marathi",
|
13
|
+
"Odia",
|
14
|
+
"Punjabi",
|
15
|
+
"Tamil",
|
16
|
+
"Telugu"
|
17
|
+
]
|
18
|
+
|
19
|
+
def validate_language(language):
|
20
|
+
"""Validate that the provided language is in the allowed list (case-insensitive)."""
|
21
|
+
# Create a case-insensitive mapping of allowed languages
|
22
|
+
language_map = {lang.lower(): lang for lang in ALLOWED_LANGUAGES}
|
23
|
+
# Check if the lowercase version of the input language is in the map
|
24
|
+
if language.lower() not in language_map:
|
25
|
+
raise ValueError(
|
26
|
+
f"Unsupported language: {language}. Supported languages: {ALLOWED_LANGUAGES}"
|
27
|
+
)
|
28
|
+
# Return the original case from ALLOWED_LANGUAGES for consistency
|
29
|
+
return language_map[language.lower()]
|
30
|
+
|
3
31
|
def asr_transcribe(client, file_path, language):
|
32
|
+
# Validate the language input (case-insensitive)
|
33
|
+
validated_language = validate_language(language)
|
34
|
+
|
35
|
+
# Convert language to lowercase for the API request
|
36
|
+
api_language = validated_language.lower()
|
37
|
+
|
4
38
|
with open(file_path, "rb") as f:
|
5
39
|
files = {"file": f}
|
6
40
|
resp = requests.post(
|
7
|
-
f"{client.api_base}/v1/transcribe/?language={
|
41
|
+
f"{client.api_base}/v1/transcribe/?language={api_language}",
|
8
42
|
headers=client._headers(),
|
9
43
|
files=files
|
10
44
|
)
|
@@ -16,5 +50,4 @@ class ASR:
|
|
16
50
|
@staticmethod
|
17
51
|
def transcribe(*args, **kwargs):
|
18
52
|
from . import _get_client
|
19
|
-
return _get_client().transcribe(*args, **kwargs)
|
20
|
-
|
53
|
+
return _get_client().transcribe(*args, **kwargs)
|
dwani/chat.py
CHANGED
@@ -1,12 +1,50 @@
|
|
1
1
|
from .exceptions import DhwaniAPIError
|
2
2
|
import requests
|
3
3
|
|
4
|
+
# Language options mapping
|
5
|
+
language_options = [
|
6
|
+
("English", "eng_Latn"),
|
7
|
+
("Kannada", "kan_Knda"),
|
8
|
+
("Hindi", "hin_Deva"),
|
9
|
+
("Assamese", "asm_Beng"),
|
10
|
+
("Bengali","ben_Beng"),
|
11
|
+
("Gujarati","guj_Gujr"),
|
12
|
+
("Malayalam","mal_Mlym"),
|
13
|
+
("Marathi","mar_Deva"),
|
14
|
+
("Odia","ory_Orya"),
|
15
|
+
("Punjabi","pan_Guru"),
|
16
|
+
("Tamil","tam_Taml"),
|
17
|
+
("Telugu","tel_Telu")
|
18
|
+
]
|
19
|
+
|
20
|
+
# Create a dictionary for language name to code mapping
|
21
|
+
lang_name_to_code = {name.lower(): code for name, code in language_options}
|
22
|
+
lang_code_to_code = {code: code for _, code in language_options}
|
23
|
+
|
24
|
+
def normalize_language(lang):
|
25
|
+
"""Convert language input (name or code) to language code."""
|
26
|
+
lang = lang.strip()
|
27
|
+
# Check if input is a language name (case-insensitive)
|
28
|
+
lang_lower = lang.lower()
|
29
|
+
if lang_lower in lang_name_to_code:
|
30
|
+
return lang_name_to_code[lang_lower]
|
31
|
+
# Check if input is a language code
|
32
|
+
if lang in lang_code_to_code:
|
33
|
+
return lang_code_to_code[lang]
|
34
|
+
# Raise error if language is not supported
|
35
|
+
supported_langs = list(lang_name_to_code.keys()) + list(lang_code_to_code.keys())
|
36
|
+
raise ValueError(f"Unsupported language: {lang}. Supported languages: {supported_langs}")
|
37
|
+
|
4
38
|
def chat_create(client, prompt, src_lang, tgt_lang, **kwargs):
|
39
|
+
# Normalize source and target languages
|
40
|
+
src_lang_code = normalize_language(src_lang)
|
41
|
+
tgt_lang_code = normalize_language(tgt_lang)
|
42
|
+
|
5
43
|
url = f"{client.api_base}/v1/indic_chat"
|
6
44
|
payload = {
|
7
45
|
"prompt": prompt,
|
8
|
-
"src_lang":
|
9
|
-
"tgt_lang":
|
46
|
+
"src_lang": src_lang_code,
|
47
|
+
"tgt_lang": tgt_lang_code
|
10
48
|
}
|
11
49
|
payload.update(kwargs)
|
12
50
|
resp = requests.post(
|
@@ -22,4 +60,4 @@ class Chat:
|
|
22
60
|
@staticmethod
|
23
61
|
def create(prompt, src_lang, tgt_lang, **kwargs):
|
24
62
|
from . import _get_client
|
25
|
-
return _get_client().chat(prompt, src_lang, tgt_lang, **kwargs)
|
63
|
+
return _get_client().chat(prompt, src_lang, tgt_lang, **kwargs)
|
dwani/client.py
CHANGED
@@ -12,35 +12,43 @@ class DhwaniClient:
|
|
12
12
|
def _headers(self):
|
13
13
|
return {"X-API-Key": self.api_key}
|
14
14
|
|
15
|
-
def chat(self, prompt, src_lang, tgt_lang, **kwargs):
|
16
|
-
from .chat import chat_create
|
17
|
-
return chat_create(self, prompt, src_lang, tgt_lang, **kwargs)
|
18
|
-
|
19
15
|
def translate(self, sentences, src_lang, tgt_lang, **kwargs):
|
20
16
|
from .translate import run_translate
|
21
|
-
return run_translate(self, sentences=sentences,src_lang=
|
17
|
+
return run_translate(self, sentences=sentences, src_lang=src_lang, tgt_lang=tgt_lang, **kwargs)
|
22
18
|
|
23
|
-
def
|
19
|
+
def chat(self, prompt, src_lang, tgt_lang, **kwargs):
|
20
|
+
from .chat import chat_create
|
21
|
+
return chat_create(self, prompt=prompt, src_lang=src_lang, tgt_lang=tgt_lang, **kwargs)
|
22
|
+
|
23
|
+
def speech(self, input, response_format="mp3", **kwargs):
|
24
24
|
from .audio import audio_speech
|
25
|
-
return audio_speech(self,
|
25
|
+
return audio_speech(self, input=input, response_format=response_format, **kwargs)
|
26
26
|
|
27
|
-
def caption(self, file_path, query="describe the image", src_lang="eng_Latn", tgt_lang="kan_Knda"):
|
27
|
+
def caption(self, file_path, query="describe the image", src_lang="eng_Latn", tgt_lang="kan_Knda", **kwargs):
|
28
28
|
from .vision import vision_caption
|
29
|
-
return vision_caption(self, file_path, query, src_lang, tgt_lang)
|
29
|
+
return vision_caption(self, file_path=file_path, query=query, src_lang=src_lang, tgt_lang=tgt_lang, **kwargs)
|
30
30
|
|
31
|
-
def transcribe(self,
|
31
|
+
def transcribe(self, file_path, language=None, **kwargs):
|
32
32
|
from .asr import asr_transcribe
|
33
|
-
return asr_transcribe(self,
|
33
|
+
return asr_transcribe(self, file_path=file_path, language=language, **kwargs)
|
34
34
|
|
35
|
-
def document_ocr(self, file_path, language=None):
|
35
|
+
def document_ocr(self, file_path, language=None, **kwargs):
|
36
36
|
from .docs import document_ocr
|
37
|
-
return document_ocr(self, file_path, language)
|
38
|
-
|
39
|
-
def document_translate(self, file_path, src_lang, tgt_lang):
|
40
|
-
from .docs import document_translate
|
41
|
-
return document_translate(self, file_path, src_lang, tgt_lang)
|
37
|
+
return document_ocr(self, file_path=file_path, language=language, **kwargs)
|
42
38
|
|
43
|
-
def document_summarize(self, file_path,
|
39
|
+
def document_summarize(self, file_path, page_number=1, src_lang="eng_Latn", tgt_lang="kan_Knda", **kwargs):
|
44
40
|
from .docs import document_summarize
|
45
|
-
return document_summarize(self, file_path,
|
41
|
+
return document_summarize(self, file_path, page_number, src_lang, tgt_lang, **kwargs)
|
42
|
+
|
43
|
+
def extract(self, file_path, page_number=1, src_lang="eng_Latn", tgt_lang="kan_Knda", **kwargs):
|
44
|
+
from .docs import extract
|
45
|
+
return extract(self, file_path=file_path, page_number=page_number, src_lang=src_lang,tgt_lang=tgt_lang, **kwargs)
|
46
|
+
|
47
|
+
|
48
|
+
def doc_query( self, file_path, page_number=1, prompt="list the key points", src_lang="eng_Latn", tgt_lang="kan_Knda" , **kwargs ):
|
49
|
+
from .docs import doc_query
|
50
|
+
return doc_query( self, file_path, page_number=page_number, prompt=prompt, src_lang=src_lang, tgt_lang=tgt_lang , **kwargs )
|
46
51
|
|
52
|
+
def doc_query_kannada(self, file_path, page_number=1, prompt="list key points", src_lang="eng_Latn", language=None, **kwargs):
|
53
|
+
from .docs import doc_query_kannada
|
54
|
+
return doc_query_kannada(self, file_path=file_path, page_number=page_number, prompt=prompt, src_lang=src_lang, language=language, **kwargs)
|
dwani/docs.py
CHANGED
@@ -1,13 +1,49 @@
|
|
1
1
|
import requests
|
2
2
|
from .exceptions import DhwaniAPIError
|
3
3
|
|
4
|
+
# Language options mapping
|
5
|
+
language_options = [
|
6
|
+
("English", "eng_Latn"),
|
7
|
+
("Kannada", "kan_Knda"),
|
8
|
+
("Hindi", "hin_Deva"),
|
9
|
+
("Assamese", "asm_Beng"),
|
10
|
+
("Bengali", "ben_Beng"),
|
11
|
+
("Gujarati", "guj_Gujr"),
|
12
|
+
("Malayalam", "mal_Mlym"),
|
13
|
+
("Marathi", "mar_Deva"),
|
14
|
+
("Odia", "ory_Orya"),
|
15
|
+
("Punjabi", "pan_Guru"),
|
16
|
+
("Tamil", "tam_Taml"),
|
17
|
+
("Telugu", "tel_Telu")
|
18
|
+
]
|
19
|
+
|
20
|
+
# Create dictionaries for language name to code and code to code mapping
|
21
|
+
lang_name_to_code = {name.lower(): code for name, code in language_options}
|
22
|
+
lang_code_to_code = {code: code for _, code in language_options}
|
23
|
+
|
24
|
+
def normalize_language(lang):
|
25
|
+
"""Convert language input (name or code) to language code."""
|
26
|
+
lang = lang.strip()
|
27
|
+
# Check if input is a language name (case-insensitive)
|
28
|
+
lang_lower = lang.lower()
|
29
|
+
if lang_lower in lang_name_to_code:
|
30
|
+
return lang_name_to_code[lang_lower]
|
31
|
+
# Check if input is a language code
|
32
|
+
if lang in lang_code_to_code:
|
33
|
+
return lang_code_to_code[lang]
|
34
|
+
# Raise error if language is not supported
|
35
|
+
supported_langs = list(lang_name_to_code.keys()) + list(lang_code_to_code.keys())
|
36
|
+
raise ValueError(f"Unsupported language: {lang}. Supported languages: {supported_langs}")
|
37
|
+
|
4
38
|
def document_ocr(client, file_path, language=None):
|
5
39
|
"""OCR a document (image/PDF) and return extracted text."""
|
40
|
+
data = {}
|
41
|
+
if language:
|
42
|
+
# Normalize the language input
|
43
|
+
data["language"] = normalize_language(language)
|
44
|
+
|
6
45
|
with open(file_path, "rb") as f:
|
7
46
|
files = {"file": f}
|
8
|
-
data = {}
|
9
|
-
if language:
|
10
|
-
data["language"] = language
|
11
47
|
resp = requests.post(
|
12
48
|
f"{client.api_base}/v1/document/ocr",
|
13
49
|
headers=client._headers(),
|
@@ -18,17 +54,24 @@ def document_ocr(client, file_path, language=None):
|
|
18
54
|
raise DhwaniAPIError(resp)
|
19
55
|
return resp.json()
|
20
56
|
|
21
|
-
def
|
22
|
-
"""
|
57
|
+
def document_summarize(client, file_path, page_number=1, src_lang="eng_Latn", tgt_lang="kan_Knda"):
|
58
|
+
"""Summarize a PDF document with language and page number options."""
|
59
|
+
# Normalize source and target languages
|
60
|
+
src_lang_code = normalize_language(src_lang)
|
61
|
+
tgt_lang_code = normalize_language(tgt_lang)
|
62
|
+
|
63
|
+
url = f"{client.api_base}/v1/indic-summarize-pdf"
|
64
|
+
headers = client._headers()
|
23
65
|
with open(file_path, "rb") as f:
|
24
|
-
files = {"file": f}
|
66
|
+
files = {"file": (file_path, f, "application/pdf")}
|
25
67
|
data = {
|
26
|
-
"
|
27
|
-
"
|
68
|
+
"page_number": str(page_number),
|
69
|
+
"src_lang": src_lang_code,
|
70
|
+
"tgt_lang": tgt_lang_code
|
28
71
|
}
|
29
72
|
resp = requests.post(
|
30
|
-
|
31
|
-
headers=
|
73
|
+
url,
|
74
|
+
headers=headers,
|
32
75
|
files=files,
|
33
76
|
data=data
|
34
77
|
)
|
@@ -36,16 +79,90 @@ def document_translate(client, file_path, src_lang, tgt_lang):
|
|
36
79
|
raise DhwaniAPIError(resp)
|
37
80
|
return resp.json()
|
38
81
|
|
39
|
-
def
|
40
|
-
"""
|
82
|
+
def extract(client, file_path, page_number, src_lang, tgt_lang):
|
83
|
+
"""
|
84
|
+
Extract and translate text from a document (image/PDF) using query parameters.
|
85
|
+
"""
|
86
|
+
# Normalize source and target languages
|
87
|
+
src_lang_code = normalize_language(src_lang)
|
88
|
+
tgt_lang_code = normalize_language(tgt_lang)
|
89
|
+
|
90
|
+
# Build the URL with query parameters
|
91
|
+
url = (
|
92
|
+
f"{client.api_base}/v1/indic-extract-text/"
|
93
|
+
f"?page_number={page_number}&src_lang={src_lang_code}&tgt_lang={tgt_lang_code}"
|
94
|
+
)
|
95
|
+
headers = client._headers()
|
41
96
|
with open(file_path, "rb") as f:
|
42
|
-
files = {"file": f}
|
43
|
-
data = {}
|
44
|
-
if language:
|
45
|
-
data["language"] = language
|
97
|
+
files = {"file": (file_path, f, "application/pdf")}
|
46
98
|
resp = requests.post(
|
47
|
-
|
48
|
-
headers=
|
99
|
+
url,
|
100
|
+
headers=headers,
|
101
|
+
files=files
|
102
|
+
)
|
103
|
+
if resp.status_code != 200:
|
104
|
+
raise DhwaniAPIError(resp)
|
105
|
+
return resp.json()
|
106
|
+
|
107
|
+
def doc_query(
|
108
|
+
client,
|
109
|
+
file_path,
|
110
|
+
page_number=1,
|
111
|
+
prompt="list the key points",
|
112
|
+
src_lang="eng_Latn",
|
113
|
+
tgt_lang="kan_Knda"
|
114
|
+
):
|
115
|
+
"""Query a document with a custom prompt and language options."""
|
116
|
+
# Normalize source and target languages
|
117
|
+
src_lang_code = normalize_language(src_lang)
|
118
|
+
tgt_lang_code = normalize_language(tgt_lang)
|
119
|
+
|
120
|
+
url = f"{client.api_base}/v1/indic-custom-prompt-pdf"
|
121
|
+
headers = client._headers()
|
122
|
+
with open(file_path, "rb") as f:
|
123
|
+
files = {"file": (file_path, f, "application/pdf")}
|
124
|
+
data = {
|
125
|
+
"page_number": str(page_number),
|
126
|
+
"prompt": prompt,
|
127
|
+
"source_language": src_lang_code,
|
128
|
+
"target_language": tgt_lang_code
|
129
|
+
}
|
130
|
+
resp = requests.post(
|
131
|
+
url,
|
132
|
+
headers=headers,
|
133
|
+
files=files,
|
134
|
+
data=data
|
135
|
+
)
|
136
|
+
if resp.status_code != 200:
|
137
|
+
raise DhwaniAPIError(resp)
|
138
|
+
return resp.json()
|
139
|
+
|
140
|
+
def doc_query_kannada(
|
141
|
+
client,
|
142
|
+
file_path,
|
143
|
+
page_number=1,
|
144
|
+
prompt="list key points",
|
145
|
+
src_lang="eng_Latn",
|
146
|
+
language=None
|
147
|
+
):
|
148
|
+
"""Summarize a document (image/PDF/text) with custom prompt and language."""
|
149
|
+
# Normalize source language and optional language parameter
|
150
|
+
src_lang_code = normalize_language(src_lang)
|
151
|
+
data = {
|
152
|
+
"page_number": str(page_number),
|
153
|
+
"prompt": prompt,
|
154
|
+
"src_lang": src_lang_code,
|
155
|
+
}
|
156
|
+
if language:
|
157
|
+
data["language"] = normalize_language(language)
|
158
|
+
|
159
|
+
url = f"{client.api_base}/v1/indic-custom-prompt-kannada-pdf"
|
160
|
+
headers = client._headers()
|
161
|
+
with open(file_path, "rb") as f:
|
162
|
+
files = {"file": (file_path, f, "application/pdf")}
|
163
|
+
resp = requests.post(
|
164
|
+
url,
|
165
|
+
headers=headers,
|
49
166
|
files=files,
|
50
167
|
data=data
|
51
168
|
)
|
@@ -60,11 +177,21 @@ class Documents:
|
|
60
177
|
return _get_client().document_ocr(file_path, language)
|
61
178
|
|
62
179
|
@staticmethod
|
63
|
-
def
|
180
|
+
def summarize(*args, **kwargs):
|
64
181
|
from . import _get_client
|
65
|
-
return _get_client().
|
66
|
-
|
182
|
+
return _get_client().document_summarize(*args, **kwargs)
|
183
|
+
|
184
|
+
@staticmethod
|
185
|
+
def run_extract(*args, **kwargs):
|
186
|
+
from . import _get_client
|
187
|
+
return _get_client().extract(*args, **kwargs)
|
188
|
+
|
189
|
+
@staticmethod
|
190
|
+
def run_doc_query(*args, **kwargs):
|
191
|
+
from . import _get_client
|
192
|
+
return _get_client().doc_query(*args, **kwargs)
|
193
|
+
|
67
194
|
@staticmethod
|
68
|
-
def
|
195
|
+
def run_doc_query_kannada(*args, **kwargs):
|
69
196
|
from . import _get_client
|
70
|
-
return _get_client().
|
197
|
+
return _get_client().doc_query_kannada(*args, **kwargs)
|
dwani/translate.py
CHANGED
@@ -1,12 +1,50 @@
|
|
1
1
|
from .exceptions import DhwaniAPIError
|
2
2
|
import requests
|
3
3
|
|
4
|
+
# Language options mapping
|
5
|
+
language_options = [
|
6
|
+
("English", "eng_Latn"),
|
7
|
+
("Kannada", "kan_Knda"),
|
8
|
+
("Hindi", "hin_Deva"),
|
9
|
+
("Assamese", "asm_Beng"),
|
10
|
+
("Bengali", "ben_Beng"),
|
11
|
+
("Gujarati", "guj_Gujr"),
|
12
|
+
("Malayalam", "mal_Mlym"),
|
13
|
+
("Marathi", "mar_Deva"),
|
14
|
+
("Odia", "ory_Orya"),
|
15
|
+
("Punjabi", "pan_Guru"),
|
16
|
+
("Tamil", "tam_Taml"),
|
17
|
+
("Telugu", "tel_Telu")
|
18
|
+
]
|
19
|
+
|
20
|
+
# Create dictionaries for language name to code and code to code mapping
|
21
|
+
lang_name_to_code = {name.lower(): code for name, code in language_options}
|
22
|
+
lang_code_to_code = {code: code for _, code in language_options}
|
23
|
+
|
24
|
+
def normalize_language(lang):
|
25
|
+
"""Convert language input (name or code) to language code."""
|
26
|
+
lang = lang.strip()
|
27
|
+
# Check if input is a language name (case-insensitive)
|
28
|
+
lang_lower = lang.lower()
|
29
|
+
if lang_lower in lang_name_to_code:
|
30
|
+
return lang_name_to_code[lang_lower]
|
31
|
+
# Check if input is a language code
|
32
|
+
if lang in lang_code_to_code:
|
33
|
+
return lang_code_to_code[lang]
|
34
|
+
# Raise error if language is not supported
|
35
|
+
supported_langs = list(lang_name_to_code.keys()) + list(lang_code_to_code.keys())
|
36
|
+
raise ValueError(f"Unsupported language: {lang}. Supported languages: {supported_langs}")
|
37
|
+
|
4
38
|
def run_translate(client, sentences, src_lang, tgt_lang, **kwargs):
|
39
|
+
# Normalize source and target languages
|
40
|
+
src_lang_code = normalize_language(src_lang)
|
41
|
+
tgt_lang_code = normalize_language(tgt_lang)
|
42
|
+
|
5
43
|
url = f"{client.api_base}/v1/translate"
|
6
44
|
payload = {
|
7
45
|
"sentences": sentences,
|
8
|
-
"src_lang":
|
9
|
-
"tgt_lang":
|
46
|
+
"src_lang": src_lang_code,
|
47
|
+
"tgt_lang": tgt_lang_code
|
10
48
|
}
|
11
49
|
payload.update(kwargs)
|
12
50
|
resp = requests.post(
|
@@ -20,10 +58,6 @@ def run_translate(client, sentences, src_lang, tgt_lang, **kwargs):
|
|
20
58
|
|
21
59
|
class Translate:
|
22
60
|
@staticmethod
|
23
|
-
def
|
61
|
+
def run_translate(sentences, src_lang, tgt_lang, **kwargs):
|
24
62
|
from . import _get_client
|
25
|
-
|
26
|
-
# Ensure sentences is always a list
|
27
|
-
response = run_translate(client, [sentence], src_lang, tgt_lang, **kwargs)
|
28
|
-
# Return the first translation, or None if not found
|
29
|
-
return response.get("translations", [None])[0]
|
63
|
+
return _get_client().translate(sentences, src_lang, tgt_lang, **kwargs)
|
dwani/vision.py
CHANGED
@@ -1,15 +1,53 @@
|
|
1
1
|
from .exceptions import DhwaniAPIError
|
2
2
|
import requests
|
3
|
+
|
4
|
+
# Language options mapping
|
5
|
+
language_options = [
|
6
|
+
("English", "eng_Latn"),
|
7
|
+
("Kannada", "kan_Knda"),
|
8
|
+
("Hindi", "hin_Deva"),
|
9
|
+
("Assamese", "asm_Beng"),
|
10
|
+
("Bengali", "ben_Beng"),
|
11
|
+
("Gujarati", "guj_Gujr"),
|
12
|
+
("Malayalam", "mal_Mlym"),
|
13
|
+
("Marathi", "mar_Deva"),
|
14
|
+
("Odia", "ory_Orya"),
|
15
|
+
("Punjabi", "pan_Guru"),
|
16
|
+
("Tamil", "tam_Taml"),
|
17
|
+
("Telugu", "tel_Telu")
|
18
|
+
]
|
19
|
+
|
20
|
+
# Create dictionaries for language name to code and code to code mapping
|
21
|
+
lang_name_to_code = {name.lower(): code for name, code in language_options}
|
22
|
+
lang_code_to_code = {code: code for _, code in language_options}
|
23
|
+
|
24
|
+
def normalize_language(lang):
|
25
|
+
"""Convert language input (name or code) to language code."""
|
26
|
+
lang = lang.strip()
|
27
|
+
# Check if input is a language name (case-insensitive)
|
28
|
+
lang_lower = lang.lower()
|
29
|
+
if lang_lower in lang_name_to_code:
|
30
|
+
return lang_name_to_code[lang_lower]
|
31
|
+
# Check if input is a language code
|
32
|
+
if lang in lang_code_to_code:
|
33
|
+
return lang_code_to_code[lang]
|
34
|
+
# Raise error if language is not supported
|
35
|
+
supported_langs = list(lang_name_to_code.keys()) + list(lang_code_to_code.keys())
|
36
|
+
raise ValueError(f"Unsupported language: {lang}. Supported languages: {supported_langs}")
|
37
|
+
|
3
38
|
def vision_caption(client, file_path, query="describe the image", src_lang="eng_Latn", tgt_lang="kan_Knda"):
|
39
|
+
# Normalize source and target languages
|
40
|
+
src_lang_code = normalize_language(src_lang)
|
41
|
+
tgt_lang_code = normalize_language(tgt_lang)
|
42
|
+
|
4
43
|
# Build the endpoint using the client's api_base
|
5
44
|
url = (
|
6
45
|
f"{client.api_base}/v1/indic_visual_query"
|
7
|
-
f"?src_lang={
|
46
|
+
f"?src_lang={src_lang_code}&tgt_lang={tgt_lang_code}"
|
8
47
|
)
|
9
48
|
headers = {
|
10
49
|
**client._headers(),
|
11
50
|
"accept": "application/json"
|
12
|
-
# Note: 'Content-Type' will be set automatically by requests when using 'files'
|
13
51
|
}
|
14
52
|
with open(file_path, "rb") as f:
|
15
53
|
files = {"file": (file_path, f, "image/png")}
|
@@ -28,4 +66,4 @@ class Vision:
|
|
28
66
|
@staticmethod
|
29
67
|
def caption(*args, **kwargs):
|
30
68
|
from . import _get_client
|
31
|
-
return _get_client().caption(*args, **kwargs)
|
69
|
+
return _get_client().caption(*args, **kwargs)
|
@@ -1,7 +1,7 @@
|
|
1
1
|
Metadata-Version: 2.4
|
2
2
|
Name: dwani
|
3
|
-
Version: 0.1.
|
4
|
-
Summary: Multimodal API for Indian languages (
|
3
|
+
Version: 0.1.7
|
4
|
+
Summary: Multimodal API for Indian languages (Chat, Vision, TTS, ASR, Translate, Docs)
|
5
5
|
Author-email: sachin <python@dwani.ai>
|
6
6
|
License: MIT License
|
7
7
|
|
@@ -42,6 +42,9 @@ Dynamic: license-file
|
|
42
42
|
pip install dwani
|
43
43
|
```
|
44
44
|
|
45
|
+
### Languages supported
|
46
|
+
- Assamese, Bengali, Gujarati, Hindi, Kannada, Malayalam, Marathi, Odia, Punjabi, Tamil, Telugu
|
47
|
+
|
45
48
|
### Setup the credentials
|
46
49
|
```python
|
47
50
|
import dwani
|
@@ -59,6 +62,10 @@ dwani.api_base = os.getenv("DWANI_API_BASE_URL")
|
|
59
62
|
resp = dwani.Chat.create(prompt="Hello!", src_lang="eng_Latn", tgt_lang="kan_Knda")
|
60
63
|
print(resp)
|
61
64
|
```
|
65
|
+
```json
|
66
|
+
{'response': 'ನಮಸ್ತೆ! ಭಾರತ ಮತ್ತು ಕರ್ನಾಟಕವನ್ನು ಗಮನದಲ್ಲಿಟ್ಟುಕೊಂಡು ಇಂದು ನಿಮ್ಮ ಪ್ರಶ್ನೆಗಳಿಗೆ ನಾನು ನಿಮಗೆ ಹೇಗೆ ಸಹಾಯ ಮಾಡಲಿ?'}
|
67
|
+
```
|
68
|
+
|
62
69
|
|
63
70
|
#### Vision Query
|
64
71
|
```python
|
@@ -70,13 +77,27 @@ result = dwani.Vision.caption(
|
|
70
77
|
)
|
71
78
|
print(result)
|
72
79
|
```
|
80
|
+
```json
|
81
|
+
{'answer': 'ಒಂದು ವಾಕ್ಯದಲ್ಲಿ ಚಿತ್ರದ ಸಾರಾಂಶವನ್ನು ಇಲ್ಲಿ ನೀಡಲಾಗಿದೆಃ ಪ್ರಕಟಣೆಯ ಅವಲೋಕನವು ಪ್ರಸ್ತುತ ಅರವತ್ತನಾಲ್ಕು ದೇಶಗಳು/ಪ್ರದೇಶಗಳನ್ನು ಸೇರಿಸಲಾಗಿದೆ ಮತ್ತು ಇನ್ನೂ ಹದಿನಾರು ಪ್ರದೇಶಗಳನ್ನು ಸೇರಿಸಬೇಕಾಗಿದೆ. ಒದಗಿಸಲಾದ ಚಿತ್ರದಲ್ಲಿ ಲಾಂಛನವು ಕಾಣಿಸುವುದಿಲ್ಲ.'}
|
82
|
+
```
|
73
83
|
|
74
84
|
#### Speech to Text - Automatic Speech Recognition (ASR)
|
75
85
|
```python
|
76
86
|
result = dwani.ASR.transcribe(file_path="kannada_sample.wav", language="kannada")
|
77
87
|
print(result)
|
78
88
|
```
|
89
|
+
```json
|
90
|
+
{'text': 'ಕರ್ನಾಟಕ ದ ರಾಜಧಾನಿ ಯಾವುದು'}
|
91
|
+
```
|
79
92
|
|
93
|
+
#### Translate
|
94
|
+
```python
|
95
|
+
resp = dwani.Translate.run_translate(sentences=["hi"], src_lang="eng_Latn", tgt_lang="kan_Knda")
|
96
|
+
print(resp)
|
97
|
+
```
|
98
|
+
```json
|
99
|
+
{'translations': ['ಹಾಯ್']}
|
100
|
+
```
|
80
101
|
#### Text to Speech - Speech Synthesis
|
81
102
|
|
82
103
|
```python
|
@@ -85,16 +106,18 @@ with open("output.mp3", "wb") as f:
|
|
85
106
|
f.write(response)
|
86
107
|
```
|
87
108
|
|
88
|
-
|
109
|
+
#### Document - Extract Text
|
110
|
+
```python
|
111
|
+
result = dwani.Documents.run_extract(file_path = "dwani-workshop.pdf", page_number=1, src_lang="eng_Latn",tgt_lang="kan_Knda" )
|
112
|
+
print(result)
|
113
|
+
```
|
114
|
+
```json
|
115
|
+
{'pages': [{'processed_page': 1, 'page_content': ' a plain text representation of the document', 'translated_content': 'ಡಾಕ್ಯುಮೆಂಟ್ನ ಸರಳ ಪಠ್ಯ ಪ್ರಾತಿನಿಧ್ಯವನ್ನು ಇಲ್ಲಿ ನೀಡಲಾಗಿದೆ, ಅದನ್ನು ಸ್ವಾಭಾವಿಕವಾಗಿ ಓದುವಂತೆಃ'}]}
|
116
|
+
```
|
89
117
|
|
90
118
|
- Website -> [dwani.ai](https://dwani.ai)
|
91
119
|
|
92
120
|
|
93
|
-
|
94
|
-
#### Contact
|
95
|
-
- For any questions or issues, please open an issue on GitHub or contact us via email.
|
96
|
-
- For collaborations
|
97
|
-
- Join the discord group - [invite link](https://discord.gg/WZMCerEZ2P)
|
98
121
|
<!--
|
99
122
|
## local development
|
100
123
|
pip install -e .
|
@@ -0,0 +1,14 @@
|
|
1
|
+
dwani/__init__.py,sha256=ldO5OND7DvJlbxaQ0R57Cc73jJTnCSslDDt4I4r-Op8,1895
|
2
|
+
dwani/asr.py,sha256=3LYrLOaMhc5eXKFSoi63C8KAvwZI2NcuO25pwTfSVe0,1692
|
3
|
+
dwani/audio.py,sha256=Q9vw4uBxGy1vQzmiZjZGrY8hkAEQNkGhjz5OcnpFEQQ,888
|
4
|
+
dwani/chat.py,sha256=dQCl8lLQczwnAsvYlTZowd471ktRVZcW3w8gZ5Wpzms,2097
|
5
|
+
dwani/client.py,sha256=OrnwqxBQMfEZ1iQEleFigNujiZve3ox53yv5aSmB3iQ,2849
|
6
|
+
dwani/docs.py,sha256=EO41opJwfDFsNmH6nQl-HOsyWravCnj1f5ZDgxSZECI,6323
|
7
|
+
dwani/exceptions.py,sha256=qEN5ukqlnN7v-kHNEnISWFMpPMt6uTft9mPsTXJ4LVA,227
|
8
|
+
dwani/translate.py,sha256=IJiKrYIfwdJKc_PjlZKVRAwzpQDst_2MF_B_huxid_E,2185
|
9
|
+
dwani/vision.py,sha256=wN7WkMRVmLrZnBJxnam7vihTXWGlWJ4JqXgyrp-tbrg,2330
|
10
|
+
dwani-0.1.7.dist-info/licenses/LICENSE,sha256=IAD8tbwWZbPWHXgYjabHoMv0aaUzZUYzYiEbfhTCisY,1070
|
11
|
+
dwani-0.1.7.dist-info/METADATA,sha256=ggOY4wss1nwN6PzhB0BZG5332emrP6C76qwjaK2mzSs,4810
|
12
|
+
dwani-0.1.7.dist-info/WHEEL,sha256=Nw36Djuh_5VDukK0H78QzOX-_FQEo6V37m3nkm96gtU,91
|
13
|
+
dwani-0.1.7.dist-info/top_level.txt,sha256=AM5EhkyuO_EXQFR9JIxEV6tAYMCCyc-a1dLifpCGBUk,6
|
14
|
+
dwani-0.1.7.dist-info/RECORD,,
|
dwani-0.1.5.dist-info/RECORD
DELETED
@@ -1,14 +0,0 @@
|
|
1
|
-
dwani/__init__.py,sha256=P2pyHkZ7JHn6lHSEbCdV4hjYAwCOXHN3RbsNIU0F5PE,1084
|
2
|
-
dwani/asr.py,sha256=Y5Mbv1KsvhfXNZacMZycUHPn79NRQC-XPH0j9SYPUSY,590
|
3
|
-
dwani/audio.py,sha256=Q9vw4uBxGy1vQzmiZjZGrY8hkAEQNkGhjz5OcnpFEQQ,888
|
4
|
-
dwani/chat.py,sha256=WFuEShNd4nd6KUbIZTkm3eyPGoP33GepOLJax86nNn8,720
|
5
|
-
dwani/client.py,sha256=saQxRBcERSMoCMOqBIe_IqRygh9-e4KxF3iZZvBEZDc,1826
|
6
|
-
dwani/docs.py,sha256=2B87KqshPl7-2gDJAJxdvcgmPWuC2IQ1FcsDIyeVJPg,2202
|
7
|
-
dwani/exceptions.py,sha256=qEN5ukqlnN7v-kHNEnISWFMpPMt6uTft9mPsTXJ4LVA,227
|
8
|
-
dwani/translate.py,sha256=nYB62DLoPf7Weg26aNtpoEpyasDIsArVTzl5xKPp6eI,972
|
9
|
-
dwani/vision.py,sha256=JtMSS0hI-8gxtLugVP10__enZsPPy8jheMyWXvrGrdw,1015
|
10
|
-
dwani-0.1.5.dist-info/licenses/LICENSE,sha256=IAD8tbwWZbPWHXgYjabHoMv0aaUzZUYzYiEbfhTCisY,1070
|
11
|
-
dwani-0.1.5.dist-info/METADATA,sha256=qxXqLp_wZG_eoGD29p1HdVZFjfpG4ExxJ1xDeyb6O7U,3118
|
12
|
-
dwani-0.1.5.dist-info/WHEEL,sha256=DnLRTWE75wApRYVsjgc6wsVswC54sMSJhAEd4xhDpBk,91
|
13
|
-
dwani-0.1.5.dist-info/top_level.txt,sha256=AM5EhkyuO_EXQFR9JIxEV6tAYMCCyc-a1dLifpCGBUk,6
|
14
|
-
dwani-0.1.5.dist-info/RECORD,,
|
File without changes
|
File without changes
|