dwani 0.1.5__py3-none-any.whl → 0.1.7__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
dwani/__init__.py CHANGED
@@ -3,9 +3,11 @@ from .chat import Chat
3
3
  from .audio import Audio
4
4
  from .vision import Vision
5
5
  from .asr import ASR
6
+ from .translate import Translate
6
7
  from .exceptions import DhwaniAPIError
8
+ from .docs import Documents
7
9
 
8
- __all__ = ["DhwaniClient", "Chat", "Audio", "Vision", "ASR", "DhwaniAPIError"]
10
+ __all__ = ["DhwaniClient", "Chat", "Audio", "Vision", "ASR", "DhwaniAPIError", "Translate", "Documents"]
9
11
 
10
12
  # Optionally, instantiate a default client for convenience
11
13
  api_key = None
@@ -37,3 +39,27 @@ class asr:
37
39
  @staticmethod
38
40
  def transcribe(*args, **kwargs):
39
41
  return _get_client().transcribe(*args, **kwargs)
42
+
43
+
44
+ class translate:
45
+ @staticmethod
46
+ def run_translate(*args, **kwargs):
47
+ return _get_client().translate(*args, **kwargs)
48
+
49
+
50
+ class document:
51
+ @staticmethod
52
+ def run_ocr(*args, **kwargs):
53
+ return _get_client().ocr(*args, **kwargs)
54
+ @staticmethod
55
+ def run_summarize(*args, **kwargs):
56
+ return _get_client().summarize(*args, **kwargs)
57
+ @staticmethod
58
+ def run_extract(*args, **kwargs):
59
+ return _get_client().extract(*args, **kwargs)
60
+ @staticmethod
61
+ def run_doc_query(*args, **kwargs):
62
+ return _get_client().doc_query(*args, **kwargs)
63
+ @staticmethod
64
+ def run_doc_query_kannada(*args, **kwargs):
65
+ return _get_client().doc_query_kannada(*args, **kwargs)
dwani/asr.py CHANGED
@@ -1,10 +1,44 @@
1
1
  from .exceptions import DhwaniAPIError
2
2
  import requests
3
+
4
+ # Allowed languages (case-sensitive for display, but we'll handle case-insensitively)
5
+ ALLOWED_LANGUAGES = [
6
+ "Assamese",
7
+ "Bengali",
8
+ "Gujarati",
9
+ "Hindi",
10
+ "Kannada",
11
+ "Malayalam",
12
+ "Marathi",
13
+ "Odia",
14
+ "Punjabi",
15
+ "Tamil",
16
+ "Telugu"
17
+ ]
18
+
19
+ def validate_language(language):
20
+ """Validate that the provided language is in the allowed list (case-insensitive)."""
21
+ # Create a case-insensitive mapping of allowed languages
22
+ language_map = {lang.lower(): lang for lang in ALLOWED_LANGUAGES}
23
+ # Check if the lowercase version of the input language is in the map
24
+ if language.lower() not in language_map:
25
+ raise ValueError(
26
+ f"Unsupported language: {language}. Supported languages: {ALLOWED_LANGUAGES}"
27
+ )
28
+ # Return the original case from ALLOWED_LANGUAGES for consistency
29
+ return language_map[language.lower()]
30
+
3
31
  def asr_transcribe(client, file_path, language):
32
+ # Validate the language input (case-insensitive)
33
+ validated_language = validate_language(language)
34
+
35
+ # Convert language to lowercase for the API request
36
+ api_language = validated_language.lower()
37
+
4
38
  with open(file_path, "rb") as f:
5
39
  files = {"file": f}
6
40
  resp = requests.post(
7
- f"{client.api_base}/v1/transcribe/?language={language}",
41
+ f"{client.api_base}/v1/transcribe/?language={api_language}",
8
42
  headers=client._headers(),
9
43
  files=files
10
44
  )
@@ -16,5 +50,4 @@ class ASR:
16
50
  @staticmethod
17
51
  def transcribe(*args, **kwargs):
18
52
  from . import _get_client
19
- return _get_client().transcribe(*args, **kwargs)
20
-
53
+ return _get_client().transcribe(*args, **kwargs)
dwani/chat.py CHANGED
@@ -1,12 +1,50 @@
1
1
  from .exceptions import DhwaniAPIError
2
2
  import requests
3
3
 
4
+ # Language options mapping
5
+ language_options = [
6
+ ("English", "eng_Latn"),
7
+ ("Kannada", "kan_Knda"),
8
+ ("Hindi", "hin_Deva"),
9
+ ("Assamese", "asm_Beng"),
10
+ ("Bengali","ben_Beng"),
11
+ ("Gujarati","guj_Gujr"),
12
+ ("Malayalam","mal_Mlym"),
13
+ ("Marathi","mar_Deva"),
14
+ ("Odia","ory_Orya"),
15
+ ("Punjabi","pan_Guru"),
16
+ ("Tamil","tam_Taml"),
17
+ ("Telugu","tel_Telu")
18
+ ]
19
+
20
+ # Create a dictionary for language name to code mapping
21
+ lang_name_to_code = {name.lower(): code for name, code in language_options}
22
+ lang_code_to_code = {code: code for _, code in language_options}
23
+
24
+ def normalize_language(lang):
25
+ """Convert language input (name or code) to language code."""
26
+ lang = lang.strip()
27
+ # Check if input is a language name (case-insensitive)
28
+ lang_lower = lang.lower()
29
+ if lang_lower in lang_name_to_code:
30
+ return lang_name_to_code[lang_lower]
31
+ # Check if input is a language code
32
+ if lang in lang_code_to_code:
33
+ return lang_code_to_code[lang]
34
+ # Raise error if language is not supported
35
+ supported_langs = list(lang_name_to_code.keys()) + list(lang_code_to_code.keys())
36
+ raise ValueError(f"Unsupported language: {lang}. Supported languages: {supported_langs}")
37
+
4
38
  def chat_create(client, prompt, src_lang, tgt_lang, **kwargs):
39
+ # Normalize source and target languages
40
+ src_lang_code = normalize_language(src_lang)
41
+ tgt_lang_code = normalize_language(tgt_lang)
42
+
5
43
  url = f"{client.api_base}/v1/indic_chat"
6
44
  payload = {
7
45
  "prompt": prompt,
8
- "src_lang": src_lang,
9
- "tgt_lang": tgt_lang
46
+ "src_lang": src_lang_code,
47
+ "tgt_lang": tgt_lang_code
10
48
  }
11
49
  payload.update(kwargs)
12
50
  resp = requests.post(
@@ -22,4 +60,4 @@ class Chat:
22
60
  @staticmethod
23
61
  def create(prompt, src_lang, tgt_lang, **kwargs):
24
62
  from . import _get_client
25
- return _get_client().chat(prompt, src_lang, tgt_lang, **kwargs)
63
+ return _get_client().chat(prompt, src_lang, tgt_lang, **kwargs)
dwani/client.py CHANGED
@@ -12,35 +12,43 @@ class DhwaniClient:
12
12
  def _headers(self):
13
13
  return {"X-API-Key": self.api_key}
14
14
 
15
- def chat(self, prompt, src_lang, tgt_lang, **kwargs):
16
- from .chat import chat_create
17
- return chat_create(self, prompt, src_lang, tgt_lang, **kwargs)
18
-
19
15
  def translate(self, sentences, src_lang, tgt_lang, **kwargs):
20
16
  from .translate import run_translate
21
- return run_translate(self, sentences=sentences,src_lang= src_lang, tgt_lang=tgt_lang, **kwargs)
17
+ return run_translate(self, sentences=sentences, src_lang=src_lang, tgt_lang=tgt_lang, **kwargs)
22
18
 
23
- def speech(self, *args, **kwargs):
19
+ def chat(self, prompt, src_lang, tgt_lang, **kwargs):
20
+ from .chat import chat_create
21
+ return chat_create(self, prompt=prompt, src_lang=src_lang, tgt_lang=tgt_lang, **kwargs)
22
+
23
+ def speech(self, input, response_format="mp3", **kwargs):
24
24
  from .audio import audio_speech
25
- return audio_speech(self, *args, **kwargs)
25
+ return audio_speech(self, input=input, response_format=response_format, **kwargs)
26
26
 
27
- def caption(self, file_path, query="describe the image", src_lang="eng_Latn", tgt_lang="kan_Knda"):
27
+ def caption(self, file_path, query="describe the image", src_lang="eng_Latn", tgt_lang="kan_Knda", **kwargs):
28
28
  from .vision import vision_caption
29
- return vision_caption(self, file_path, query, src_lang, tgt_lang)
29
+ return vision_caption(self, file_path=file_path, query=query, src_lang=src_lang, tgt_lang=tgt_lang, **kwargs)
30
30
 
31
- def transcribe(self, *args, **kwargs):
31
+ def transcribe(self, file_path, language=None, **kwargs):
32
32
  from .asr import asr_transcribe
33
- return asr_transcribe(self, *args, **kwargs)
33
+ return asr_transcribe(self, file_path=file_path, language=language, **kwargs)
34
34
 
35
- def document_ocr(self, file_path, language=None):
35
+ def document_ocr(self, file_path, language=None, **kwargs):
36
36
  from .docs import document_ocr
37
- return document_ocr(self, file_path, language)
38
-
39
- def document_translate(self, file_path, src_lang, tgt_lang):
40
- from .docs import document_translate
41
- return document_translate(self, file_path, src_lang, tgt_lang)
37
+ return document_ocr(self, file_path=file_path, language=language, **kwargs)
42
38
 
43
- def document_summarize(self, file_path, language=None):
39
+ def document_summarize(self, file_path, page_number=1, src_lang="eng_Latn", tgt_lang="kan_Knda", **kwargs):
44
40
  from .docs import document_summarize
45
- return document_summarize(self, file_path, language)
41
+ return document_summarize(self, file_path, page_number, src_lang, tgt_lang, **kwargs)
42
+
43
+ def extract(self, file_path, page_number=1, src_lang="eng_Latn", tgt_lang="kan_Knda", **kwargs):
44
+ from .docs import extract
45
+ return extract(self, file_path=file_path, page_number=page_number, src_lang=src_lang,tgt_lang=tgt_lang, **kwargs)
46
+
47
+
48
+ def doc_query( self, file_path, page_number=1, prompt="list the key points", src_lang="eng_Latn", tgt_lang="kan_Knda" , **kwargs ):
49
+ from .docs import doc_query
50
+ return doc_query( self, file_path, page_number=page_number, prompt=prompt, src_lang=src_lang, tgt_lang=tgt_lang , **kwargs )
46
51
 
52
+ def doc_query_kannada(self, file_path, page_number=1, prompt="list key points", src_lang="eng_Latn", language=None, **kwargs):
53
+ from .docs import doc_query_kannada
54
+ return doc_query_kannada(self, file_path=file_path, page_number=page_number, prompt=prompt, src_lang=src_lang, language=language, **kwargs)
dwani/docs.py CHANGED
@@ -1,13 +1,49 @@
1
1
  import requests
2
2
  from .exceptions import DhwaniAPIError
3
3
 
4
+ # Language options mapping
5
+ language_options = [
6
+ ("English", "eng_Latn"),
7
+ ("Kannada", "kan_Knda"),
8
+ ("Hindi", "hin_Deva"),
9
+ ("Assamese", "asm_Beng"),
10
+ ("Bengali", "ben_Beng"),
11
+ ("Gujarati", "guj_Gujr"),
12
+ ("Malayalam", "mal_Mlym"),
13
+ ("Marathi", "mar_Deva"),
14
+ ("Odia", "ory_Orya"),
15
+ ("Punjabi", "pan_Guru"),
16
+ ("Tamil", "tam_Taml"),
17
+ ("Telugu", "tel_Telu")
18
+ ]
19
+
20
+ # Create dictionaries for language name to code and code to code mapping
21
+ lang_name_to_code = {name.lower(): code for name, code in language_options}
22
+ lang_code_to_code = {code: code for _, code in language_options}
23
+
24
+ def normalize_language(lang):
25
+ """Convert language input (name or code) to language code."""
26
+ lang = lang.strip()
27
+ # Check if input is a language name (case-insensitive)
28
+ lang_lower = lang.lower()
29
+ if lang_lower in lang_name_to_code:
30
+ return lang_name_to_code[lang_lower]
31
+ # Check if input is a language code
32
+ if lang in lang_code_to_code:
33
+ return lang_code_to_code[lang]
34
+ # Raise error if language is not supported
35
+ supported_langs = list(lang_name_to_code.keys()) + list(lang_code_to_code.keys())
36
+ raise ValueError(f"Unsupported language: {lang}. Supported languages: {supported_langs}")
37
+
4
38
  def document_ocr(client, file_path, language=None):
5
39
  """OCR a document (image/PDF) and return extracted text."""
40
+ data = {}
41
+ if language:
42
+ # Normalize the language input
43
+ data["language"] = normalize_language(language)
44
+
6
45
  with open(file_path, "rb") as f:
7
46
  files = {"file": f}
8
- data = {}
9
- if language:
10
- data["language"] = language
11
47
  resp = requests.post(
12
48
  f"{client.api_base}/v1/document/ocr",
13
49
  headers=client._headers(),
@@ -18,17 +54,24 @@ def document_ocr(client, file_path, language=None):
18
54
  raise DhwaniAPIError(resp)
19
55
  return resp.json()
20
56
 
21
- def document_translate(client, file_path, src_lang, tgt_lang):
22
- """Translate a document (image/PDF with text) from src_lang to tgt_lang."""
57
+ def document_summarize(client, file_path, page_number=1, src_lang="eng_Latn", tgt_lang="kan_Knda"):
58
+ """Summarize a PDF document with language and page number options."""
59
+ # Normalize source and target languages
60
+ src_lang_code = normalize_language(src_lang)
61
+ tgt_lang_code = normalize_language(tgt_lang)
62
+
63
+ url = f"{client.api_base}/v1/indic-summarize-pdf"
64
+ headers = client._headers()
23
65
  with open(file_path, "rb") as f:
24
- files = {"file": f}
66
+ files = {"file": (file_path, f, "application/pdf")}
25
67
  data = {
26
- "src_lang": src_lang,
27
- "tgt_lang": tgt_lang
68
+ "page_number": str(page_number),
69
+ "src_lang": src_lang_code,
70
+ "tgt_lang": tgt_lang_code
28
71
  }
29
72
  resp = requests.post(
30
- f"{client.api_base}/v1/document/translate",
31
- headers=client._headers(),
73
+ url,
74
+ headers=headers,
32
75
  files=files,
33
76
  data=data
34
77
  )
@@ -36,16 +79,90 @@ def document_translate(client, file_path, src_lang, tgt_lang):
36
79
  raise DhwaniAPIError(resp)
37
80
  return resp.json()
38
81
 
39
- def document_summarize(client, file_path, language=None):
40
- """Summarize a document (image/PDF/text)."""
82
+ def extract(client, file_path, page_number, src_lang, tgt_lang):
83
+ """
84
+ Extract and translate text from a document (image/PDF) using query parameters.
85
+ """
86
+ # Normalize source and target languages
87
+ src_lang_code = normalize_language(src_lang)
88
+ tgt_lang_code = normalize_language(tgt_lang)
89
+
90
+ # Build the URL with query parameters
91
+ url = (
92
+ f"{client.api_base}/v1/indic-extract-text/"
93
+ f"?page_number={page_number}&src_lang={src_lang_code}&tgt_lang={tgt_lang_code}"
94
+ )
95
+ headers = client._headers()
41
96
  with open(file_path, "rb") as f:
42
- files = {"file": f}
43
- data = {}
44
- if language:
45
- data["language"] = language
97
+ files = {"file": (file_path, f, "application/pdf")}
46
98
  resp = requests.post(
47
- f"{client.api_base}/v1/document/summarize",
48
- headers=client._headers(),
99
+ url,
100
+ headers=headers,
101
+ files=files
102
+ )
103
+ if resp.status_code != 200:
104
+ raise DhwaniAPIError(resp)
105
+ return resp.json()
106
+
107
+ def doc_query(
108
+ client,
109
+ file_path,
110
+ page_number=1,
111
+ prompt="list the key points",
112
+ src_lang="eng_Latn",
113
+ tgt_lang="kan_Knda"
114
+ ):
115
+ """Query a document with a custom prompt and language options."""
116
+ # Normalize source and target languages
117
+ src_lang_code = normalize_language(src_lang)
118
+ tgt_lang_code = normalize_language(tgt_lang)
119
+
120
+ url = f"{client.api_base}/v1/indic-custom-prompt-pdf"
121
+ headers = client._headers()
122
+ with open(file_path, "rb") as f:
123
+ files = {"file": (file_path, f, "application/pdf")}
124
+ data = {
125
+ "page_number": str(page_number),
126
+ "prompt": prompt,
127
+ "source_language": src_lang_code,
128
+ "target_language": tgt_lang_code
129
+ }
130
+ resp = requests.post(
131
+ url,
132
+ headers=headers,
133
+ files=files,
134
+ data=data
135
+ )
136
+ if resp.status_code != 200:
137
+ raise DhwaniAPIError(resp)
138
+ return resp.json()
139
+
140
+ def doc_query_kannada(
141
+ client,
142
+ file_path,
143
+ page_number=1,
144
+ prompt="list key points",
145
+ src_lang="eng_Latn",
146
+ language=None
147
+ ):
148
+ """Summarize a document (image/PDF/text) with custom prompt and language."""
149
+ # Normalize source language and optional language parameter
150
+ src_lang_code = normalize_language(src_lang)
151
+ data = {
152
+ "page_number": str(page_number),
153
+ "prompt": prompt,
154
+ "src_lang": src_lang_code,
155
+ }
156
+ if language:
157
+ data["language"] = normalize_language(language)
158
+
159
+ url = f"{client.api_base}/v1/indic-custom-prompt-kannada-pdf"
160
+ headers = client._headers()
161
+ with open(file_path, "rb") as f:
162
+ files = {"file": (file_path, f, "application/pdf")}
163
+ resp = requests.post(
164
+ url,
165
+ headers=headers,
49
166
  files=files,
50
167
  data=data
51
168
  )
@@ -60,11 +177,21 @@ class Documents:
60
177
  return _get_client().document_ocr(file_path, language)
61
178
 
62
179
  @staticmethod
63
- def translate(file_path, src_lang, tgt_lang):
180
+ def summarize(*args, **kwargs):
64
181
  from . import _get_client
65
- return _get_client().document_translate(file_path, src_lang, tgt_lang)
66
-
182
+ return _get_client().document_summarize(*args, **kwargs)
183
+
184
+ @staticmethod
185
+ def run_extract(*args, **kwargs):
186
+ from . import _get_client
187
+ return _get_client().extract(*args, **kwargs)
188
+
189
+ @staticmethod
190
+ def run_doc_query(*args, **kwargs):
191
+ from . import _get_client
192
+ return _get_client().doc_query(*args, **kwargs)
193
+
67
194
  @staticmethod
68
- def summarize(file_path, language=None):
195
+ def run_doc_query_kannada(*args, **kwargs):
69
196
  from . import _get_client
70
- return _get_client().document_summarize(file_path, language)
197
+ return _get_client().doc_query_kannada(*args, **kwargs)
dwani/translate.py CHANGED
@@ -1,12 +1,50 @@
1
1
  from .exceptions import DhwaniAPIError
2
2
  import requests
3
3
 
4
+ # Language options mapping
5
+ language_options = [
6
+ ("English", "eng_Latn"),
7
+ ("Kannada", "kan_Knda"),
8
+ ("Hindi", "hin_Deva"),
9
+ ("Assamese", "asm_Beng"),
10
+ ("Bengali", "ben_Beng"),
11
+ ("Gujarati", "guj_Gujr"),
12
+ ("Malayalam", "mal_Mlym"),
13
+ ("Marathi", "mar_Deva"),
14
+ ("Odia", "ory_Orya"),
15
+ ("Punjabi", "pan_Guru"),
16
+ ("Tamil", "tam_Taml"),
17
+ ("Telugu", "tel_Telu")
18
+ ]
19
+
20
+ # Create dictionaries for language name to code and code to code mapping
21
+ lang_name_to_code = {name.lower(): code for name, code in language_options}
22
+ lang_code_to_code = {code: code for _, code in language_options}
23
+
24
+ def normalize_language(lang):
25
+ """Convert language input (name or code) to language code."""
26
+ lang = lang.strip()
27
+ # Check if input is a language name (case-insensitive)
28
+ lang_lower = lang.lower()
29
+ if lang_lower in lang_name_to_code:
30
+ return lang_name_to_code[lang_lower]
31
+ # Check if input is a language code
32
+ if lang in lang_code_to_code:
33
+ return lang_code_to_code[lang]
34
+ # Raise error if language is not supported
35
+ supported_langs = list(lang_name_to_code.keys()) + list(lang_code_to_code.keys())
36
+ raise ValueError(f"Unsupported language: {lang}. Supported languages: {supported_langs}")
37
+
4
38
  def run_translate(client, sentences, src_lang, tgt_lang, **kwargs):
39
+ # Normalize source and target languages
40
+ src_lang_code = normalize_language(src_lang)
41
+ tgt_lang_code = normalize_language(tgt_lang)
42
+
5
43
  url = f"{client.api_base}/v1/translate"
6
44
  payload = {
7
45
  "sentences": sentences,
8
- "src_lang": src_lang,
9
- "tgt_lang": tgt_lang
46
+ "src_lang": src_lang_code,
47
+ "tgt_lang": tgt_lang_code
10
48
  }
11
49
  payload.update(kwargs)
12
50
  resp = requests.post(
@@ -20,10 +58,6 @@ def run_translate(client, sentences, src_lang, tgt_lang, **kwargs):
20
58
 
21
59
  class Translate:
22
60
  @staticmethod
23
- def translate(sentence, src_lang, tgt_lang, **kwargs):
61
+ def run_translate(sentences, src_lang, tgt_lang, **kwargs):
24
62
  from . import _get_client
25
- client = _get_client()
26
- # Ensure sentences is always a list
27
- response = run_translate(client, [sentence], src_lang, tgt_lang, **kwargs)
28
- # Return the first translation, or None if not found
29
- return response.get("translations", [None])[0]
63
+ return _get_client().translate(sentences, src_lang, tgt_lang, **kwargs)
dwani/vision.py CHANGED
@@ -1,15 +1,53 @@
1
1
  from .exceptions import DhwaniAPIError
2
2
  import requests
3
+
4
+ # Language options mapping
5
+ language_options = [
6
+ ("English", "eng_Latn"),
7
+ ("Kannada", "kan_Knda"),
8
+ ("Hindi", "hin_Deva"),
9
+ ("Assamese", "asm_Beng"),
10
+ ("Bengali", "ben_Beng"),
11
+ ("Gujarati", "guj_Gujr"),
12
+ ("Malayalam", "mal_Mlym"),
13
+ ("Marathi", "mar_Deva"),
14
+ ("Odia", "ory_Orya"),
15
+ ("Punjabi", "pan_Guru"),
16
+ ("Tamil", "tam_Taml"),
17
+ ("Telugu", "tel_Telu")
18
+ ]
19
+
20
+ # Create dictionaries for language name to code and code to code mapping
21
+ lang_name_to_code = {name.lower(): code for name, code in language_options}
22
+ lang_code_to_code = {code: code for _, code in language_options}
23
+
24
+ def normalize_language(lang):
25
+ """Convert language input (name or code) to language code."""
26
+ lang = lang.strip()
27
+ # Check if input is a language name (case-insensitive)
28
+ lang_lower = lang.lower()
29
+ if lang_lower in lang_name_to_code:
30
+ return lang_name_to_code[lang_lower]
31
+ # Check if input is a language code
32
+ if lang in lang_code_to_code:
33
+ return lang_code_to_code[lang]
34
+ # Raise error if language is not supported
35
+ supported_langs = list(lang_name_to_code.keys()) + list(lang_code_to_code.keys())
36
+ raise ValueError(f"Unsupported language: {lang}. Supported languages: {supported_langs}")
37
+
3
38
  def vision_caption(client, file_path, query="describe the image", src_lang="eng_Latn", tgt_lang="kan_Knda"):
39
+ # Normalize source and target languages
40
+ src_lang_code = normalize_language(src_lang)
41
+ tgt_lang_code = normalize_language(tgt_lang)
42
+
4
43
  # Build the endpoint using the client's api_base
5
44
  url = (
6
45
  f"{client.api_base}/v1/indic_visual_query"
7
- f"?src_lang={src_lang}&tgt_lang={tgt_lang}"
46
+ f"?src_lang={src_lang_code}&tgt_lang={tgt_lang_code}"
8
47
  )
9
48
  headers = {
10
49
  **client._headers(),
11
50
  "accept": "application/json"
12
- # Note: 'Content-Type' will be set automatically by requests when using 'files'
13
51
  }
14
52
  with open(file_path, "rb") as f:
15
53
  files = {"file": (file_path, f, "image/png")}
@@ -28,4 +66,4 @@ class Vision:
28
66
  @staticmethod
29
67
  def caption(*args, **kwargs):
30
68
  from . import _get_client
31
- return _get_client().caption(*args, **kwargs)
69
+ return _get_client().caption(*args, **kwargs)
@@ -1,7 +1,7 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: dwani
3
- Version: 0.1.5
4
- Summary: Multimodal API for Indian languages (speech, vision, LLMs, TTS, ASR, etc.)
3
+ Version: 0.1.7
4
+ Summary: Multimodal API for Indian languages (Chat, Vision, TTS, ASR, Translate, Docs)
5
5
  Author-email: sachin <python@dwani.ai>
6
6
  License: MIT License
7
7
 
@@ -42,6 +42,9 @@ Dynamic: license-file
42
42
  pip install dwani
43
43
  ```
44
44
 
45
+ ### Languages supported
46
+ - Assamese, Bengali, Gujarati, Hindi, Kannada, Malayalam, Marathi, Odia, Punjabi, Tamil, Telugu
47
+
45
48
  ### Setup the credentials
46
49
  ```python
47
50
  import dwani
@@ -59,6 +62,10 @@ dwani.api_base = os.getenv("DWANI_API_BASE_URL")
59
62
  resp = dwani.Chat.create(prompt="Hello!", src_lang="eng_Latn", tgt_lang="kan_Knda")
60
63
  print(resp)
61
64
  ```
65
+ ```json
66
+ {'response': 'ನಮಸ್ತೆ! ಭಾರತ ಮತ್ತು ಕರ್ನಾಟಕವನ್ನು ಗಮನದಲ್ಲಿಟ್ಟುಕೊಂಡು ಇಂದು ನಿಮ್ಮ ಪ್ರಶ್ನೆಗಳಿಗೆ ನಾನು ನಿಮಗೆ ಹೇಗೆ ಸಹಾಯ ಮಾಡಲಿ?'}
67
+ ```
68
+
62
69
 
63
70
  #### Vision Query
64
71
  ```python
@@ -70,13 +77,27 @@ result = dwani.Vision.caption(
70
77
  )
71
78
  print(result)
72
79
  ```
80
+ ```json
81
+ {'answer': 'ಒಂದು ವಾಕ್ಯದಲ್ಲಿ ಚಿತ್ರದ ಸಾರಾಂಶವನ್ನು ಇಲ್ಲಿ ನೀಡಲಾಗಿದೆಃ ಪ್ರಕಟಣೆಯ ಅವಲೋಕನವು ಪ್ರಸ್ತುತ ಅರವತ್ತನಾಲ್ಕು ದೇಶಗಳು/ಪ್ರದೇಶಗಳನ್ನು ಸೇರಿಸಲಾಗಿದೆ ಮತ್ತು ಇನ್ನೂ ಹದಿನಾರು ಪ್ರದೇಶಗಳನ್ನು ಸೇರಿಸಬೇಕಾಗಿದೆ. ಒದಗಿಸಲಾದ ಚಿತ್ರದಲ್ಲಿ ಲಾಂಛನವು ಕಾಣಿಸುವುದಿಲ್ಲ.'}
82
+ ```
73
83
 
74
84
  #### Speech to Text - Automatic Speech Recognition (ASR)
75
85
  ```python
76
86
  result = dwani.ASR.transcribe(file_path="kannada_sample.wav", language="kannada")
77
87
  print(result)
78
88
  ```
89
+ ```json
90
+ {'text': 'ಕರ್ನಾಟಕ ದ ರಾಜಧಾನಿ ಯಾವುದು'}
91
+ ```
79
92
 
93
+ ### Translate
94
+ ```python
95
+ resp = dwani.Translate.run_translate(sentences=["hi"], src_lang="eng_Latn", tgt_lang="kan_Knda")
96
+ print(resp)
97
+ ```
98
+ ```json
99
+ {'translations': ['ಹಾಯ್']}
100
+ ```
80
101
  #### Text to Speech - Speech Synthesis
81
102
 
82
103
  ```python
@@ -85,16 +106,18 @@ with open("output.mp3", "wb") as f:
85
106
  f.write(response)
86
107
  ```
87
108
 
88
-
109
+ #### Document - Extract Text
110
+ ```python
111
+ result = dwani.Documents.run_extract(file_path = "dwani-workshop.pdf", page_number=1, src_lang="eng_Latn",tgt_lang="kan_Knda" )
112
+ print(result)
113
+ ```
114
+ ```json
115
+ {'pages': [{'processed_page': 1, 'page_content': ' a plain text representation of the document', 'translated_content': 'ಡಾಕ್ಯುಮೆಂಟ್ನ ಸರಳ ಪಠ್ಯ ಪ್ರಾತಿನಿಧ್ಯವನ್ನು ಇಲ್ಲಿ ನೀಡಲಾಗಿದೆ, ಅದನ್ನು ಸ್ವಾಭಾವಿಕವಾಗಿ ಓದುವಂತೆಃ'}]}
116
+ ```
89
117
 
90
118
  - Website -> [dwani.ai](https://dwani.ai)
91
119
 
92
120
 
93
-
94
- #### Contact
95
- - For any questions or issues, please open an issue on GitHub or contact us via email.
96
- - For collaborations
97
- - Join the discord group - [invite link](https://discord.gg/WZMCerEZ2P)
98
121
  <!--
99
122
  ## local development
100
123
  pip install -e .
@@ -0,0 +1,14 @@
1
+ dwani/__init__.py,sha256=ldO5OND7DvJlbxaQ0R57Cc73jJTnCSslDDt4I4r-Op8,1895
2
+ dwani/asr.py,sha256=3LYrLOaMhc5eXKFSoi63C8KAvwZI2NcuO25pwTfSVe0,1692
3
+ dwani/audio.py,sha256=Q9vw4uBxGy1vQzmiZjZGrY8hkAEQNkGhjz5OcnpFEQQ,888
4
+ dwani/chat.py,sha256=dQCl8lLQczwnAsvYlTZowd471ktRVZcW3w8gZ5Wpzms,2097
5
+ dwani/client.py,sha256=OrnwqxBQMfEZ1iQEleFigNujiZve3ox53yv5aSmB3iQ,2849
6
+ dwani/docs.py,sha256=EO41opJwfDFsNmH6nQl-HOsyWravCnj1f5ZDgxSZECI,6323
7
+ dwani/exceptions.py,sha256=qEN5ukqlnN7v-kHNEnISWFMpPMt6uTft9mPsTXJ4LVA,227
8
+ dwani/translate.py,sha256=IJiKrYIfwdJKc_PjlZKVRAwzpQDst_2MF_B_huxid_E,2185
9
+ dwani/vision.py,sha256=wN7WkMRVmLrZnBJxnam7vihTXWGlWJ4JqXgyrp-tbrg,2330
10
+ dwani-0.1.7.dist-info/licenses/LICENSE,sha256=IAD8tbwWZbPWHXgYjabHoMv0aaUzZUYzYiEbfhTCisY,1070
11
+ dwani-0.1.7.dist-info/METADATA,sha256=ggOY4wss1nwN6PzhB0BZG5332emrP6C76qwjaK2mzSs,4810
12
+ dwani-0.1.7.dist-info/WHEEL,sha256=Nw36Djuh_5VDukK0H78QzOX-_FQEo6V37m3nkm96gtU,91
13
+ dwani-0.1.7.dist-info/top_level.txt,sha256=AM5EhkyuO_EXQFR9JIxEV6tAYMCCyc-a1dLifpCGBUk,6
14
+ dwani-0.1.7.dist-info/RECORD,,
@@ -1,5 +1,5 @@
1
1
  Wheel-Version: 1.0
2
- Generator: setuptools (80.4.0)
2
+ Generator: setuptools (80.7.1)
3
3
  Root-Is-Purelib: true
4
4
  Tag: py3-none-any
5
5
 
@@ -1,14 +0,0 @@
1
- dwani/__init__.py,sha256=P2pyHkZ7JHn6lHSEbCdV4hjYAwCOXHN3RbsNIU0F5PE,1084
2
- dwani/asr.py,sha256=Y5Mbv1KsvhfXNZacMZycUHPn79NRQC-XPH0j9SYPUSY,590
3
- dwani/audio.py,sha256=Q9vw4uBxGy1vQzmiZjZGrY8hkAEQNkGhjz5OcnpFEQQ,888
4
- dwani/chat.py,sha256=WFuEShNd4nd6KUbIZTkm3eyPGoP33GepOLJax86nNn8,720
5
- dwani/client.py,sha256=saQxRBcERSMoCMOqBIe_IqRygh9-e4KxF3iZZvBEZDc,1826
6
- dwani/docs.py,sha256=2B87KqshPl7-2gDJAJxdvcgmPWuC2IQ1FcsDIyeVJPg,2202
7
- dwani/exceptions.py,sha256=qEN5ukqlnN7v-kHNEnISWFMpPMt6uTft9mPsTXJ4LVA,227
8
- dwani/translate.py,sha256=nYB62DLoPf7Weg26aNtpoEpyasDIsArVTzl5xKPp6eI,972
9
- dwani/vision.py,sha256=JtMSS0hI-8gxtLugVP10__enZsPPy8jheMyWXvrGrdw,1015
10
- dwani-0.1.5.dist-info/licenses/LICENSE,sha256=IAD8tbwWZbPWHXgYjabHoMv0aaUzZUYzYiEbfhTCisY,1070
11
- dwani-0.1.5.dist-info/METADATA,sha256=qxXqLp_wZG_eoGD29p1HdVZFjfpG4ExxJ1xDeyb6O7U,3118
12
- dwani-0.1.5.dist-info/WHEEL,sha256=DnLRTWE75wApRYVsjgc6wsVswC54sMSJhAEd4xhDpBk,91
13
- dwani-0.1.5.dist-info/top_level.txt,sha256=AM5EhkyuO_EXQFR9JIxEV6tAYMCCyc-a1dLifpCGBUk,6
14
- dwani-0.1.5.dist-info/RECORD,,