Open-AutoTools 0.0.2.post2__py3-none-any.whl → 0.0.3rc1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -0,0 +1,46 @@
1
+ import pytest
2
+ from click.testing import CliRunner
3
+ from autotools.cli import autolower
4
+
5
+ # INTEGRATION TESTS
6
+
7
+ # TEST FOR BASIC CLI FUNCTIONALITY
8
def test_autolower_cli_basic():
    """CHECK THAT AN UPPERCASE ARGUMENT COMES BACK LOWERCASED"""
    # INVOKE THE COMMAND IN-PROCESS THROUGH CLICK'S TEST RUNNER
    outcome = CliRunner().invoke(autolower, ["HELLO WORLD"])

    # THE COMMAND MUST SUCCEED AND PRINT THE LOWERCASED TEXT
    assert outcome.exit_code == 0
    assert "hello world" in outcome.output
14
+
15
+ # TEST FOR EMPTY INPUT
16
def test_autolower_cli_empty():
    """CHECK THAT AN EMPTY STRING ARGUMENT DOES NOT MAKE THE CLI FAIL"""
    cli_args = [""]
    outcome = CliRunner().invoke(autolower, cli_args)

    assert outcome.exit_code == 0
    # NOTE(review): "" IS A SUBSTRING OF EVERY STRING, SO THIS ASSERTION CAN
    # NEVER FAIL; ONLY THE EXIT CODE ABOVE IS ACTUALLY VERIFIED HERE.
    assert "" in outcome.output
22
+
23
+ # TEST FOR SPECIAL CHARACTERS
24
def test_autolower_cli_special_chars():
    """CHECK THAT PUNCTUATION SUCH AS '@' AND '.' SURVIVES LOWERCASING"""
    raw_text = "HELLO@WORLD.COM"
    cli = CliRunner()

    outcome = cli.invoke(autolower, [raw_text])

    # SUCCESSFUL EXIT, LETTERS LOWERCASED, SPECIAL CHARACTERS UNTOUCHED
    assert outcome.exit_code == 0
    assert "hello@world.com" in outcome.output
30
+
31
+ # TEST FOR UNICODE CHARACTERS
32
def test_autolower_cli_unicode():
    """CHECK THAT ACCENTED (NON-ASCII) LETTERS ARE LOWERCASED TOO"""
    cli = CliRunner()
    outcome = cli.invoke(autolower, ["HÉLLO WÖRLD"])

    exit_ok = outcome.exit_code == 0
    assert exit_ok
    # É -> é AND Ö -> ö MUST APPEAR IN THE PRINTED RESULT
    assert "héllo wörld" in outcome.output
38
+
39
+ # TEST FOR MULTIPLE ARGUMENTS
40
def test_autolower_cli_multiple_args():
    """CHECK THE CLI WHEN TWO POSITIONAL ARGUMENTS ARE SUPPLIED"""
    cli_args = ["HELLO", "WORLD"]
    outcome = CliRunner().invoke(autolower, cli_args)

    assert outcome.exit_code == 0
    # ONLY THE FIRST ARGUMENT IS EXPECTED TO BE PROCESSED
    assert "hello" in outcome.output
@@ -0,0 +1,3 @@
1
+ from .core import SpellChecker
2
+
3
+ __all__ = ['SpellChecker']
@@ -0,0 +1,222 @@
1
+ import language_tool_python
2
+ import spacy
3
+ from typing import List, Dict, Optional
4
+ import pyperclip
5
+ import requests
6
+ from langdetect import detect, detect_langs
7
+
8
class SpellChecker:
    """SPELLING AND GRAMMAR CHECKER BUILT ON LANGUAGETOOL

    Holds one ``language_tool_python.LanguageTool`` instance (``self.tool``)
    and a per-language cache of spaCy pipelines (``self.nlp_models``).
    """

    # TIMEOUT (SECONDS) FOR THE PUBLIC LANGUAGETOOL API REQUEST, SO A STALLED
    # CONNECTION CANNOT BLOCK THE CALLER FOREVER
    _API_TIMEOUT = 10

    def __init__(self):
        """CREATE THE LANGUAGETOOL INSTANCE AND AN EMPTY SPACY MODEL CACHE"""
        # INITIALIZE LANGUAGE TOOL
        self.tool = language_tool_python.LanguageTool('auto')

        # CACHE FOR SPACY MODELS (KEYED BY LANGUAGE CODE)
        self.nlp_models = {}

    # LOAD SPACY MODEL FOR GIVEN LANGUAGE
    def _load_spacy_model(self, lang_code: str) -> Optional["spacy.language.Language"]:
        """LOAD SPACY MODEL FOR GIVEN LANGUAGE

        ARGS:
            lang_code: Language code used as the prefix of spaCy model names

        RETURNS:
            The cached or newly loaded pipeline, or None if loading failed.
            When no installed model name starts with ``lang_code`` a blank
            pipeline is created instead.
        """
        # NOTE: THE RETURN ANNOTATION IS A STRING SO IT IS NOT EVALUATED WHEN
        # THE CLASS BODY IS EXECUTED
        try:
            if lang_code not in self.nlp_models:
                # GET ALL INSTALLED MODELS FOR THIS LANGUAGE
                available_models = [
                    model for model in spacy.util.get_installed_models()
                    if model.startswith(lang_code)
                ]

                if not available_models:
                    # TRY TO CREATE A BLANK MODEL IF NO TRAINED MODELS
                    self.nlp_models[lang_code] = spacy.blank(lang_code)
                else:
                    # USE MOST COMPREHENSIVE MODEL: SUFFIXES ARE TRIED IN
                    # ORDER 'trf', 'lg', 'md', 'sm'; IF NONE MATCHES, FALL
                    # BACK TO THE FIRST AVAILABLE MODEL
                    preferred_model = next(
                        (
                            model
                            for suffix in ('trf', 'lg', 'md', 'sm')
                            for model in available_models
                            if model.endswith(suffix)
                        ),
                        available_models[0],
                    )
                    self.nlp_models[lang_code] = spacy.load(preferred_model)

            return self.nlp_models.get(lang_code)  # RETURN LOADED MODEL
        except Exception:
            # BEST EFFORT: ANY LOADING PROBLEM MEANS "NO MODEL"
            return None

    # CHECK TEXT FOR SPELLING AND GRAMMAR ERRORS
    def check_text(self, text: str, lang: str = 'auto') -> Dict:
        """CHECK TEXT FOR SPELLING AND GRAMMAR ERRORS

        ARGS:
            text: Text to check
            lang: Language code (auto for automatic detection)

        RETURNS:
            Dict with keys 'corrections' (one dict per match), 'statistics'
            (see ``_get_detailed_stats``) and 'language' ('code', 'name',
            'confidence'). Confidence is 1.0 for an explicit language and 0
            when automatic detection fails.
        """
        # DETECT LANGUAGE CONFIDENCE
        if lang == 'auto':
            try:
                lang_scores = detect_langs(text)
                lang = lang_scores[0].lang
                confidence = lang_scores[0].prob
            except Exception:
                # DETECTION FAILED: KEEP 'auto' AND REPORT ZERO CONFIDENCE
                confidence = 0
        else:
            confidence = 1.0

        # SET LANGUAGE (SKIPPED WHEN DETECTION FAILED AND lang IS STILL 'auto')
        if lang != 'auto':
            self.tool.language = lang

        # PREPARE CORRECTIONS WITH SEVERITY LEVELS
        corrections = [
            {
                'message': match.message,
                'context': match.context,
                'offset': match.offset,
                'length': match.errorLength,
                'category': match.category,
                'rule_id': match.ruleId,
                'replacements': match.replacements,
                'severity': self._get_error_severity(match),
            }
            for match in self.tool.check(text)
        ]

        return {
            'corrections': corrections,
            'statistics': self._get_detailed_stats(corrections),
            'language': {
                'code': lang,
                'name': lang.upper(),
                'confidence': confidence
            }
        }

    # DETERMINE ERROR SEVERITY LEVEL
    def _get_error_severity(self, match) -> str:
        """DETERMINE ERROR SEVERITY LEVEL

        RETURNS:
            'high' if the rule id contains 'TYPO' or 'SPELLING', 'medium' if
            it contains 'GRAMMAR', otherwise 'low'.
        """
        rule_id = match.ruleId
        if 'TYPO' in rule_id or 'SPELLING' in rule_id:
            return 'high'
        if 'GRAMMAR' in rule_id:
            return 'medium'
        return 'low'

    # GET DETAILED ERROR STATISTICS
    def _get_detailed_stats(self, corrections: List[Dict]) -> Dict:
        """GET DETAILED ERROR STATISTICS

        ARGS:
            corrections: Correction dicts carrying 'category' and 'severity'

        RETURNS:
            Dict with 'total_errors', per-category counts under 'categories'
            and per-level counts under 'severity' ('high'/'medium'/'low').
        """
        stats = {
            'total_errors': len(corrections),
            'categories': {},
            'severity': {
                'high': 0,
                'medium': 0,
                'low': 0
            }
        }

        # COUNT ERRORS BY CATEGORY AND SEVERITY
        for corr in corrections:
            cat = corr['category']
            stats['categories'][cat] = stats['categories'].get(cat, 0) + 1
            stats['severity'][corr['severity']] += 1

        return stats

    # DECIDE WHETHER A MATCH IS EXCLUDED BY THE USER'S IGNORE LIST
    @staticmethod
    def _is_ignored(match, ignore) -> bool:
        """RETURN TRUE IF ANY IGNORE TOKEN OCCURS IN THE MATCH'S RULE ID

        The comparison is case-insensitive on both sides.
        """
        if not ignore:
            return False
        rule_id = match.ruleId.lower()
        return any(token.lower() in rule_id for token in ignore)

    # APPLY THE FIRST SUGGESTION OF EACH MATCH
    @staticmethod
    def _apply_first_suggestions(text: str, matches) -> str:
        """REPLACE EACH MATCHED SPAN WITH ITS FIRST SUGGESTED REPLACEMENT

        Matches without replacements are left untouched.
        """
        # ASSUMES MATCHES ARE ORDERED BY OFFSET AND DO NOT OVERLAP - TODO CONFIRM
        corrected = text
        shift = 0  # LENGTH DIFFERENCE INTRODUCED BY EARLIER REPLACEMENTS
        for match in matches:
            if not match.replacements:
                continue
            replacement = match.replacements[0]
            start = match.offset + shift
            corrected = corrected[:start] + replacement + corrected[start + match.errorLength:]
            shift += len(replacement) - match.errorLength
        return corrected

    # ASK THE USER ABOUT EACH CORRECTION
    def _fix_interactively(self, text: str, ignore) -> str:
        """PROMPT ON STDIN FOR EVERY NON-IGNORED MATCH AND APPLY THE CHOSEN FIX"""
        corrected = text
        # MATCH OFFSETS REFER TO THE ORIGINAL TEXT, SO TRACK HOW MUCH EARLIER
        # REPLACEMENTS HAVE MOVED THE REMAINING TEXT
        # ASSUMES MATCHES ARE ORDERED BY OFFSET AND DO NOT OVERLAP - TODO CONFIRM
        shift = 0

        for match in self.tool.check(text):
            if self._is_ignored(match, ignore):
                continue

            print(f"\nError: {match.message}")
            print(f"Context: {match.context}")
            suggestions = match.replacements[:3]
            if suggestions:
                print("Suggestions:")
                for i, sugg in enumerate(suggestions, 1):
                    print(f"{i}. {sugg}")

            # ASK FOR EACH CORRECTION
            choice = input("\nApply correction? (1-3/n): ").strip().lower()
            # isdecimal() (NOT isdigit()) SO THAT int() CANNOT RAISE ON
            # CHARACTERS LIKE SUPERSCRIPT DIGITS
            if choice.isdecimal() and 1 <= int(choice) <= len(suggestions):
                replacement = suggestions[int(choice) - 1]
                start = match.offset + shift
                corrected = corrected[:start] + replacement + corrected[start + match.errorLength:]
                shift += len(replacement) - match.errorLength

        return corrected

    # FIX TEXT AUTOMATICALLY
    def fix_text(self, text: str, lang: str = 'auto', copy_to_clipboard: bool = False,
                 ignore: Optional[List[str]] = None, interactive: bool = False) -> str:
        """FIX TEXT AUTOMATICALLY

        ARGS:
            text: Text to correct
            lang: Language code; anything other than 'auto' is set on the tool
            copy_to_clipboard: Copy the corrected text to the clipboard
            ignore: Substrings of rule ids whose matches must not be applied
                (honoured in both interactive and automatic mode)
            interactive: Ask on stdin which suggestion to apply for each match

        RETURNS:
            The corrected text
        """
        if lang != 'auto':
            self.tool.language = lang

        if interactive:
            corrected = self._fix_interactively(text, ignore)
        elif ignore:
            # AUTO-FIX, BUT LEAVE OUT THE RULES THE CALLER ASKED TO IGNORE
            kept = [
                match for match in self.tool.check(text)
                if not self._is_ignored(match, ignore)
            ]
            corrected = self._apply_first_suggestions(text, kept)
        else:
            # NORMAL AUTO-FIX
            corrected = self.tool.correct(text)

        # COPY TO CLIPBOARD IF REQUESTED
        if copy_to_clipboard:
            pyperclip.copy(corrected)

        return corrected

    # GET LIST OF SUPPORTED LANGUAGES
    def get_supported_languages(self) -> List[Dict]:
        """GET LIST OF SUPPORTED LANGUAGES

        Fetches the language list from the public LanguageTool API and keeps
        one entry per base code (the part of 'longCode' before '-') for which
        assigning the code to ``self.tool.language`` does not raise. The
        tool's language is restored afterwards.

        RETURNS:
            List of dicts with 'code', 'name' and 'variants'. If the API call
            or its processing fails, a single entry for the tool's current
            language is returned, or an empty list if that cannot be read.
        """
        # REMEMBER THE CURRENT LANGUAGE: THE PROBING BELOW OVERWRITES IT
        try:
            original_lang = str(self.tool.language)
        except Exception:
            original_lang = None

        try:
            # GET LANGUAGES FROM LANGUAGE TOOL PUBLIC API
            response = requests.get(
                'https://api.languagetool.org/v2/languages',
                timeout=self._API_TIMEOUT,
            )
            response.raise_for_status()
            languages = response.json()

            # FORMAT LANGUAGES INTO REQUIRED STRUCTURE
            formatted_langs = []
            seen_codes = set()

            for lang in languages:
                code = lang['longCode'].split('-')[0]

                # SKIP DUPLICATES
                if code in seen_codes:
                    continue

                # TEST IF LANGUAGE IS ACTUALLY SUPPORTED BY LOCAL TOOL
                try:
                    self.tool.language = code
                    formatted_langs.append({
                        'code': code,
                        'name': lang['name'],
                        'variants': [v['name'] for v in lang.get('variants', [])]
                    })
                    seen_codes.add(code)
                except Exception:
                    continue

            return formatted_langs

        except Exception:
            # IF API FAILS, REPORT ONLY THE LOCAL TOOL'S LANGUAGE
            if original_lang is None:
                return []
            return [{'code': original_lang, 'name': original_lang.upper(), 'variants': []}]

        finally:
            # PUT THE TOOL BACK ON THE LANGUAGE IT HAD BEFORE PROBING
            if original_lang is not None:
                try:
                    self.tool.language = original_lang
                except Exception:
                    # BEST EFFORT: A FAILED RESTORE MUST NOT MASK THE RESULT
                    pass
@@ -10,7 +10,7 @@ def get_supported_languages() -> dict:
10
10
  return dict(sorted(langs.items(), key=lambda x: x[1].lower()))
11
11
 
12
12
  def translate_text(text: str, to_lang: str = 'en', from_lang: str = None,
13
- copy: bool = False, detect_lang: bool = False) -> str:
13
+ copy: bool = False, detect_lang: bool = False, output: str = None) -> str:
14
14
  """TRANSLATE TEXT TO SPECIFIED LANGUAGE
15
15
 
16
16
  ARGS:
@@ -19,6 +19,7 @@ def translate_text(text: str, to_lang: str = 'en', from_lang: str = None,
19
19
  from_lang (str): SOURCE LANGUAGE CODE (DEFAULT: AUTO-DETECT)
20
20
  copy (bool): COPY RESULT TO CLIPBOARD
21
21
  detect_lang (bool): SHOW DETECTED SOURCE LANGUAGE
22
+ output (str): PATH TO SAVE TRANSLATION TO FILE
22
23
 
23
24
  RETURNS:
24
25
  str: TRANSLATED TEXT
@@ -34,6 +35,17 @@ def translate_text(text: str, to_lang: str = 'en', from_lang: str = None,
34
35
  if copy:
35
36
  pyperclip.copy(result)
36
37
 
38
+ # SAVE TO FILE IF OUTPUT PATH PROVIDED
39
+ if output:
40
+ try:
41
+ with open(output, 'w', encoding='utf-8') as f:
42
+ if detect_lang:
43
+ f.write(f"[Detected: {source_lang}] {result}")
44
+ else:
45
+ f.write(result)
46
+ except Exception as e:
47
+ print(f"\nError saving to file: {str(e)}")
48
+
37
49
  # RETURN RESULT WITH DETECTED LANGUAGE IF REQUESTED
38
50
  if detect_lang:
39
51
  return f"[Detected: {source_lang}] {result}"