PyPI - skrutable - Versions diffs - 2.1.3__tar.gz → 2.2.0__tar.gz - Mend

skrutable 2.1.3 (tar.gz) → 2.2.0 (tar.gz)

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (29) hide show

{skrutable-2.1.3 → skrutable-2.2.0}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.1
 Name: skrutable
-Version: 2.1.3
+Version: 2.2.0
 Summary: skrutable library for working with Sanskrit text
 Home-page: https://github.com/tylergneill/skrutable
 Author: Tyler Neill

skrutable-2.2.0/src/skrutable/__init__.py ADDED Viewed

	@@ -0,0 +1 @@
1	+ __version__ = "2.2.0"

{skrutable-2.1.3 → skrutable-2.2.0}/src/skrutable/config.json RENAMED Viewed

@@ -12,7 +12,11 @@
 	"max score" : 9,
 	"anuṣṭubh, full, both halves perfect)" : 9,
 	"anuṣṭubh, full, one half perfect, one imperfect)" : 7,
+	"anuṣṭubh, full, both halves imperfect)": 5,
+	"anuṣṭubh, full, one half perfect, one length error)": 6,
+	"anuṣṭubh, full, one half imperfect, one length error)": 4,
 	"anuṣṭubh, half, single half perfect)" : 9,
+	"anuṣṭubh, half, single half imperfect)": 5,
 	"samavṛtta, perfect" : 9,
 	"samavṛtta, imperfect (3)" : 6,
 	"samavṛtta, imperfect (2)" : 5,
@@ -22,7 +26,7 @@
 	"viṣamavṛtta, perfect" : 9,
 	"upajāti, perfect" : 7,
 	"upajāti, imperfect" : 6,
-	"upajāti, non-triṣṭubh, perfect" : 5,
+	"upajāti, non-triṣṭubh, perfect" : 4.5,
 	"upajāti, triṣṭubh-jagatī-saṃkara, perfect" : 4,
 	"upajāti, non-triṣṭubh, imperfect" : 3,
 	"jāti, perfect" : 8,

{skrutable-2.1.3 → skrutable-2.2.0}/src/skrutable/meter_identification.py RENAMED Viewed

@@ -3,6 +3,8 @@ from skrutable import meter_patterns
 from skrutable.config import load_config_dict_from_json_file
 import re
 from copy import copy
+from dataclasses import dataclass, field
+from typing import Optional
 # load config variables
 config = load_config_dict_from_json_file()
@@ -12,6 +14,24 @@ default_resplit_keep_midpoint = config["default_resplit_keep_midpoint"]  # e.g.
 disable_non_trizwuB_upajAti = config["disable_non_trizwuB_upajAti"]  # e.g. True
 meter_scores = config["meter_scores"]  # dict
+@dataclass
+class Diagnostic:
+	perfect_id_label: Optional[str] = None      # 'pathyā', 'ma-vipulā', etc.; None if imperfect
+	imperfect_id_label: Optional[str] = None    # 'asamīcīnā ma-vipulā', etc.; None if perfect or unidentified
+	failure_code: Optional[str] = None           # short internal code, e.g. 'hahn_general_2'; None if perfect
+	problem_syllables: dict = field(default_factory=lambda: {'odd': [], 'even': []})
+	def perfect(self):
+		return self.perfect_id_label is not None
+	def imperfect(self):
+		return self.imperfect_id_label is not None
+	def length_error(self):
+		return self.failure_code in ('hypermetric', 'hypometric')
 class VerseTester(object):
 	"""
 	Internal agent-style object.
@@ -29,6 +49,7 @@ class VerseTester(object):
 		self.resplit_option = default_resplit_option # string
 		self.resplit_keep_midpoint = default_resplit_keep_midpoint # bool
 		self.identification_attempt_count = 0
+		self._anuzwuB_half_cache = {}  # cleared per wiggle_identify run
 	def combine_results(self, Vrs, new_label, new_score):
 		old_label = Vrs.meter_label or ''
@@ -55,24 +76,55 @@ class VerseTester(object):
 		"""
 		Accepts two strings of syllable weights (e.g. 'llglgllg').
 		Tries to match to known odd-even 'anuṣṭubh' foot pairings:
-				pathya
+				pathyā
 				vipulā (4.5 subtypes: na, ra, ma, bha, and variant bha).
-		Returns string result if match found, None otherwise.
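+		Returns a Diagnostic: perfect_id_label set on a match; otherwise failure_code set (plus imperfect_id_label unless it is a length error). Returns None only if both pādas have the wrong length.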
 		"""
-		# check even pāda
-		regex = re.compile(meter_patterns.anuzwuB_pAda['even'])
-		if not re.match(regex, even_pAda_weights):
-			return None
-		# check odd pāda (both 'paTyA' and 'vipulA')
-		for weights_pattern in meter_patterns.anuzwuB_pAda['odd'].keys():
-			regex = re.compile(weights_pattern)
-			if re.match(regex, odd_pAda_weights):
-				return meter_patterns.anuzwuB_pAda['odd'][weights_pattern]
+		cache_key = (odd_pAda_weights, even_pAda_weights)
+		if cache_key in self._anuzwuB_half_cache:
+			return self._anuzwuB_half_cache[cache_key]
+		# check lengths first; length_error only reported when exactly one pāda is off
+		even_len_ok = len(even_pAda_weights) == 8
+		odd_len_ok = len(odd_pAda_weights) == 8
+		if not even_len_ok and not odd_len_ok:
+			result = None  # both wrong: bad split, not credible
+		elif not even_len_ok:
+			code = 'hypermetric' if len(even_pAda_weights) > 8 else 'hypometric'
+			result = Diagnostic(failure_code=code, problem_syllables={'odd': [], 'even': list(range(len(even_pAda_weights)))})
+		elif not odd_len_ok:
+			code = 'hypermetric' if len(odd_pAda_weights) > 8 else 'hypometric'
+			result = Diagnostic(failure_code=code, problem_syllables={'odd': list(range(len(odd_pAda_weights))), 'even': []})
 		else:
-			return None
+			# check even pāda
+			if not re.match(meter_patterns.anuzwuB_pAda['even'], even_pAda_weights):
+				result = None
+				for weights_pattern, (label, problem_syls, code) in meter_patterns.anuzwuB_pAda_asamIcIna['even'].items():
+					if re.match(weights_pattern, even_pAda_weights):
+						result = Diagnostic(imperfect_id_label=label, failure_code=code, problem_syllables={'odd': [], 'even': problem_syls})
+						break
+				if result is None:
+					result = Diagnostic(imperfect_id_label='asamīcīnā, [caturthāt] pathyā yujo j', failure_code='hahn_general_4', problem_syllables={'odd': [], 'even': [4, 5, 6]})
+			else:
+				# check odd pāda (both 'paTyA' and 'vipulA')
+				result = None
+				for weights_pattern, label in meter_patterns.anuzwuB_pAda['odd'].items():
+					if re.match(weights_pattern, odd_pAda_weights):
+						result = Diagnostic(perfect_id_label=label)
+						break
+				if result is None:
+					# check for broken conditioning on odd pāda
+					for weights_pattern, (label, problem_syls, code) in meter_patterns.anuzwuB_pAda_asamIcIna['odd'].items():
+						if re.match(weights_pattern, odd_pAda_weights):
+							result = Diagnostic(imperfect_id_label=label, failure_code=code, problem_syllables={'odd': problem_syls, 'even': []})
+							break
+				if result is None:
+					result = Diagnostic(imperfect_id_label='asamīcīnā, [vipulāyām asatyām] ya[gaṇaḥ] [ayujo] caturthāt [syāt]', failure_code='hahn_paTyA', problem_syllables={'odd': [4, 5, 6], 'even': []})
+		self._anuzwuB_half_cache[cache_key] = result
+		return result
 	def test_as_anuzwuB(self, Vrs):
 	# >> def test_as_zloka(self, Vrs):
@@ -81,52 +133,99 @@ class VerseTester(object):
 		Determines whether first four lines of Verse's syllable_weights is anuṣṭubh.
 		Internally sets Verse parameters if identified as such.
 		Tests halves ab and cd independently, reports if either half found to be valid.
-		Returns 1 if anuṣṭubh, or 0 if not.
+		Returns Diagnostic if anuṣṭubh, or None if not.
 		"""
 		w_p = Vrs.syllable_weights.split('\n')  # weights by pāda
 		# make sure full four pādas
 		try: w_p[3]
-		except IndexError: return 0
+		except IndexError: return None
 		# test each half
-		pAdas_ab = self.test_as_anuzwuB_half(w_p[0], w_p[1])
-		pAdas_cd = self.test_as_anuzwuB_half(w_p[2], w_p[3])
+		pAdas_ab_result = self.test_as_anuzwuB_half(w_p[0], w_p[1])
+		pAdas_cd_result = self.test_as_anuzwuB_half(w_p[2], w_p[3])
+		if pAdas_ab_result is None and pAdas_cd_result is None:
+			ardham_eva_result = self.test_as_anuzwuB_half(w_p[0] + w_p[1], w_p[2] + w_p[3])
+			if ardham_eva_result is None:
+				return None
+			if ardham_eva_result.perfect():
+				Vrs.meter_label = f"anuṣṭubh (ardham eva: {ardham_eva_result.perfect_id_label})"
+				Vrs.identification_score = meter_scores["anuṣṭubh, half, single half perfect)"]
+				Vrs.diagnostic = ardham_eva_result
+				return ardham_eva_result
+			elif ardham_eva_result.imperfect():
+				Vrs.meter_label = f"anuṣṭubh (ardham eva: {ardham_eva_result.imperfect_id_label})"
+				Vrs.identification_score = meter_scores["anuṣṭubh, half, single half imperfect)"]
+				Vrs.diagnostic = ardham_eva_result
+				return ardham_eva_result
+			else:
+				return None
-		# report results
+		if pAdas_ab_result is None or pAdas_cd_result is None:
+			return None
 		# both halves perfect
-		if pAdas_ab != None and pAdas_cd != None:
-			Vrs.meter_label = "anuṣṭubh (1,2: " + pAdas_ab + ", 3,4: " + pAdas_cd + ")"
+		if pAdas_ab_result.perfect() and pAdas_cd_result.perfect():
+			Vrs.meter_label = f"anuṣṭubh (1,2: {pAdas_ab_result.perfect_id_label}; 3,4: {pAdas_cd_result.perfect_id_label})"
 			Vrs.identification_score = meter_scores["anuṣṭubh, full, both halves perfect)"]
-			return 1
+			Vrs.diagnostic = {'ab': pAdas_ab_result, 'cd': pAdas_cd_result}
+			return pAdas_ab_result
 		# one half imperfect
-		elif pAdas_ab == None and pAdas_cd != None:
-			Vrs.meter_label = "anuṣṭubh (1,2: asamīcīna, 3,4: " + pAdas_cd + ")"
+		elif pAdas_ab_result.imperfect() and pAdas_cd_result.perfect():
+			Vrs.meter_label = f"anuṣṭubh (1,2: {pAdas_ab_result.imperfect_id_label}; 3,4: {pAdas_cd_result.perfect_id_label})"
 			Vrs.identification_score = meter_scores["anuṣṭubh, full, one half perfect, one imperfect)"]
-			return 1
-		elif pAdas_ab != None and pAdas_cd == None:
-			Vrs.meter_label = "anuṣṭubh (1,2: " + pAdas_ab + ", 3,4: asamīcīna)"
+			Vrs.diagnostic = {'ab': pAdas_ab_result, 'cd': pAdas_cd_result}
+			return pAdas_ab_result
+		elif pAdas_ab_result.perfect() and pAdas_cd_result.imperfect():
+			Vrs.meter_label = f"anuṣṭubh (1,2: {pAdas_ab_result.perfect_id_label}; 3,4: {pAdas_cd_result.imperfect_id_label})"
 			Vrs.identification_score = meter_scores["anuṣṭubh, full, one half perfect, one imperfect)"]
-			return 1
-		# currently cannot do both halves imperfect
-		# also test whether just a single perfect half
-		pAdas_ab = self.test_as_anuzwuB_half(w_p[0]+w_p[1], w_p[2]+w_p[3])
-		if pAdas_ab != None:
-			Vrs.meter_label = "anuṣṭubh (ardham eva: " + pAdas_ab + ")"
-			Vrs.identification_score = meter_scores["anuṣṭubh, half, single half perfect)"]
-			return 1
-		# currently cannot do just a single imperfect half
-		return 0
+			Vrs.diagnostic = {'ab': pAdas_ab_result, 'cd': pAdas_cd_result}
+			return pAdas_cd_result
+		# both halves imperfect
+		elif pAdas_ab_result.imperfect() and pAdas_cd_result.imperfect():
+			Vrs.meter_label = f"anuṣṭubh (1,2: {pAdas_ab_result.imperfect_id_label}; 3,4: {pAdas_cd_result.imperfect_id_label})"
+			Vrs.identification_score = meter_scores["anuṣṭubh, full, both halves imperfect)"]
+			Vrs.diagnostic = {'ab': pAdas_ab_result, 'cd': pAdas_cd_result}
+			return pAdas_ab_result
+		# one half perfect, one length error
+		elif pAdas_ab_result.length_error() and pAdas_cd_result.perfect():
+			code = pAdas_ab_result.failure_code
+			Vrs.meter_label = f"anuṣṭubh (1,2: ?? {code}; 3,4: {pAdas_cd_result.perfect_id_label})"
+			Vrs.identification_score = meter_scores["anuṣṭubh, full, one half perfect, one length error)"]
+			Vrs.diagnostic = {'ab': pAdas_ab_result, 'cd': pAdas_cd_result}
+			return pAdas_cd_result
+		elif pAdas_ab_result.perfect() and pAdas_cd_result.length_error():
+			code = pAdas_cd_result.failure_code
+			Vrs.meter_label = f"anuṣṭubh (1,2: {pAdas_ab_result.perfect_id_label}; 3,4: ?? {code})"
+			Vrs.identification_score = meter_scores["anuṣṭubh, full, one half perfect, one length error)"]
+			Vrs.diagnostic = {'ab': pAdas_ab_result, 'cd': pAdas_cd_result}
+			return pAdas_ab_result
+		# one half imperfect, one length error
+		elif pAdas_ab_result.length_error() and pAdas_cd_result.imperfect():
+			code = pAdas_ab_result.failure_code
+			Vrs.meter_label = f"anuṣṭubh (1,2: ?? {code}; 3,4: {pAdas_cd_result.imperfect_id_label})"
+			Vrs.identification_score = meter_scores["anuṣṭubh, full, one half imperfect, one length error)"]
+			Vrs.diagnostic = {'ab': pAdas_ab_result, 'cd': pAdas_cd_result}
+			return pAdas_cd_result
+		elif pAdas_ab_result.imperfect() and pAdas_cd_result.length_error():
+			code = pAdas_cd_result.failure_code
+			Vrs.meter_label = f"anuṣṭubh (1,2: {pAdas_ab_result.imperfect_id_label}; 3,4: ?? {code})"
+			Vrs.identification_score = meter_scores["anuṣṭubh, full, one half imperfect, one length error)"]
+			Vrs.diagnostic = {'ab': pAdas_ab_result, 'cd': pAdas_cd_result}
+			return pAdas_ab_result
+		return None
 	def count_pAdasamatva(self, Vrs):
 		"""
@@ -540,8 +639,8 @@ class VerseTester(object):
 		# anuzwuB
-		success_anuzwuB = self.test_as_anuzwuB(Vrs) # 1 if successful, 0 if not
-		if success_anuzwuB and Vrs.identification_score == meter_scores["max score"]:
+		anuzwuB_diagnostic = self.test_as_anuzwuB(Vrs) # Diagnostic if successful, None if not
+		if anuzwuB_diagnostic and Vrs.identification_score == meter_scores["max score"]:
 			return 1
 		# samavftta, upajAti, vizamavftta, ardhasamavftta
@@ -557,7 +656,7 @@ class VerseTester(object):
 		success_jAti = self.test_as_jAti(Vrs)
-		if success_anuzwuB or success_samavftta_etc or success_jAti:
+		if anuzwuB_diagnostic or success_samavftta_etc or success_jAti:
 			return 1
 		else:
 			return 0
@@ -613,6 +712,7 @@ class MeterIdentifier(object):
 							pAda_brs, quarter_len):
 		"""Returns a list for MeterIdentifier.Verses_found"""
+		self._anuzwuB_half_cache = {}
 		pos_iterators = {}
 		for k in ['ab', 'bc', 'cd']:
 			if  (

{skrutable-2.1.3 → skrutable-2.2.0}/src/skrutable/meter_patterns.py RENAMED Viewed

@@ -47,6 +47,20 @@ anuzwuB_pAda = {
 	}
 }
+anuzwuB_pAda_asamIcIna = {
+	'odd' : {
+		'^.ll.{5}$' :   ('asamīcīnā, na prathamāt snau',              [1, 2],    'hahn_general_2'),  # syllables 2–3 both light
+		'^.{4}ggg.$' :  ('asamīcīnā, ma-vipulāyāḥ paścād raḥ syāt',  [1, 2, 3], 'hahn_vipulA_3'),   # ma-vipulā conditioning violated
+		'^.{4}gll.$' :  ('asamīcīnā, bha-vipulāyāḥ paścād raḥ syāt', [1, 2, 3], 'hahn_vipulA_2'),   # bha-vipulā conditioning violated
+		'^.{3}llll.$' : ('asamīcīnā, na-vipulāyāḥ paścād guruḥ syāt', [3],       'hahn_vipulA_1'),   # na-vipulā conditioning violated
+		'^.{3}lglg.$' : ('asamīcīnā, ra-vipulāyāḥ paścād guruḥ syāt', [3],       'hahn_vipulA_4'),   # ra-vipulā conditioning violated
+	},
+	'even' : {
+		'^.ll.{5}$' :   ('asamīcīnā, na prathamāt snau',         [1, 2],    'hahn_general_2'),  # syllables 2–3 both light
+		'^.glg.{4}$' :  ('asamīcīnā, [na] dvitīyacaturthayo raḥ', [1, 2, 3], 'hahn_general_3'),  # ra-gaṇa at syllables 2–4
+	},
+}
 """
 	samavṛtta

{skrutable-2.1.3 → skrutable-2.2.0}/src/skrutable/scansion.py RENAMED Viewed

@@ -34,6 +34,7 @@ class Verse(object):
 		self.gaRa_abbreviations = None	# string, may contain newlines
 		self.meter_label = None			# string
 		self.identification_score = 0 	# int
+		self.diagnostic = None			# Diagnostic or dict of Diagnostics, set by meter_identification
 	def summarize(self,
 		show_weights=True, show_morae=True, show_gaRas=True, # part_A

{skrutable-2.1.3 → skrutable-2.2.0}/src/skrutable.egg-info/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.1
 Name: skrutable
-Version: 2.1.3
+Version: 2.2.0
 Summary: skrutable library for working with Sanskrit text
 Home-page: https://github.com/tylergneill/skrutable
 Author: Tyler Neill

skrutable-2.1.3/src/skrutable/__init__.py DELETED Viewed

	@@ -1 +0,0 @@
1	- __version__ = "2.1.3"

{skrutable-2.1.3 → skrutable-2.2.0}/LICENSE.md RENAMED Viewed

File without changes

{skrutable-2.1.3 → skrutable-2.2.0}/README.md RENAMED Viewed

File without changes

{skrutable-2.1.3 → skrutable-2.2.0}/setup.cfg RENAMED Viewed

File without changes

{skrutable-2.1.3 → skrutable-2.2.0}/setup.py RENAMED Viewed

File without changes

{skrutable-2.1.3 → skrutable-2.2.0}/src/skrutable/config.py RENAMED Viewed

File without changes

{skrutable-2.1.3 → skrutable-2.2.0}/src/skrutable/generate_scheme_vectors.py RENAMED Viewed

File without changes

{skrutable-2.1.3 → skrutable-2.2.0}/src/skrutable/impossible_bigrams.json RENAMED Viewed

File without changes

{skrutable-2.1.3 → skrutable-2.2.0}/src/skrutable/manual.md RENAMED Viewed

File without changes

{skrutable-2.1.3 → skrutable-2.2.0}/src/skrutable/phonemes.py RENAMED Viewed

File without changes

{skrutable-2.1.3 → skrutable-2.2.0}/src/skrutable/run_examples.py RENAMED Viewed

File without changes

{skrutable-2.1.3 → skrutable-2.2.0}/src/skrutable/scheme_detection.py RENAMED Viewed

File without changes

{skrutable-2.1.3 → skrutable-2.2.0}/src/skrutable/scheme_maps.py RENAMED Viewed

File without changes

{skrutable-2.1.3 → skrutable-2.2.0}/src/skrutable/scheme_vectors.json RENAMED Viewed

File without changes

{skrutable-2.1.3 → skrutable-2.2.0}/src/skrutable/scheme_vectors_mbh.py RENAMED Viewed

File without changes

{skrutable-2.1.3 → skrutable-2.2.0}/src/skrutable/splitting.py RENAMED Viewed

File without changes

{skrutable-2.1.3 → skrutable-2.2.0}/src/skrutable/transliteration.py RENAMED Viewed

File without changes

{skrutable-2.1.3 → skrutable-2.2.0}/src/skrutable/virAma_avoidance.py RENAMED Viewed

File without changes

{skrutable-2.1.3 → skrutable-2.2.0}/src/skrutable.egg-info/SOURCES.txt RENAMED Viewed

File without changes

{skrutable-2.1.3 → skrutable-2.2.0}/src/skrutable.egg-info/dependency_links.txt RENAMED Viewed

File without changes

{skrutable-2.1.3 → skrutable-2.2.0}/src/skrutable.egg-info/requires.txt RENAMED Viewed

File without changes

{skrutable-2.1.3 → skrutable-2.2.0}/src/skrutable.egg-info/top_level.txt RENAMED Viewed

File without changes

skrutable 2.1.3__tar.gz → 2.2.0__tar.gz

skrutable 2.1.3 (tar.gz) → 2.2.0 (tar.gz)