RubyGems - text_alignment - Versions diffs - 0.12.0 → 0.12.2 - Mend

text_alignment 0.12.0 → 0.12.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (5)

checksums.yaml +4 -4
data/lib/text_alignment/char_mapping.rb +32 -7
data/lib/text_alignment/mixed_alignment.rb +1 -1
data/lib/text_alignment/version.rb +1 -1
metadata +2 -2

checksums.yaml CHANGED Viewed

@@ -1,7 +1,7 @@
 ---
 SHA256:
-  metadata.gz: fc90a3ea0092a4e2672fd40a3bf3e6bb25fba612fc663fc7c249741e79b7a990
-  data.tar.gz: 8676468d98902404d400b78711668930c9aaed268ddc1f555283b67fb731e2dd
+  metadata.gz: 3c2a36fe4cfde7dfb76f554fd4afcae7cb5a03e455887621217f5e5e633b20b3
+  data.tar.gz: f63070c6f423bc15d0fc8c742a21238a104a1b2c1d3fe56ac436effa8ef8eacf
 SHA512:
-  metadata.gz: 8194112635d7ffebe3983ae4393c05183ea86e3beab2efe645d512cb56c59f38187ab62d5d7bb7fb589ca20989a6763d42af0d881fdff4bb94be69954d9cb3c2
-  data.tar.gz: 2907241a5a589b2ab3bfee5e08ebf3c498af79f18ba3bd4d2ae3ef543681d251db2213f3d3dffe441aa39263136b7ea755fa4376fa46acc02af0beca379d2a5e
+  metadata.gz: '078a41bc6ab9b16e7747be6a3bb15aff4b23a1161bcea0b653a93f04d673799afcac2109cd1ce8d1a95c99c5c07d36842e3698c9f0997500e653fb4ab939e04a'
+  data.tar.gz: ce44d334779d43b3057317537f615ebf39b8049639d3e50c4e14272c952b76a5df2b060cfd3a15f1d28372c11a795ef8bf43cb04de32b5a78ce2f44433edddfb

data/lib/text_alignment/char_mapping.rb CHANGED Viewed

@@ -91,6 +91,9 @@ class TextAlignment::CharMapping
 			@method_squeeze_ws = method(:squeeze_ws_1!)
 		end
+		@text  = _text
+		# sort by the length of the spell-outs is important
 		char_mapping ||= TextAlignment::CHAR_MAPPING.sort{|a, b| b[1].length <=> a[1].length}
 		@mapped_text, offset_mapping = enmap_text(_text, char_mapping)
 		@index_enmap = offset_mapping.to_h
@@ -98,11 +101,11 @@ class TextAlignment::CharMapping
 	end
 	def enmap_position(position)
-		@index_enmap[position] || raise(ArgumentError, "Unusual position for annotation: #{position}")
+		@index_enmap[position] || raise(ArgumentError, "Unusual position of annotation: #{position}")
 	end
 	def demap_position(position)
-		@index_demap[position] || raise(ArgumentError, "Unusual position for annotation: #{position}")
+		@index_demap[position] || raise(ArgumentError, "Unusual position of annotation: #{position}")
 	end
 	def enmap_denotations(denotations)
@@ -110,6 +113,23 @@ class TextAlignment::CharMapping
 		denotations.map do |d|
 			d.dup.merge(span:{begin:enmap_position(d[:span][:begin]), end:enmap_position(d[:span][:end])})
+		rescue ArgumentError => e
+			snippet_begin = d[:span][:begin] - 5
+			if snippet_begin < 0
+				snippet_begin = 0
+			end
+			snippet_end = d[:span][:end] + 5
+			if snippet_end > @text.length
+				snippet_end = @text.length
+			end
+			snippet = @text[snippet_begin ... d[:span][:begin]] + '[' + @text[d[:span][:begin] ... d[:span][:end]] + ']' + @text[d[:span][:end] ... snippet_end]
+			if snippet_begin > 0
+				snippet = '...' + snippet
+			end
+			if snippet_end < @text.length
+				snippet = snippet + '...'
+			end
+			raise ArgumentError, e.message + " (#{snippet})"
 		end
 	end
@@ -118,7 +138,7 @@ class TextAlignment::CharMapping
 	def enmap_text(_text, char_mapping, no_ws = false)
 		text = _text.dup
-		# To execute the single letter mapping replacement
+		# To perform the single letter mapping replacement
 		char_mapping.each do |one, long|
 			text.gsub!(one, long) if long.length == 1
 		end
@@ -130,12 +150,16 @@ class TextAlignment::CharMapping
 			init_next = 0
 			while loc = text.index(long, init_next)
-				rpositions << [loc, long.length, 1]
+				# Huristics to check if the surrounding letters are sufficiently distinguished.
+				if long.length > 3 || ((text[loc - 1, 2] !~ /[a-z][a-z]/) && (text[loc + long.length - 1, 2] !~ /[a-z][a-z]/))
+				# if true
+					rpositions << [loc, long.length, 1]
+					# a workaround to avoid messing-up due to embedding
+					text[loc, long.length] = one * long.length
+				end
 				init_next = loc + long.length
 			end
-			# a workaround to avoid messing-up due to embedding
-			text.gsub!(long, one * long.length)
 		end
 		# To get the replacement positions, (position, old_length, new_length), for consecutive whitespaces
@@ -163,6 +187,7 @@ class TextAlignment::CharMapping
 		# To execute the long letter mapping
 		char_mapping.each do |one, long|
+			next unless text =~ /#{one}/
 			text.gsub!(one * long.length, one) if long.length > 1
 		end

data/lib/text_alignment/mixed_alignment.rb CHANGED Viewed

@@ -17,7 +17,7 @@ class TextAlignment::MixedAlignment
 	attr_reader :similarity
 	attr_reader :str1_match_initial, :str1_match_final, :str2_match_initial, :str2_match_final
-	def initialize(_str1, _str2, _mappings = nil)
+	def initialize(_str1, _str2, mappings = nil)
 		raise ArgumentError, "nil string" if _str1.nil? || _str2.nil?
 		mappings ||= TextAlignment::CHAR_MAPPING

data/lib/text_alignment/version.rb CHANGED Viewed

@@ -1,3 +1,3 @@
 class TextAlignment
-	VERSION = '0.12.0'
+	VERSION = '0.12.2'
 end

metadata CHANGED Viewed

@@ -1,14 +1,14 @@
 --- !ruby/object:Gem::Specification
 name: text_alignment
 version: !ruby/object:Gem::Version
-  version: 0.12.0
+  version: 0.12.2
 platform: ruby
 authors:
 - Jin-Dong Kim
 autorequire:
 bindir: bin
 cert_chain: []
-date: 2023-12-21 00:00:00.000000000 Z
+date: 2024-01-03 00:00:00.000000000 Z
 dependencies:
 - !ruby/object:Gem::Dependency
   name: ruby-dictionary