myers_diff 1.1.0 → 1.1.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  SHA256:
3
- metadata.gz: 38ecad0ebd0a04de796e852e6cfc77065daf0b0da1e6384beed39520b4279230
4
- data.tar.gz: 285e2e66e2e25facf31c54b2c32d7d45d8bd2f695d7f789f04b84c579ef2abc4
3
+ metadata.gz: eafb6443ba3020bb242ceba65c0043dda61b5de37a6549173d0b9ec31d5157e4
4
+ data.tar.gz: 744e6423f793f07fdce00d11d567e840d8bb59df8f3838e3403fabbc4d9c67b8
5
5
  SHA512:
6
- metadata.gz: 1fa47b2e26e99fc72dbda6f16155848de64da9b59da6aa68cc8ecdfca127395b0887c8e4ecd3ecaa2a3acab2e937c7175aa50f35c4a6b8d39bef0c906286b2e3
7
- data.tar.gz: eeb8d1d8db1bebda97e164932b4e878374945d1940f8515d2f0b308bd922361fff2e1ae035f5044fb43ea405a283109a407c4a9fc32c145b200526ff3afbe213
6
+ metadata.gz: 6d9860589443562ac1c8619f52d560805ced707c789bf1232000e2c05c5f565ede2e532dc2c399c4bf8797e98c9a245ebebc56f1e4ae7e01ad0e81f24c6aa66d
7
+ data.tar.gz: c8aff408c8bdc6941712262016f089fb6b5d50858c7b4afd9c8c66e286c9df6117accbccfdafbf22ef8159d1a9cca2997af226b1a204860dfafa35d82d5ff9ec
@@ -1,3 +1,3 @@
1
1
  module MyersDiff
2
- VERSION = "1.1.0".freeze
2
+ VERSION = "1.1.1".freeze
3
3
  end
@@ -1,5 +1,8 @@
1
1
  module MyersDiff
2
2
  class WordDiff
3
+ BOUNDARIES_REGEX = /(\s+|[()\[\]{}'"]|\b)/.freeze
4
+ EXTENDED_WORD_CHARS_REGEX = /^[a-zA-Z\u{C0}-\u{FF}\u{D8}-\u{F6}\u{F8}-\u{2C6}\u{2C8}-\u{2D7}\u{2DE}-\u{2FF}\u{1E00}-\u{1EFF}]+$/u.freeze
5
+
3
6
  def diff(s1, s2, **options)
4
7
  old_string = cast_input(s1)
5
8
  new_string = cast_input(s2)
@@ -117,11 +120,26 @@ module MyersDiff
117
120
  end
118
121
 
119
122
  def tokenize(str)
120
- str.split(' ')
123
+ tokens = str.split(BOUNDARIES_REGEX)
124
+
125
+ i = 0
126
+ while i < tokens.size - 1
127
+ if tokens[i + 1].empty? && !tokens[i + 2].empty? &&
128
+ EXTENDED_WORD_CHARS_REGEX.match?(tokens[i]) &&
129
+ EXTENDED_WORD_CHARS_REGEX.match?(tokens[i + 2])
130
+ tokens[i] += tokens[i + 2]
131
+ tokens.delete_at(i + 1)
132
+ tokens.delete_at(i + 1)
133
+ i -= 1
134
+ end
135
+ i += 1
136
+ end
137
+
138
+ tokens
121
139
  end
122
140
 
123
141
  def join(chars)
124
- chars.join(' ')
142
+ chars.join('')
125
143
  end
126
144
 
127
145
  # new_string - tokenized string i.e. array of strings
metadata CHANGED
@@ -1,14 +1,14 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: myers_diff
3
3
  version: !ruby/object:Gem::Version
4
- version: 1.1.0
4
+ version: 1.1.1
5
5
  platform: ruby
6
6
  authors:
7
7
  - Alex Tsui
8
8
  autorequire:
9
9
  bindir: bin
10
10
  cert_chain: []
11
- date: 2020-05-27 00:00:00.000000000 Z
11
+ date: 2020-05-28 00:00:00.000000000 Z
12
12
  dependencies: []
13
13
  description: Implementation of Myers 1986 text diff algorithm that started as a port
14
14
  of the jsdiff project with plans to branch out to human-friendly diffs