groonga 0.9.1 → 1.0.0
Sign up to get free protection for your applications and to get access to all the features.
- metadata +38 -227
- data/AUTHORS +0 -5
- data/NEWS.ja.rdoc +0 -114
- data/NEWS.rdoc +0 -116
- data/README.ja.rdoc +0 -63
- data/README.rdoc +0 -64
- data/Rakefile +0 -216
- data/benchmark/common.rb +0 -49
- data/benchmark/read-write-many-small-items.rb +0 -144
- data/benchmark/write-many-small-items.rb +0 -135
- data/example/bookmark.rb +0 -161
- data/example/index-html.rb +0 -89
- data/example/search/config.ru +0 -211
- data/example/search/public/css/groonga.css +0 -122
- data/ext/.gitignore +0 -2
- data/ext/rb-grn-accessor.c +0 -52
- data/ext/rb-grn-array-cursor.c +0 -36
- data/ext/rb-grn-array.c +0 -210
- data/ext/rb-grn-column.c +0 -570
- data/ext/rb-grn-context.c +0 -655
- data/ext/rb-grn-database.c +0 -415
- data/ext/rb-grn-encoding-support.c +0 -64
- data/ext/rb-grn-encoding.c +0 -257
- data/ext/rb-grn-exception.c +0 -1110
- data/ext/rb-grn-expression-builder.c +0 -75
- data/ext/rb-grn-expression.c +0 -732
- data/ext/rb-grn-fix-size-column.c +0 -166
- data/ext/rb-grn-hash-cursor.c +0 -38
- data/ext/rb-grn-hash.c +0 -294
- data/ext/rb-grn-index-column.c +0 -488
- data/ext/rb-grn-logger.c +0 -325
- data/ext/rb-grn-object.c +0 -1335
- data/ext/rb-grn-operation.c +0 -198
- data/ext/rb-grn-patricia-trie-cursor.c +0 -39
- data/ext/rb-grn-patricia-trie.c +0 -488
- data/ext/rb-grn-procedure.c +0 -52
- data/ext/rb-grn-query.c +0 -260
- data/ext/rb-grn-record.c +0 -40
- data/ext/rb-grn-snippet.c +0 -328
- data/ext/rb-grn-table-cursor-key-support.c +0 -69
- data/ext/rb-grn-table-cursor.c +0 -246
- data/ext/rb-grn-table-key-support.c +0 -731
- data/ext/rb-grn-table.c +0 -2038
- data/ext/rb-grn-type.c +0 -181
- data/ext/rb-grn-utils.c +0 -769
- data/ext/rb-grn-variable-size-column.c +0 -36
- data/ext/rb-grn-variable.c +0 -108
- data/ext/rb-grn.h +0 -684
- data/ext/rb-groonga.c +0 -113
- data/extconf.rb +0 -216
- data/html/bar.svg +0 -153
- data/html/developer.html +0 -121
- data/html/developer.svg +0 -469
- data/html/download.svg +0 -253
- data/html/favicon.ico +0 -0
- data/html/favicon.xcf +0 -0
- data/html/footer.html.erb +0 -28
- data/html/head.html.erb +0 -4
- data/html/header.html.erb +0 -17
- data/html/index.html +0 -147
- data/html/install.svg +0 -636
- data/html/logo.xcf +0 -0
- data/html/ranguba.css +0 -248
- data/html/tutorial.svg +0 -559
- data/lib/groonga.rb +0 -83
- data/lib/groonga/expression-builder.rb +0 -285
- data/lib/groonga/patricia-trie.rb +0 -53
- data/lib/groonga/record.rb +0 -276
- data/lib/groonga/schema.rb +0 -916
- data/license/GPL +0 -340
- data/license/LGPL +0 -504
- data/license/RUBY +0 -59
- data/misc/grnop2ruby.rb +0 -49
- data/pkg-config.rb +0 -333
- data/src/rb-grn-table-cursor.c +0 -296
- data/test-unit/Rakefile +0 -40
- data/test-unit/TODO +0 -5
- data/test-unit/bin/testrb +0 -5
- data/test-unit/html/classic.html +0 -15
- data/test-unit/html/index.html +0 -25
- data/test-unit/html/index.html.ja +0 -27
- data/test-unit/lib/test/unit.rb +0 -323
- data/test-unit/lib/test/unit/assertionfailederror.rb +0 -25
- data/test-unit/lib/test/unit/assertions.rb +0 -1230
- data/test-unit/lib/test/unit/attribute.rb +0 -125
- data/test-unit/lib/test/unit/autorunner.rb +0 -353
- data/test-unit/lib/test/unit/collector.rb +0 -36
- data/test-unit/lib/test/unit/collector/descendant.rb +0 -23
- data/test-unit/lib/test/unit/collector/dir.rb +0 -108
- data/test-unit/lib/test/unit/collector/load.rb +0 -136
- data/test-unit/lib/test/unit/collector/objectspace.rb +0 -34
- data/test-unit/lib/test/unit/color-scheme.rb +0 -102
- data/test-unit/lib/test/unit/color.rb +0 -96
- data/test-unit/lib/test/unit/diff.rb +0 -724
- data/test-unit/lib/test/unit/error.rb +0 -130
- data/test-unit/lib/test/unit/exceptionhandler.rb +0 -39
- data/test-unit/lib/test/unit/failure.rb +0 -136
- data/test-unit/lib/test/unit/fixture.rb +0 -176
- data/test-unit/lib/test/unit/notification.rb +0 -129
- data/test-unit/lib/test/unit/omission.rb +0 -191
- data/test-unit/lib/test/unit/pending.rb +0 -150
- data/test-unit/lib/test/unit/priority.rb +0 -181
- data/test-unit/lib/test/unit/runner/console.rb +0 -52
- data/test-unit/lib/test/unit/runner/emacs.rb +0 -8
- data/test-unit/lib/test/unit/runner/tap.rb +0 -8
- data/test-unit/lib/test/unit/testcase.rb +0 -476
- data/test-unit/lib/test/unit/testresult.rb +0 -89
- data/test-unit/lib/test/unit/testsuite.rb +0 -110
- data/test-unit/lib/test/unit/ui/console/outputlevel.rb +0 -14
- data/test-unit/lib/test/unit/ui/console/testrunner.rb +0 -464
- data/test-unit/lib/test/unit/ui/emacs/testrunner.rb +0 -63
- data/test-unit/lib/test/unit/ui/tap/testrunner.rb +0 -92
- data/test-unit/lib/test/unit/ui/testrunner.rb +0 -28
- data/test-unit/lib/test/unit/ui/testrunnermediator.rb +0 -77
- data/test-unit/lib/test/unit/ui/testrunnerutilities.rb +0 -41
- data/test-unit/lib/test/unit/util/backtracefilter.rb +0 -41
- data/test-unit/lib/test/unit/util/method-owner-finder.rb +0 -28
- data/test-unit/lib/test/unit/util/observable.rb +0 -90
- data/test-unit/lib/test/unit/util/procwrapper.rb +0 -48
- data/test-unit/lib/test/unit/version.rb +0 -7
- data/test-unit/sample/adder.rb +0 -13
- data/test-unit/sample/subtracter.rb +0 -12
- data/test-unit/sample/test_adder.rb +0 -20
- data/test-unit/sample/test_subtracter.rb +0 -20
- data/test-unit/sample/test_user.rb +0 -23
- data/test-unit/test/collector/test-descendant.rb +0 -133
- data/test-unit/test/collector/test-load.rb +0 -329
- data/test-unit/test/collector/test_dir.rb +0 -406
- data/test-unit/test/collector/test_objectspace.rb +0 -100
- data/test-unit/test/run-test.rb +0 -15
- data/test-unit/test/test-attribute.rb +0 -86
- data/test-unit/test/test-color-scheme.rb +0 -67
- data/test-unit/test/test-color.rb +0 -47
- data/test-unit/test/test-diff.rb +0 -518
- data/test-unit/test/test-emacs-runner.rb +0 -60
- data/test-unit/test/test-fixture.rb +0 -287
- data/test-unit/test/test-notification.rb +0 -33
- data/test-unit/test/test-omission.rb +0 -81
- data/test-unit/test/test-pending.rb +0 -70
- data/test-unit/test/test-priority.rb +0 -119
- data/test-unit/test/test-testcase.rb +0 -554
- data/test-unit/test/test_assertions.rb +0 -1151
- data/test-unit/test/test_error.rb +0 -26
- data/test-unit/test/test_failure.rb +0 -33
- data/test-unit/test/test_testresult.rb +0 -113
- data/test-unit/test/test_testsuite.rb +0 -129
- data/test-unit/test/testunit-test-util.rb +0 -14
- data/test-unit/test/ui/test_testrunmediator.rb +0 -20
- data/test-unit/test/util/test-method-owner-finder.rb +0 -38
- data/test-unit/test/util/test_backtracefilter.rb +0 -41
- data/test-unit/test/util/test_observable.rb +0 -102
- data/test-unit/test/util/test_procwrapper.rb +0 -36
- data/test/.gitignore +0 -1
- data/test/groonga-test-utils.rb +0 -106
- data/test/run-test.rb +0 -58
- data/test/test-array.rb +0 -97
- data/test/test-column.rb +0 -298
- data/test/test-context.rb +0 -73
- data/test/test-database.rb +0 -113
- data/test/test-encoding.rb +0 -33
- data/test/test-exception.rb +0 -93
- data/test/test-expression-builder.rb +0 -156
- data/test/test-expression.rb +0 -133
- data/test/test-fix-size-column.rb +0 -65
- data/test/test-gqtp.rb +0 -70
- data/test/test-hash.rb +0 -312
- data/test/test-index-column.rb +0 -81
- data/test/test-patricia-trie.rb +0 -189
- data/test/test-procedure.rb +0 -37
- data/test/test-query.rb +0 -22
- data/test/test-record.rb +0 -268
- data/test/test-remote.rb +0 -53
- data/test/test-schema.rb +0 -416
- data/test/test-snippet.rb +0 -121
- data/test/test-table-cursor.rb +0 -153
- data/test/test-table-offset-and-limit.rb +0 -102
- data/test/test-table-select-normalize.rb +0 -48
- data/test/test-table-select.rb +0 -145
- data/test/test-table.rb +0 -642
- data/test/test-type.rb +0 -61
- data/test/test-variable-size-column.rb +0 -98
- data/test/test-variable.rb +0 -28
- data/test/test-vector-column.rb +0 -76
- data/test/test-version.rb +0 -31
- data/text/TUTORIAL.ja.rdoc +0 -392
- data/text/expression.rdoc +0 -284
@@ -1,724 +0,0 @@
|
|
1
|
-
# port of Python's difflib.
|
2
|
-
|
3
|
-
module Test
|
4
|
-
module Unit
|
5
|
-
module Diff
|
6
|
-
class SequenceMatcher
|
7
|
-
def initialize(from, to, &junk_predicate)
|
8
|
-
@from = from
|
9
|
-
@to = to
|
10
|
-
@junk_predicate = junk_predicate
|
11
|
-
update_to_indexes
|
12
|
-
end
|
13
|
-
|
14
|
-
def longest_match(from_start, from_end, to_start, to_end)
|
15
|
-
best_info = find_best_match_position(from_start, from_end,
|
16
|
-
to_start, to_end)
|
17
|
-
unless @junks.empty?
|
18
|
-
args = [from_start, from_end, to_start, to_end]
|
19
|
-
best_info = adjust_best_info_with_junk_predicate(false, best_info,
|
20
|
-
*args)
|
21
|
-
best_info = adjust_best_info_with_junk_predicate(true, best_info,
|
22
|
-
*args)
|
23
|
-
end
|
24
|
-
|
25
|
-
best_info
|
26
|
-
end
|
27
|
-
|
28
|
-
def blocks
|
29
|
-
@blocks ||= compute_blocks
|
30
|
-
end
|
31
|
-
|
32
|
-
def operations
|
33
|
-
@operations ||= compute_operations
|
34
|
-
end
|
35
|
-
|
36
|
-
def grouped_operations(context_size=nil)
|
37
|
-
context_size ||= 3
|
38
|
-
_operations = operations.dup
|
39
|
-
_operations = [[:equal, 0, 0, 0, 0]] if _operations.empty?
|
40
|
-
expand_edge_equal_operations!(_operations, context_size)
|
41
|
-
|
42
|
-
group_window = context_size * 2
|
43
|
-
groups = []
|
44
|
-
group = []
|
45
|
-
_operations.each do |tag, from_start, from_end, to_start, to_end|
|
46
|
-
if tag == :equal and from_end - from_start > group_window
|
47
|
-
group << [tag,
|
48
|
-
from_start,
|
49
|
-
[from_end, from_start + context_size].min,
|
50
|
-
to_start,
|
51
|
-
[to_end, to_start + context_size].min]
|
52
|
-
groups << group
|
53
|
-
group = []
|
54
|
-
from_start = [from_start, from_end - context_size].max
|
55
|
-
to_start = [to_start, to_end - context_size].max
|
56
|
-
end
|
57
|
-
group << [tag, from_start, from_end, to_start, to_end]
|
58
|
-
end
|
59
|
-
groups << group unless group.empty?
|
60
|
-
groups
|
61
|
-
end
|
62
|
-
|
63
|
-
def ratio
|
64
|
-
@ratio ||= compute_ratio
|
65
|
-
end
|
66
|
-
|
67
|
-
private
|
68
|
-
def update_to_indexes
|
69
|
-
@to_indexes = {}
|
70
|
-
@junks = {}
|
71
|
-
if @to.is_a?(String)
|
72
|
-
each = " "[0].is_a?(Integer) ? :each_byte : :each_char
|
73
|
-
else
|
74
|
-
each = :each
|
75
|
-
end
|
76
|
-
i = 0
|
77
|
-
@to.send(each) do |item|
|
78
|
-
@to_indexes[item] ||= []
|
79
|
-
@to_indexes[item] << i
|
80
|
-
i += 1
|
81
|
-
end
|
82
|
-
|
83
|
-
return if @junk_predicate.nil?
|
84
|
-
@to_indexes = @to_indexes.reject do |key, value|
|
85
|
-
junk = @junk_predicate.call(key)
|
86
|
-
@junks[key] = true if junk
|
87
|
-
junk
|
88
|
-
end
|
89
|
-
end
|
90
|
-
|
91
|
-
def find_best_match_position(from_start, from_end, to_start, to_end)
|
92
|
-
best_from, best_to, best_size = from_start, to_start, 0
|
93
|
-
sizes = {}
|
94
|
-
from_start.upto(from_end) do |from_index|
|
95
|
-
_sizes = {}
|
96
|
-
(@to_indexes[@from[from_index]] || []).each do |to_index|
|
97
|
-
next if to_index < to_start
|
98
|
-
break if to_index > to_end
|
99
|
-
size = _sizes[to_index] = (sizes[to_index - 1] || 0) + 1
|
100
|
-
if size > best_size
|
101
|
-
best_from = from_index - size + 1
|
102
|
-
best_to = to_index - size + 1
|
103
|
-
best_size = size
|
104
|
-
end
|
105
|
-
end
|
106
|
-
sizes = _sizes
|
107
|
-
end
|
108
|
-
[best_from, best_to, best_size]
|
109
|
-
end
|
110
|
-
|
111
|
-
def adjust_best_info_with_junk_predicate(should_junk, best_info,
|
112
|
-
from_start, from_end,
|
113
|
-
to_start, to_end)
|
114
|
-
best_from, best_to, best_size = best_info
|
115
|
-
while best_from > from_start and best_to > to_start and
|
116
|
-
(should_junk ?
|
117
|
-
@junks.has_key?(@to[best_to - 1]) :
|
118
|
-
!@junks.has_key?(@to[best_to - 1])) and
|
119
|
-
@from[best_from - 1] == @to[best_to - 1]
|
120
|
-
best_from -= 1
|
121
|
-
best_to -= 1
|
122
|
-
best_size += 1
|
123
|
-
end
|
124
|
-
|
125
|
-
while best_from + best_size < from_end and
|
126
|
-
best_to + best_size < to_end and
|
127
|
-
(should_junk ?
|
128
|
-
@junks.has_key?(@to[best_to + best_size]) :
|
129
|
-
!@junks.has_key?(@to[best_to + best_size])) and
|
130
|
-
@from[best_from + best_size] == @to[best_to + best_size]
|
131
|
-
best_size += 1
|
132
|
-
end
|
133
|
-
|
134
|
-
[best_from, best_to, best_size]
|
135
|
-
end
|
136
|
-
|
137
|
-
def matches
|
138
|
-
@matches ||= compute_matches
|
139
|
-
end
|
140
|
-
|
141
|
-
def compute_matches
|
142
|
-
matches = []
|
143
|
-
queue = [[0, @from.size, 0, @to.size]]
|
144
|
-
until queue.empty?
|
145
|
-
from_start, from_end, to_start, to_end = queue.pop
|
146
|
-
match = longest_match(from_start, from_end - 1, to_start, to_end - 1)
|
147
|
-
match_from_index, match_to_index, size = match
|
148
|
-
unless size.zero?
|
149
|
-
if from_start < match_from_index and
|
150
|
-
to_start < match_to_index
|
151
|
-
queue.push([from_start, match_from_index,
|
152
|
-
to_start, match_to_index])
|
153
|
-
end
|
154
|
-
matches << match
|
155
|
-
if match_from_index + size < from_end and
|
156
|
-
match_to_index + size < to_end
|
157
|
-
queue.push([match_from_index + size, from_end,
|
158
|
-
match_to_index + size, to_end])
|
159
|
-
end
|
160
|
-
end
|
161
|
-
end
|
162
|
-
matches.sort_by do |(from_index, to_index, match_size)|
|
163
|
-
from_index
|
164
|
-
end
|
165
|
-
end
|
166
|
-
|
167
|
-
def compute_blocks
|
168
|
-
blocks = []
|
169
|
-
current_from_index = current_to_index = current_size = 0
|
170
|
-
matches.each do |from_index, to_index, size|
|
171
|
-
if current_from_index + current_size == from_index and
|
172
|
-
current_to_index + current_size == to_index
|
173
|
-
current_size += size
|
174
|
-
else
|
175
|
-
unless current_size.zero?
|
176
|
-
blocks << [current_from_index, current_to_index, current_size]
|
177
|
-
end
|
178
|
-
current_from_index = from_index
|
179
|
-
current_to_index = to_index
|
180
|
-
current_size = size
|
181
|
-
end
|
182
|
-
end
|
183
|
-
unless current_size.zero?
|
184
|
-
blocks << [current_from_index, current_to_index, current_size]
|
185
|
-
end
|
186
|
-
|
187
|
-
blocks << [@from.size, @to.size, 0]
|
188
|
-
blocks
|
189
|
-
end
|
190
|
-
|
191
|
-
def compute_operations
|
192
|
-
from_index = to_index = 0
|
193
|
-
operations = []
|
194
|
-
blocks.each do |match_from_index, match_to_index, size|
|
195
|
-
tag = determine_tag(from_index, to_index,
|
196
|
-
match_from_index, match_to_index)
|
197
|
-
if tag != :equal
|
198
|
-
operations << [tag,
|
199
|
-
from_index, match_from_index,
|
200
|
-
to_index, match_to_index]
|
201
|
-
end
|
202
|
-
|
203
|
-
from_index, to_index = match_from_index + size, match_to_index + size
|
204
|
-
if size > 0
|
205
|
-
operations << [:equal,
|
206
|
-
match_from_index, from_index,
|
207
|
-
match_to_index, to_index]
|
208
|
-
end
|
209
|
-
end
|
210
|
-
operations
|
211
|
-
end
|
212
|
-
|
213
|
-
def compute_ratio
|
214
|
-
matches = blocks.inject(0) {|result, block| result + block[-1]}
|
215
|
-
length = @from.length + @to.length
|
216
|
-
if length.zero?
|
217
|
-
1.0
|
218
|
-
else
|
219
|
-
2.0 * matches / length
|
220
|
-
end
|
221
|
-
end
|
222
|
-
|
223
|
-
def determine_tag(from_index, to_index,
|
224
|
-
match_from_index, match_to_index)
|
225
|
-
if from_index < match_from_index and to_index < match_to_index
|
226
|
-
:replace
|
227
|
-
elsif from_index < match_from_index
|
228
|
-
:delete
|
229
|
-
elsif to_index < match_to_index
|
230
|
-
:insert
|
231
|
-
else
|
232
|
-
:equal
|
233
|
-
end
|
234
|
-
end
|
235
|
-
|
236
|
-
def expand_edge_equal_operations!(_operations, context_size)
|
237
|
-
tag, from_start, from_end, to_start, to_end = _operations[0]
|
238
|
-
if tag == :equal
|
239
|
-
_operations[0] = [tag,
|
240
|
-
[from_start, from_end - context_size].max,
|
241
|
-
from_end,
|
242
|
-
[to_start, to_end - context_size].max,
|
243
|
-
to_end]
|
244
|
-
end
|
245
|
-
|
246
|
-
tag, from_start, from_end, to_start, to_end = _operations[-1]
|
247
|
-
if tag == :equal
|
248
|
-
_operations[-1] = [tag,
|
249
|
-
from_start,
|
250
|
-
[from_end, from_start + context_size].min,
|
251
|
-
to_start,
|
252
|
-
[to_end, to_start + context_size].min]
|
253
|
-
end
|
254
|
-
end
|
255
|
-
end
|
256
|
-
|
257
|
-
class Differ
|
258
|
-
def initialize(from, to)
|
259
|
-
@from = from
|
260
|
-
@to = to
|
261
|
-
end
|
262
|
-
|
263
|
-
private
|
264
|
-
def tag(mark, contents)
|
265
|
-
contents.collect {|content| "#{mark}#{content}"}
|
266
|
-
end
|
267
|
-
end
|
268
|
-
|
269
|
-
class UTF8Line
|
270
|
-
class << self
|
271
|
-
# from http://unicode.org/reports/tr11/
|
272
|
-
WIDE_CHARACTERS =
|
273
|
-
[0x1100..0x1159, 0x115F..0x115F, 0x2329..0x232A,
|
274
|
-
0x2E80..0x2E99, 0x2E9B..0x2EF3, 0x2F00..0x2FD5,
|
275
|
-
0x2FF0..0x2FFB, 0x3000..0x303E, 0x3041..0x3096,
|
276
|
-
0x3099..0x30FF, 0x3105..0x312D, 0x3131..0x318E,
|
277
|
-
0x3190..0x31B7, 0x31C0..0x31E3, 0x31F0..0x321E,
|
278
|
-
0x3220..0x3243, 0x3250..0x32FE, 0x3300..0x4DB5,
|
279
|
-
0x4E00..0x9FC3, 0xA000..0xA48C, 0xA490..0xA4C6,
|
280
|
-
0xAC00..0xD7A3, 0xF900..0xFA2D, 0xFA30..0xFA6A,
|
281
|
-
0xFA70..0xFAD9, 0xFE10..0xFE19, 0xFE30..0xFE52,
|
282
|
-
0xFE54..0xFE66, 0xFE68..0xFE6B, 0xFF01..0xFF60,
|
283
|
-
0xFFE0..0xFFE6, 0x20000..0x2FFFD, 0x30000..0x3FFFD,
|
284
|
-
]
|
285
|
-
|
286
|
-
AMBIGUOUS =
|
287
|
-
[0x00A1..0x00A1, 0x00A4..0x00A4, 0x00A7..0x00A8,
|
288
|
-
0x00AA..0x00AA, 0x00AD..0x00AE, 0x00B0..0x00B4,
|
289
|
-
0x00B6..0x00BA, 0x00BC..0x00BF, 0x00C6..0x00C6,
|
290
|
-
0x00D0..0x00D0, 0x00D7..0x00D8, 0x00DE..0x00E1,
|
291
|
-
0x00E6..0x00E6, 0x00E8..0x00EA, 0x00EC..0x00ED,
|
292
|
-
0x00F0..0x00F0, 0x00F2..0x00F3, 0x00F7..0x00FA,
|
293
|
-
0x00FC..0x00FC, 0x00FE..0x00FE, 0x0101..0x0101,
|
294
|
-
0x0111..0x0111, 0x0113..0x0113, 0x011B..0x011B,
|
295
|
-
0x0126..0x0127, 0x012B..0x012B, 0x0131..0x0133,
|
296
|
-
0x0138..0x0138, 0x013F..0x0142, 0x0144..0x0144,
|
297
|
-
0x0148..0x014B, 0x014D..0x014D, 0x0152..0x0153,
|
298
|
-
0x0166..0x0167, 0x016B..0x016B, 0x01CE..0x01CE,
|
299
|
-
0x01D0..0x01D0, 0x01D2..0x01D2, 0x01D4..0x01D4,
|
300
|
-
0x01D6..0x01D6, 0x01D8..0x01D8, 0x01DA..0x01DA,
|
301
|
-
0x01DC..0x01DC, 0x0251..0x0251, 0x0261..0x0261,
|
302
|
-
0x02C4..0x02C4, 0x02C7..0x02C7, 0x02C9..0x02CB,
|
303
|
-
0x02CD..0x02CD, 0x02D0..0x02D0, 0x02D8..0x02DB,
|
304
|
-
0x02DD..0x02DD, 0x02DF..0x02DF, 0x0300..0x036F,
|
305
|
-
0x0391..0x03A1, 0x03A3..0x03A9, 0x03B1..0x03C1,
|
306
|
-
0x03C3..0x03C9, 0x0401..0x0401, 0x0410..0x044F,
|
307
|
-
0x0451..0x0451, 0x2010..0x2010, 0x2013..0x2016,
|
308
|
-
0x2018..0x2019, 0x201C..0x201D, 0x2020..0x2022,
|
309
|
-
0x2024..0x2027, 0x2030..0x2030, 0x2032..0x2033,
|
310
|
-
0x2035..0x2035, 0x203B..0x203B, 0x203E..0x203E,
|
311
|
-
0x2074..0x2074, 0x207F..0x207F, 0x2081..0x2084,
|
312
|
-
0x20AC..0x20AC, 0x2103..0x2103, 0x2105..0x2105,
|
313
|
-
0x2109..0x2109, 0x2113..0x2113, 0x2116..0x2116,
|
314
|
-
0x2121..0x2122, 0x2126..0x2126, 0x212B..0x212B,
|
315
|
-
0x2153..0x2154, 0x215B..0x215E, 0x2160..0x216B,
|
316
|
-
0x2170..0x2179, 0x2190..0x2199, 0x21B8..0x21B9,
|
317
|
-
0x21D2..0x21D2, 0x21D4..0x21D4, 0x21E7..0x21E7,
|
318
|
-
0x2200..0x2200, 0x2202..0x2203, 0x2207..0x2208,
|
319
|
-
0x220B..0x220B, 0x220F..0x220F, 0x2211..0x2211,
|
320
|
-
0x2215..0x2215, 0x221A..0x221A, 0x221D..0x2220,
|
321
|
-
0x2223..0x2223, 0x2225..0x2225, 0x2227..0x222C,
|
322
|
-
0x222E..0x222E, 0x2234..0x2237, 0x223C..0x223D,
|
323
|
-
0x2248..0x2248, 0x224C..0x224C, 0x2252..0x2252,
|
324
|
-
0x2260..0x2261, 0x2264..0x2267, 0x226A..0x226B,
|
325
|
-
0x226E..0x226F, 0x2282..0x2283, 0x2286..0x2287,
|
326
|
-
0x2295..0x2295, 0x2299..0x2299, 0x22A5..0x22A5,
|
327
|
-
0x22BF..0x22BF, 0x2312..0x2312, 0x2460..0x24E9,
|
328
|
-
0x24EB..0x254B, 0x2550..0x2573, 0x2580..0x258F,
|
329
|
-
0x2592..0x2595, 0x25A0..0x25A1, 0x25A3..0x25A9,
|
330
|
-
0x25B2..0x25B3, 0x25B6..0x25B7, 0x25BC..0x25BD,
|
331
|
-
0x25C0..0x25C1, 0x25C6..0x25C8, 0x25CB..0x25CB,
|
332
|
-
0x25CE..0x25D1, 0x25E2..0x25E5, 0x25EF..0x25EF,
|
333
|
-
0x2605..0x2606, 0x2609..0x2609, 0x260E..0x260F,
|
334
|
-
0x2614..0x2615, 0x261C..0x261C, 0x261E..0x261E,
|
335
|
-
0x2640..0x2640, 0x2642..0x2642, 0x2660..0x2661,
|
336
|
-
0x2663..0x2665, 0x2667..0x266A, 0x266C..0x266D,
|
337
|
-
0x266F..0x266F, 0x273D..0x273D, 0x2776..0x277F,
|
338
|
-
0xE000..0xF8FF, 0xFE00..0xFE0F, 0xFFFD..0xFFFD,
|
339
|
-
0xE0100..0xE01EF, 0xF0000..0xFFFFD, 0x100000..0x10FFFD,
|
340
|
-
]
|
341
|
-
|
342
|
-
def wide_character?(character)
|
343
|
-
binary_search_ranges(character, WIDE_CHARACTERS) or
|
344
|
-
binary_search_ranges(character, AMBIGUOUS)
|
345
|
-
end
|
346
|
-
|
347
|
-
private
|
348
|
-
def binary_search_ranges(character, ranges)
|
349
|
-
if ranges.size.zero?
|
350
|
-
false
|
351
|
-
elsif ranges.size == 1
|
352
|
-
ranges[0].include?(character)
|
353
|
-
else
|
354
|
-
half = ranges.size / 2
|
355
|
-
range = ranges[half]
|
356
|
-
if range.include?(character)
|
357
|
-
true
|
358
|
-
elsif character < range.begin
|
359
|
-
binary_search_ranges(character, ranges[0...half])
|
360
|
-
else
|
361
|
-
binary_search_ranges(character, ranges[(half + 1)..-1])
|
362
|
-
end
|
363
|
-
end
|
364
|
-
end
|
365
|
-
end
|
366
|
-
|
367
|
-
def initialize(line)
|
368
|
-
@line = line
|
369
|
-
@characters = @line.unpack("U*")
|
370
|
-
end
|
371
|
-
|
372
|
-
def [](*args)
|
373
|
-
result = @characters[*args]
|
374
|
-
if result.respond_to?(:pack)
|
375
|
-
result.pack("U*")
|
376
|
-
else
|
377
|
-
result
|
378
|
-
end
|
379
|
-
end
|
380
|
-
|
381
|
-
def each(&block)
|
382
|
-
@characters.each(&block)
|
383
|
-
end
|
384
|
-
|
385
|
-
def size
|
386
|
-
@characters.size
|
387
|
-
end
|
388
|
-
|
389
|
-
def to_s
|
390
|
-
@line
|
391
|
-
end
|
392
|
-
|
393
|
-
def compute_width(start, _end)
|
394
|
-
width = 0
|
395
|
-
start.upto(_end - 1) do |i|
|
396
|
-
if self.class.wide_character?(@characters[i])
|
397
|
-
width += 2
|
398
|
-
else
|
399
|
-
width += 1
|
400
|
-
end
|
401
|
-
end
|
402
|
-
width
|
403
|
-
end
|
404
|
-
end
|
405
|
-
|
406
|
-
class ReadableDiffer < Differ
|
407
|
-
def diff(options={})
|
408
|
-
@result = []
|
409
|
-
operations.each do |tag, from_start, from_end, to_start, to_end|
|
410
|
-
case tag
|
411
|
-
when :replace
|
412
|
-
diff_lines(from_start, from_end, to_start, to_end)
|
413
|
-
when :delete
|
414
|
-
tag_deleted(@from[from_start...from_end])
|
415
|
-
when :insert
|
416
|
-
tag_inserted(@to[to_start...to_end])
|
417
|
-
when :equal
|
418
|
-
tag_equal(@from[from_start...from_end])
|
419
|
-
else
|
420
|
-
raise "unknown tag: #{tag}"
|
421
|
-
end
|
422
|
-
end
|
423
|
-
@result
|
424
|
-
end
|
425
|
-
|
426
|
-
private
|
427
|
-
def operations
|
428
|
-
@operations ||= nil
|
429
|
-
if @operations.nil?
|
430
|
-
matcher = SequenceMatcher.new(@from, @to)
|
431
|
-
@operations = matcher.operations
|
432
|
-
end
|
433
|
-
@operations
|
434
|
-
end
|
435
|
-
|
436
|
-
def default_ratio
|
437
|
-
0.74
|
438
|
-
end
|
439
|
-
|
440
|
-
def cut_off_ratio
|
441
|
-
0.75
|
442
|
-
end
|
443
|
-
|
444
|
-
def tag(mark, contents)
|
445
|
-
contents.each do |content|
|
446
|
-
@result << "#{mark}#{content}"
|
447
|
-
end
|
448
|
-
end
|
449
|
-
|
450
|
-
def tag_deleted(contents)
|
451
|
-
tag("- ", contents)
|
452
|
-
end
|
453
|
-
|
454
|
-
def tag_inserted(contents)
|
455
|
-
tag("+ ", contents)
|
456
|
-
end
|
457
|
-
|
458
|
-
def tag_equal(contents)
|
459
|
-
tag(" ", contents)
|
460
|
-
end
|
461
|
-
|
462
|
-
def tag_difference(contents)
|
463
|
-
tag("? ", contents)
|
464
|
-
end
|
465
|
-
|
466
|
-
def find_diff_line_info(from_start, from_end, to_start, to_end)
|
467
|
-
best_ratio = default_ratio
|
468
|
-
from_equal_index = to_equal_index = nil
|
469
|
-
from_best_index = to_best_index = nil
|
470
|
-
|
471
|
-
to_start.upto(to_end - 1) do |to_index|
|
472
|
-
from_start.upto(from_end - 1) do |from_index|
|
473
|
-
if @from[from_index] == @to[to_index]
|
474
|
-
from_equal_index ||= from_index
|
475
|
-
to_equal_index ||= to_index
|
476
|
-
next
|
477
|
-
end
|
478
|
-
|
479
|
-
matcher = SequenceMatcher.new(@from[from_index], @to[to_index],
|
480
|
-
&method(:space_character?))
|
481
|
-
if matcher.ratio > best_ratio
|
482
|
-
best_ratio = matcher.ratio
|
483
|
-
from_best_index = from_index
|
484
|
-
to_best_index = to_index
|
485
|
-
end
|
486
|
-
end
|
487
|
-
end
|
488
|
-
|
489
|
-
[best_ratio,
|
490
|
-
from_equal_index, to_equal_index,
|
491
|
-
from_best_index, to_best_index]
|
492
|
-
end
|
493
|
-
|
494
|
-
def diff_lines(from_start, from_end, to_start, to_end)
|
495
|
-
info = find_diff_line_info(from_start, from_end, to_start, to_end)
|
496
|
-
best_ratio, from_equal_index, to_equal_index, *info = info
|
497
|
-
from_best_index, to_best_index = info
|
498
|
-
from_best_index ||= from_start
|
499
|
-
to_best_index ||= to_start
|
500
|
-
|
501
|
-
if best_ratio < cut_off_ratio
|
502
|
-
if from_equal_index.nil?
|
503
|
-
if to_end - to_start < from_end - from_start
|
504
|
-
tag_inserted(@to[to_start...to_end])
|
505
|
-
tag_deleted(@from[from_start...from_end])
|
506
|
-
else
|
507
|
-
tag_deleted(@from[from_start...from_end])
|
508
|
-
tag_inserted(@to[to_start...to_end])
|
509
|
-
end
|
510
|
-
return
|
511
|
-
end
|
512
|
-
from_best_index = from_equal_index
|
513
|
-
to_best_index = to_equal_index
|
514
|
-
best_ratio = 1.0
|
515
|
-
end
|
516
|
-
|
517
|
-
_diff_lines(from_start, from_best_index, to_start, to_best_index)
|
518
|
-
diff_line(@from[from_best_index], @to[to_best_index])
|
519
|
-
_diff_lines(from_best_index + 1, from_end, to_best_index + 1, to_end)
|
520
|
-
end
|
521
|
-
|
522
|
-
def _diff_lines(from_start, from_end, to_start, to_end)
|
523
|
-
if from_start < from_end
|
524
|
-
if to_start < to_end
|
525
|
-
diff_lines(from_start, from_end, to_start, to_end)
|
526
|
-
else
|
527
|
-
tag_deleted(@from[from_start...from_end])
|
528
|
-
end
|
529
|
-
else
|
530
|
-
tag_inserted(@to[to_start...to_end])
|
531
|
-
end
|
532
|
-
end
|
533
|
-
|
534
|
-
def line_operations(from_line, to_line)
|
535
|
-
if !from_line.respond_to?(:force_encoding) and $KCODE == "UTF8"
|
536
|
-
from_line = UTF8Line.new(from_line)
|
537
|
-
to_line = UTF8Line.new(to_line)
|
538
|
-
end
|
539
|
-
matcher = SequenceMatcher.new(from_line, to_line,
|
540
|
-
&method(:space_character?))
|
541
|
-
[from_line, to_line, matcher.operations]
|
542
|
-
end
|
543
|
-
|
544
|
-
def compute_width(line, start, _end)
|
545
|
-
if line.respond_to?(:encoding) and
|
546
|
-
Encoding.compatible?(Encoding::UTF_8, line.encoding)
|
547
|
-
utf8_line = line[start..._end].encode(Encoding::UTF_8)
|
548
|
-
width = 0
|
549
|
-
utf8_line.each_codepoint do |unicode_codepoint|
|
550
|
-
if UTF8Line.wide_character?(unicode_codepoint)
|
551
|
-
width += 2
|
552
|
-
else
|
553
|
-
width += 1
|
554
|
-
end
|
555
|
-
end
|
556
|
-
width
|
557
|
-
elsif line.is_a?(UTF8Line)
|
558
|
-
line.compute_width(start, _end)
|
559
|
-
else
|
560
|
-
_end - start
|
561
|
-
end
|
562
|
-
end
|
563
|
-
|
564
|
-
def diff_line(from_line, to_line)
|
565
|
-
from_tags = ""
|
566
|
-
to_tags = ""
|
567
|
-
from_line, to_line, _operations = line_operations(from_line, to_line)
|
568
|
-
_operations.each do |tag, from_start, from_end, to_start, to_end|
|
569
|
-
from_width = compute_width(from_line, from_start, from_end)
|
570
|
-
to_width = compute_width(to_line, to_start, to_end)
|
571
|
-
case tag
|
572
|
-
when :replace
|
573
|
-
from_tags << "^" * from_width
|
574
|
-
to_tags << "^" * to_width
|
575
|
-
when :delete
|
576
|
-
from_tags << "-" * from_width
|
577
|
-
when :insert
|
578
|
-
to_tags << "+" * to_width
|
579
|
-
when :equal
|
580
|
-
from_tags << " " * from_width
|
581
|
-
to_tags << " " * to_width
|
582
|
-
else
|
583
|
-
raise "unknown tag: #{tag}"
|
584
|
-
end
|
585
|
-
end
|
586
|
-
format_diff_point(from_line, to_line, from_tags, to_tags)
|
587
|
-
end
|
588
|
-
|
589
|
-
def format_diff_point(from_line, to_line, from_tags, to_tags)
|
590
|
-
common = [n_leading_characters(from_line, ?\t),
|
591
|
-
n_leading_characters(to_line, ?\t)].min
|
592
|
-
common = [common,
|
593
|
-
n_leading_characters(from_tags[0, common], " "[0])].min
|
594
|
-
from_tags = from_tags[common..-1].rstrip
|
595
|
-
to_tags = to_tags[common..-1].rstrip
|
596
|
-
|
597
|
-
result = tag_deleted([from_line])
|
598
|
-
unless from_tags.empty?
|
599
|
-
tag_difference(["#{"\t" * common}#{from_tags}"])
|
600
|
-
end
|
601
|
-
tag_inserted([to_line])
|
602
|
-
unless to_tags.empty?
|
603
|
-
tag_difference(["#{"\t" * common}#{to_tags}"])
|
604
|
-
end
|
605
|
-
end
|
606
|
-
|
607
|
-
def n_leading_characters(string, character)
|
608
|
-
n = 0
|
609
|
-
while string[n] == character
|
610
|
-
n += 1
|
611
|
-
end
|
612
|
-
n
|
613
|
-
end
|
614
|
-
|
615
|
-
def space_character?(character)
|
616
|
-
[" "[0], "\t"[0]].include?(character)
|
617
|
-
end
|
618
|
-
end
|
619
|
-
|
620
|
-
class UnifiedDiffer < Differ
|
621
|
-
def diff(options={})
|
622
|
-
groups = SequenceMatcher.new(@from, @to).grouped_operations
|
623
|
-
return [] if groups.empty?
|
624
|
-
return [] if same_content?(groups)
|
625
|
-
|
626
|
-
show_context = options[:show_context]
|
627
|
-
show_context = true if show_context.nil?
|
628
|
-
result = ["--- #{options[:from_label]}".rstrip,
|
629
|
-
"+++ #{options[:to_label]}".rstrip]
|
630
|
-
groups.each do |operations|
|
631
|
-
result << format_summary(operations, show_context)
|
632
|
-
operations.each do |args|
|
633
|
-
operation_tag, from_start, from_end, to_start, to_end = args
|
634
|
-
case operation_tag
|
635
|
-
when :replace
|
636
|
-
result.concat(tag("-", @from[from_start...from_end]))
|
637
|
-
result.concat(tag("+", @to[to_start...to_end]))
|
638
|
-
when :delete
|
639
|
-
result.concat(tag("-", @from[from_start...from_end]))
|
640
|
-
when :insert
|
641
|
-
result.concat(tag("+", @to[to_start...to_end]))
|
642
|
-
when :equal
|
643
|
-
result.concat(tag(" ", @from[from_start...from_end]))
|
644
|
-
end
|
645
|
-
end
|
646
|
-
end
|
647
|
-
result
|
648
|
-
end
|
649
|
-
|
650
|
-
private
|
651
|
-
def same_content?(groups)
|
652
|
-
return false if groups.size != 1
|
653
|
-
group = groups[0]
|
654
|
-
return false if group.size != 1
|
655
|
-
tag, from_start, from_end, to_start, to_end = group[0]
|
656
|
-
|
657
|
-
tag == :equal and [from_start, from_end] == [to_start, to_end]
|
658
|
-
end
|
659
|
-
|
660
|
-
def format_summary(operations, show_context)
|
661
|
-
_, first_from_start, _, first_to_start, _ = operations[0]
|
662
|
-
_, _, last_from_end, _, last_to_end = operations[-1]
|
663
|
-
summary = "@@ -%d,%d +%d,%d @@" % [first_from_start + 1,
|
664
|
-
last_from_end - first_from_start,
|
665
|
-
first_to_start + 1,
|
666
|
-
last_to_end - first_to_start,]
|
667
|
-
if show_context
|
668
|
-
interesting_line = find_interesting_line(first_from_start,
|
669
|
-
first_to_start,
|
670
|
-
:define_line?)
|
671
|
-
summary << " #{interesting_line}" if interesting_line
|
672
|
-
end
|
673
|
-
summary
|
674
|
-
end
|
675
|
-
|
676
|
-
def find_interesting_line(from_start, to_start, predicate)
|
677
|
-
from_index = from_start
|
678
|
-
to_index = to_start
|
679
|
-
while from_index >= 0 or to_index >= 0
|
680
|
-
[@from[from_index], @to[to_index]].each do |line|
|
681
|
-
return line if line and send(predicate, line)
|
682
|
-
end
|
683
|
-
|
684
|
-
from_index -= 1
|
685
|
-
to_index -= 1
|
686
|
-
end
|
687
|
-
nil
|
688
|
-
end
|
689
|
-
|
690
|
-
def define_line?(line)
|
691
|
-
/\A(?:[_a-zA-Z$]|\s*(?:class|module|def)\b)/ =~ line
|
692
|
-
end
|
693
|
-
end
|
694
|
-
|
695
|
-
module_function
|
696
|
-
def need_fold?(diff)
|
697
|
-
/^[-+].{79}/ =~ diff
|
698
|
-
end
|
699
|
-
|
700
|
-
def fold(string)
|
701
|
-
string.split(/\r?\n/).collect do |line|
|
702
|
-
line.gsub(/(.{78})/, "\\1\n")
|
703
|
-
end.join("\n")
|
704
|
-
end
|
705
|
-
|
706
|
-
def folded_readable(from, to, options={})
|
707
|
-
readable(fold(from), fold(to), options)
|
708
|
-
end
|
709
|
-
|
710
|
-
def readable(from, to, options={})
|
711
|
-
diff(ReadableDiffer, from, to, options)
|
712
|
-
end
|
713
|
-
|
714
|
-
def unified(from, to, options={})
|
715
|
-
diff(UnifiedDiffer, from, to, options)
|
716
|
-
end
|
717
|
-
|
718
|
-
def diff(differ_class, from, to, options={})
|
719
|
-
differ = differ_class.new(from.split(/\r?\n/), to.split(/\r?\n/))
|
720
|
-
differ.diff(options).join("\n")
|
721
|
-
end
|
722
|
-
end
|
723
|
-
end
|
724
|
-
end
|