diff-lcs 1.1.3 → 1.2.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- data/.autotest +3 -0
- data/.rspec +2 -0
- data/.travis.yml +21 -0
- data/Contributing.rdoc +63 -0
- data/Gemfile +20 -0
- data/History.rdoc +37 -1
- data/Manifest.txt +10 -1
- data/README.rdoc +48 -23
- data/Rakefile +17 -3
- data/autotest/discover.rb +1 -0
- data/diff-lcs.gemspec +41 -29
- data/docs/COPYING.txt +21 -22
- data/docs/artistic.txt +127 -0
- data/lib/diff-lcs.rb +0 -2
- data/lib/diff/lcs.rb +654 -954
- data/lib/diff/lcs/array.rb +1 -15
- data/lib/diff/lcs/block.rb +4 -18
- data/lib/diff/lcs/callbacks.rb +222 -222
- data/lib/diff/lcs/change.rb +110 -102
- data/lib/diff/lcs/htmldiff.rb +0 -2
- data/lib/diff/lcs/hunk.rb +65 -56
- data/lib/diff/lcs/internals.rb +300 -0
- data/lib/diff/lcs/ldiff.rb +154 -169
- data/lib/diff/lcs/string.rb +1 -15
- data/spec/change_spec.rb +65 -0
- data/spec/diff_spec.rb +8 -2
- data/spec/issues_spec.rb +24 -0
- data/spec/lcs_spec.rb +23 -5
- data/spec/patch_spec.rb +51 -27
- data/spec/sdiff_spec.rb +0 -2
- data/spec/spec_helper.rb +9 -3
- data/spec/traverse_balanced_spec.rb +26 -2
- data/spec/traverse_sequences_spec.rb +84 -28
- metadata +219 -83
- data/docs/artistic.html +0 -289
data/docs/artistic.txt
ADDED
@@ -0,0 +1,127 @@
|
|
1
|
+
The "Artistic License"
|
2
|
+
|
3
|
+
Preamble
|
4
|
+
|
5
|
+
The intent of this document is to state the conditions under which a
|
6
|
+
Package may be copied, such that the Copyright Holder maintains some
|
7
|
+
semblance of artistic control over the development of the package,
|
8
|
+
while giving the users of the package the right to use and distribute
|
9
|
+
the Package in a more-or-less customary fashion, plus the right to make
|
10
|
+
reasonable modifications.
|
11
|
+
|
12
|
+
Definitions:
|
13
|
+
|
14
|
+
"Package" refers to the collection of files distributed by the
|
15
|
+
Copyright Holder, and derivatives of that collection of files
|
16
|
+
created through textual modification.
|
17
|
+
|
18
|
+
"Standard Version" refers to such a Package if it has not been
|
19
|
+
modified, or has been modified in accordance with the wishes
|
20
|
+
of the Copyright Holder as specified below.
|
21
|
+
|
22
|
+
"Copyright Holder" is whoever is named in the copyright or
|
23
|
+
copyrights for the package.
|
24
|
+
|
25
|
+
"You" is you, if you're thinking about copying or distributing
|
26
|
+
this Package.
|
27
|
+
|
28
|
+
"Reasonable copying fee" is whatever you can justify on the
|
29
|
+
basis of media cost, duplication charges, time of people involved,
|
30
|
+
and so on. (You will not be required to justify it to the
|
31
|
+
Copyright Holder, but only to the computing community at large
|
32
|
+
as a market that must bear the fee.)
|
33
|
+
|
34
|
+
"Freely Available" means that no fee is charged for the item
|
35
|
+
itself, though there may be fees involved in handling the item.
|
36
|
+
It also means that recipients of the item may redistribute it
|
37
|
+
under the same conditions they received it.
|
38
|
+
|
39
|
+
1. You may make and give away verbatim copies of the source form of the
|
40
|
+
Standard Version of this Package without restriction, provided that you
|
41
|
+
duplicate all of the original copyright notices and associated disclaimers.
|
42
|
+
|
43
|
+
2. You may apply bug fixes, portability fixes and other modifications
|
44
|
+
derived from the Public Domain or from the Copyright Holder. A Package
|
45
|
+
modified in such a way shall still be considered the Standard Version.
|
46
|
+
|
47
|
+
3. You may otherwise modify your copy of this Package in any way, provided
|
48
|
+
that you insert a prominent notice in each changed file stating how and
|
49
|
+
when you changed that file, and provided that you do at least ONE of the
|
50
|
+
following:
|
51
|
+
|
52
|
+
a) place your modifications in the Public Domain or otherwise make them
|
53
|
+
Freely Available, such as by posting said modifications to Usenet or
|
54
|
+
an equivalent medium, or placing the modifications on a major archive
|
55
|
+
site such as uunet.uu.net, or by allowing the Copyright Holder to include
|
56
|
+
your modifications in the Standard Version of the Package.
|
57
|
+
|
58
|
+
b) use the modified Package only within your corporation or organization.
|
59
|
+
|
60
|
+
c) rename any non-standard executables so the names do not conflict
|
61
|
+
with standard executables, which must also be provided, and provide
|
62
|
+
a separate manual page for each non-standard executable that clearly
|
63
|
+
documents how it differs from the Standard Version.
|
64
|
+
|
65
|
+
d) make other distribution arrangements with the Copyright Holder.
|
66
|
+
|
67
|
+
4. You may distribute the programs of this Package in object code or
|
68
|
+
executable form, provided that you do at least ONE of the following:
|
69
|
+
|
70
|
+
a) distribute a Standard Version of the executables and library files,
|
71
|
+
together with instructions (in the manual page or equivalent) on where
|
72
|
+
to get the Standard Version.
|
73
|
+
|
74
|
+
b) accompany the distribution with the machine-readable source of
|
75
|
+
the Package with your modifications.
|
76
|
+
|
77
|
+
c) give non-standard executables non-standard names, and clearly
|
78
|
+
document the differences in manual pages (or equivalent), together
|
79
|
+
with instructions on where to get the Standard Version.
|
80
|
+
|
81
|
+
d) make other distribution arrangements with the Copyright Holder.
|
82
|
+
|
83
|
+
5. You may charge a reasonable copying fee for any distribution of this
|
84
|
+
Package. You may charge any fee you choose for support of this
|
85
|
+
Package. You may not charge a fee for this Package itself. However,
|
86
|
+
you may distribute this Package in aggregate with other (possibly
|
87
|
+
commercial) programs as part of a larger (possibly commercial) software
|
88
|
+
distribution provided that you do not advertise this Package as a
|
89
|
+
product of your own. You may embed this Package's interpreter within
|
90
|
+
an executable of yours (by linking); this shall be construed as a mere
|
91
|
+
form of aggregation, provided that the complete Standard Version of the
|
92
|
+
interpreter is so embedded.
|
93
|
+
|
94
|
+
6. The scripts and library files supplied as input to or produced as
|
95
|
+
output from the programs of this Package do not automatically fall
|
96
|
+
under the copyright of this Package, but belong to whoever generated
|
97
|
+
them, and may be sold commercially, and may be aggregated with this
|
98
|
+
Package. If such scripts or library files are aggregated with this
|
99
|
+
Package via the so-called "undump" or "unexec" methods of producing a
|
100
|
+
binary executable image, then distribution of such an image shall
|
101
|
+
neither be construed as a distribution of this Package nor shall it
|
102
|
+
fall under the restrictions of Paragraphs 3 and 4, provided that you do
|
103
|
+
not represent such an executable image as a Standard Version of this
|
104
|
+
Package.
|
105
|
+
|
106
|
+
7. C subroutines (or comparably compiled subroutines in other
|
107
|
+
languages) supplied by you and linked into this Package in order to
|
108
|
+
emulate subroutines and variables of the language defined by this
|
109
|
+
Package shall not be considered part of this Package, but are the
|
110
|
+
equivalent of input as in Paragraph 6, provided these subroutines do
|
111
|
+
not change the language in any way that would cause it to fail the
|
112
|
+
regression tests for the language.
|
113
|
+
|
114
|
+
8. Aggregation of this Package with a commercial distribution is always
|
115
|
+
permitted provided that the use of this Package is embedded; that is,
|
116
|
+
when no overt attempt is made to make this Package's interfaces visible
|
117
|
+
to the end user of the commercial distribution. Such use shall not be
|
118
|
+
construed as a distribution of this Package.
|
119
|
+
|
120
|
+
9. The name of the Copyright Holder may not be used to endorse or promote
|
121
|
+
products derived from this software without specific prior written permission.
|
122
|
+
|
123
|
+
10. THIS PACKAGE IS PROVIDED "AS IS" AND WITHOUT ANY EXPRESS OR
|
124
|
+
IMPLIED WARRANTIES, INCLUDING, WITHOUT LIMITATION, THE IMPLIED
|
125
|
+
WARRANTIES OF MERCHANTIBILITY AND FITNESS FOR A PARTICULAR PURPOSE.
|
126
|
+
|
127
|
+
The End
|
data/lib/diff-lcs.rb
CHANGED
data/lib/diff/lcs.rb
CHANGED
@@ -1,166 +1,166 @@
|
|
1
1
|
# -*- ruby encoding: utf-8 -*-
|
2
2
|
|
3
|
-
module Diff
|
4
|
-
|
5
|
-
|
6
|
-
|
7
|
-
|
8
|
-
|
9
|
-
|
10
|
-
|
11
|
-
|
12
|
-
|
13
|
-
|
14
|
-
|
15
|
-
|
16
|
-
|
17
|
-
|
18
|
-
|
19
|
-
|
20
|
-
|
21
|
-
|
22
|
-
|
23
|
-
|
24
|
-
|
25
|
-
|
26
|
-
|
27
|
-
|
28
|
-
|
29
|
-
|
30
|
-
|
31
|
-
|
32
|
-
|
33
|
-
|
34
|
-
|
35
|
-
|
36
|
-
|
37
|
-
|
38
|
-
|
39
|
-
|
40
|
-
|
41
|
-
|
42
|
-
|
43
|
-
|
44
|
-
|
45
|
-
|
46
|
-
|
47
|
-
|
48
|
-
|
49
|
-
|
50
|
-
|
51
|
-
|
52
|
-
|
53
|
-
|
54
|
-
|
55
|
-
|
56
|
-
|
57
|
-
|
58
|
-
|
59
|
-
|
60
|
-
|
61
|
-
|
62
|
-
|
63
|
-
|
64
|
-
|
65
|
-
|
66
|
-
|
67
|
-
|
68
|
-
|
69
|
-
|
70
|
-
|
71
|
-
|
72
|
-
|
73
|
-
|
74
|
-
|
75
|
-
|
76
|
-
|
77
|
-
|
78
|
-
|
79
|
-
|
80
|
-
|
81
|
-
|
82
|
-
|
83
|
-
|
84
|
-
|
85
|
-
|
86
|
-
|
87
|
-
|
88
|
-
|
89
|
-
|
90
|
-
|
91
|
-
|
92
|
-
|
93
|
-
|
94
|
-
|
95
|
-
|
96
|
-
|
97
|
-
|
98
|
-
|
99
|
-
|
100
|
-
|
101
|
-
|
102
|
-
|
103
|
-
|
104
|
-
|
105
|
-
|
106
|
-
|
107
|
-
|
108
|
-
|
109
|
-
|
110
|
-
|
111
|
-
|
112
|
-
|
113
|
-
|
114
|
-
|
115
|
-
|
116
|
-
|
117
|
-
|
118
|
-
|
119
|
-
|
120
|
-
|
121
|
-
|
122
|
-
|
123
|
-
|
124
|
-
|
125
|
-
|
126
|
-
|
127
|
-
|
128
|
-
|
129
|
-
|
130
|
-
|
131
|
-
|
132
|
-
|
133
|
-
end
|
3
|
+
module Diff; end unless defined? Diff
|
4
|
+
# = Diff::LCS 1.2.0
|
5
|
+
#
|
6
|
+
# Computes "intelligent" differences between two sequenced Enumerables. This
|
7
|
+
# is an implementation of the McIlroy-Hunt "diff" algorithm for Enumerable
|
8
|
+
# objects that include Diffable.
|
9
|
+
#
|
10
|
+
# Based on Mario I. Wolczko's Smalltalk version (1.2, 1993) and Ned Konz's
|
11
|
+
# Perl version (Algorithm::Diff 1.15).
|
12
|
+
#
|
13
|
+
# == Synopsis
|
14
|
+
# require 'diff/lcs'
|
15
|
+
#
|
16
|
+
# seq1 = %w(a b c e h j l m n p)
|
17
|
+
# seq2 = %w(b c d e f j k l m r s t)
|
18
|
+
#
|
19
|
+
# lcs = Diff::LCS.lcs(seq1, seq2)
|
20
|
+
# diffs = Diff::LCS.diff(seq1, seq2)
|
21
|
+
# sdiff = Diff::LCS.sdiff(seq1, seq2)
|
22
|
+
# seq = Diff::LCS.traverse_sequences(seq1, seq2, callback_obj)
|
23
|
+
# bal = Diff::LCS.traverse_balanced(seq1, seq2, callback_obj)
|
24
|
+
# seq2 == Diff::LCS.patch(seq1, diffs)
|
25
|
+
# seq2 == Diff::LCS.patch!(seq1, diffs)
|
26
|
+
# seq1 == Diff::LCS.unpatch(seq2, diffs)
|
27
|
+
# seq1 == Diff::LCS.unpatch!(seq2, diffs)
|
28
|
+
# seq2 == Diff::LCS.patch(seq1, sdiff)
|
29
|
+
# seq2 == Diff::LCS.patch!(seq1, sdiff)
|
30
|
+
# seq1 == Diff::LCS.unpatch(seq2, sdiff)
|
31
|
+
# seq1 == Diff::LCS.unpatch!(seq2, sdiff)
|
32
|
+
#
|
33
|
+
# Alternatively, objects can be extended with Diff::LCS:
|
34
|
+
#
|
35
|
+
# seq1.extend(Diff::LCS)
|
36
|
+
# lcs = seq1.lcs(seq2)
|
37
|
+
# diffs = seq1.diff(seq2)
|
38
|
+
# sdiff = seq1.sdiff(seq2)
|
39
|
+
# seq = seq1.traverse_sequences(seq2, callback_obj)
|
40
|
+
# bal = seq1.traverse_balanced(seq2, callback_obj)
|
41
|
+
# seq2 == seq1.patch(diffs)
|
42
|
+
# seq2 == seq1.patch!(diffs)
|
43
|
+
# seq1 == seq2.unpatch(diffs)
|
44
|
+
# seq1 == seq2.unpatch!(diffs)
|
45
|
+
# seq2 == seq1.patch(sdiff)
|
46
|
+
# seq2 == seq1.patch!(sdiff)
|
47
|
+
# seq1 == seq2.unpatch(sdiff)
|
48
|
+
# seq1 == seq2.unpatch!(sdiff)
|
49
|
+
#
|
50
|
+
# Default extensions are provided for Array and String objects through the
|
51
|
+
# use of 'diff/lcs/array' and 'diff/lcs/string'.
|
52
|
+
#
|
53
|
+
# == Introduction (by Mark-Jason Dominus)
|
54
|
+
#
|
55
|
+
# <em>The following text is from the Perl documentation. The only changes
|
56
|
+
# have been to make the text appear better in Rdoc</em>.
|
57
|
+
#
|
58
|
+
# I once read an article written by the authors of +diff+; they said that
|
59
|
+
# they hard worked very hard on the algorithm until they found the right
|
60
|
+
# one.
|
61
|
+
#
|
62
|
+
# I think what they ended up using (and I hope someone will correct me,
|
63
|
+
# because I am not very confident about this) was the `longest common
|
64
|
+
# subsequence' method. In the LCS problem, you have two sequences of items:
|
65
|
+
#
|
66
|
+
# a b c d f g h j q z
|
67
|
+
# a b c d e f g i j k r x y z
|
68
|
+
#
|
69
|
+
# and you want to find the longest sequence of items that is present in both
|
70
|
+
# original sequences in the same order. That is, you want to find a new
|
71
|
+
# sequence *S* which can be obtained from the first sequence by deleting
|
72
|
+
# some items, and from the second sequence by deleting other items. You also
|
73
|
+
# want *S* to be as long as possible. In this case *S* is:
|
74
|
+
#
|
75
|
+
# a b c d f g j z
|
76
|
+
#
|
77
|
+
# From there it's only a small step to get diff-like output:
|
78
|
+
#
|
79
|
+
# e h i k q r x y
|
80
|
+
# + - + + - + + +
|
81
|
+
#
|
82
|
+
# This module solves the LCS problem. It also includes a canned function to
|
83
|
+
# generate +diff+-like output.
|
84
|
+
#
|
85
|
+
# It might seem from the example above that the LCS of two sequences is
|
86
|
+
# always pretty obvious, but that's not always the case, especially when the
|
87
|
+
# two sequences have many repeated elements. For example, consider
|
88
|
+
#
|
89
|
+
# a x b y c z p d q
|
90
|
+
# a b c a x b y c z
|
91
|
+
#
|
92
|
+
# A naive approach might start by matching up the +a+ and +b+ that appear at
|
93
|
+
# the beginning of each sequence, like this:
|
94
|
+
#
|
95
|
+
# a x b y c z p d q
|
96
|
+
# a b c a b y c z
|
97
|
+
#
|
98
|
+
# This finds the common subsequence +a b c z+. But actually, the LCS is +a x
|
99
|
+
# b y c z+:
|
100
|
+
#
|
101
|
+
# a x b y c z p d q
|
102
|
+
# a b c a x b y c z
|
103
|
+
#
|
104
|
+
# == Author
|
105
|
+
# This version is by Austin Ziegler <austin@rubyforge.org>.
|
106
|
+
#
|
107
|
+
# It is based on the Perl Algorithm::Diff (1.15) by Ned Konz , copyright
|
108
|
+
# © 2000–2002 and the Smalltalk diff version by Mario I.
|
109
|
+
# Wolczko, copyright © 1993. Documentation includes work by
|
110
|
+
# Mark-Jason Dominus.
|
111
|
+
#
|
112
|
+
# == Licence
|
113
|
+
# Copyright © 2004–2013 Austin Ziegler
|
114
|
+
# This program is free software; you can redistribute it and/or modify it
|
115
|
+
# under the same terms as Ruby, or alternatively under the Perl Artistic
|
116
|
+
# licence.
|
117
|
+
#
|
118
|
+
# == Credits
|
119
|
+
# Much of the documentation is taken directly from the Perl Algorithm::Diff
|
120
|
+
# implementation and was written originally by Mark-Jason Dominus and later
|
121
|
+
# by Ned Konz. The basic Ruby implementation was re-ported from the
|
122
|
+
# Smalltalk implementation, available at
|
123
|
+
# ftp://st.cs.uiuc.edu/pub/Smalltalk/MANCHESTER/manchester/4.0/diff.st
|
124
|
+
#
|
125
|
+
# #sdiff and #traverse_balanced were written for the Perl version by Mike
|
126
|
+
# Schilli <m@perlmeister.com>.
|
127
|
+
#
|
128
|
+
# "The algorithm is described in <em>A Fast Algorithm for Computing Longest
|
129
|
+
# Common Subsequences</em>, CACM, vol.20, no.5, pp.350-353, May
|
130
|
+
# 1977, with a few minor improvements to improve the speed."
|
131
|
+
module Diff::LCS
|
132
|
+
VERSION = '1.2.0'
|
134
133
|
end
|
135
134
|
|
136
135
|
require 'diff/lcs/callbacks'
|
136
|
+
require 'diff/lcs/internals'
|
137
137
|
|
138
138
|
module Diff::LCS
|
139
139
|
# Returns an Array containing the longest common subsequence(s) between
|
140
140
|
# +self+ and +other+. See Diff::LCS#LCS.
|
141
141
|
#
|
142
142
|
# lcs = seq1.lcs(seq2)
|
143
|
-
def lcs(other, &block) #:yields self[
|
144
|
-
Diff::LCS.
|
143
|
+
def lcs(other, &block) #:yields self[i] if there are matched subsequences:
|
144
|
+
Diff::LCS.lcs(self, other, &block)
|
145
145
|
end
|
146
146
|
|
147
147
|
# Returns the difference set between +self+ and +other+. See
|
148
148
|
# Diff::LCS#diff.
|
149
149
|
def diff(other, callbacks = nil, &block)
|
150
|
-
Diff::LCS
|
150
|
+
Diff::LCS.diff(self, other, callbacks, &block)
|
151
151
|
end
|
152
152
|
|
153
153
|
# Returns the balanced ("side-by-side") difference set between +self+ and
|
154
154
|
# +other+. See Diff::LCS#sdiff.
|
155
155
|
def sdiff(other, callbacks = nil, &block)
|
156
|
-
Diff::LCS
|
156
|
+
Diff::LCS.sdiff(self, other, callbacks, &block)
|
157
157
|
end
|
158
158
|
|
159
159
|
# Traverses the discovered longest common subsequences between +self+ and
|
160
160
|
# +other+. See Diff::LCS#traverse_sequences.
|
161
161
|
def traverse_sequences(other, callbacks = nil, &block)
|
162
162
|
traverse_sequences(self, other, callbacks ||
|
163
|
-
Diff::LCS
|
163
|
+
Diff::LCS.YieldingCallbacks, &block)
|
164
164
|
end
|
165
165
|
|
166
166
|
# Traverses the discovered longest common subsequences between +self+ and
|
@@ -168,477 +168,401 @@ module Diff::LCS
|
|
168
168
|
# Diff::LCS#traverse_balanced.
|
169
169
|
def traverse_balanced(other, callbacks = nil, &block)
|
170
170
|
traverse_balanced(self, other, callbacks ||
|
171
|
-
Diff::LCS
|
171
|
+
Diff::LCS.YieldingCallbacks, &block)
|
172
172
|
end
|
173
173
|
|
174
|
-
# Attempts to patch
|
175
|
-
# Diff::LCS#patch.
|
174
|
+
# Attempts to patch +self+ with the provided +patchset+. A new sequence
|
175
|
+
# based on +self+ and the +patchset+ will be created. See Diff::LCS#patch.
|
176
|
+
# Attempts to autodiscover the direction of the patch.
|
176
177
|
def patch(patchset)
|
177
|
-
Diff::LCS
|
178
|
+
Diff::LCS.patch(self, patchset)
|
178
179
|
end
|
180
|
+
alias_method :unpatch, :patch
|
179
181
|
|
180
|
-
# Attempts to
|
181
|
-
# Diff::LCS#patch.
|
182
|
-
|
183
|
-
Diff::LCS::unpatch(self.dup, patchset)
|
184
|
-
end
|
185
|
-
|
186
|
-
# Attempts to patch +self+ with the provided +patchset+. See
|
187
|
-
# Diff::LCS#patch!. Does no autodiscovery.
|
182
|
+
# Attempts to patch +self+ with the provided +patchset+. A new sequence
|
183
|
+
# based on +self+ and the +patchset+ will be created. See Diff::LCS#patch.
|
184
|
+
# Does no patch direction autodiscovery.
|
188
185
|
def patch!(patchset)
|
189
|
-
Diff::LCS
|
186
|
+
Diff::LCS.patch!(self, patchset)
|
190
187
|
end
|
191
188
|
|
192
|
-
# Attempts to unpatch +self+ with the provided +patchset+.
|
193
|
-
# Diff::LCS#unpatch.
|
189
|
+
# Attempts to unpatch +self+ with the provided +patchset+. A new sequence
|
190
|
+
# based on +self+ and the +patchset+ will be created. See Diff::LCS#unpatch.
|
191
|
+
# Does no patch direction autodiscovery.
|
194
192
|
def unpatch!(patchset)
|
195
|
-
Diff::LCS
|
193
|
+
Diff::LCS.unpatch!(self, patchset)
|
196
194
|
end
|
197
|
-
end
|
198
195
|
|
199
|
-
|
200
|
-
|
201
|
-
|
202
|
-
|
203
|
-
|
204
|
-
|
205
|
-
|
206
|
-
|
207
|
-
#
|
208
|
-
# lcs.each_with_index do |ee, ii|
|
209
|
-
# assert(ee.nil? || (seq1[ii] == seq2[ee]))
|
210
|
-
# end
|
211
|
-
#
|
212
|
-
# If a block is provided, the matching subsequences will be yielded from
|
213
|
-
# +seq1+ in turn and may be modified before they are placed into the
|
214
|
-
# returned Array of subsequences.
|
215
|
-
def LCS(seq1, seq2, &block) #:yields seq1[ii] for each matched:
|
216
|
-
matches = Diff::LCS.__lcs(seq1, seq2)
|
217
|
-
ret = []
|
218
|
-
matches.each_with_index do |ee, ii|
|
219
|
-
unless matches[ii].nil?
|
220
|
-
if block_given?
|
221
|
-
ret << (yield seq1[ii])
|
222
|
-
else
|
223
|
-
ret << seq1[ii]
|
224
|
-
end
|
225
|
-
end
|
226
|
-
end
|
227
|
-
ret
|
196
|
+
# Attempts to patch +self+ with the provided +patchset+, using #patch!. If
|
197
|
+
# the sequence this is used on supports #replace, the value of +self+ will
|
198
|
+
# be replaced. See Diff::LCS#patch. Does no patch direction autodiscovery.
|
199
|
+
def patch_me(patchset)
|
200
|
+
if respond_to? :replace
|
201
|
+
replace(patch!(patchset))
|
202
|
+
else
|
203
|
+
patch!(patchset)
|
228
204
|
end
|
205
|
+
end
|
229
206
|
|
230
|
-
|
231
|
-
|
232
|
-
|
233
|
-
|
234
|
-
|
235
|
-
|
236
|
-
|
237
|
-
|
238
|
-
|
239
|
-
|
240
|
-
|
241
|
-
|
242
|
-
cb = callbacks.new rescue callbacks
|
243
|
-
callbacks = cb
|
244
|
-
end
|
245
|
-
traverse_sequences(seq1, seq2, callbacks)
|
246
|
-
callbacks.finish if callbacks.respond_to?(:finish)
|
207
|
+
# Attempts to unpatch +self+ with the provided +patchset+, using
|
208
|
+
# #unpatch!. If the sequence this is used on supports #replace, the value
|
209
|
+
# of +self+ will be replaced. See Diff::LCS#unpatch. Does no patch direction
|
210
|
+
# autodiscovery.
|
211
|
+
def unpatch_me(patchset)
|
212
|
+
if respond_to? :replace
|
213
|
+
replace(unpatch!(patchset))
|
214
|
+
else
|
215
|
+
unpatch!(patchset)
|
216
|
+
end
|
217
|
+
end
|
218
|
+
end
|
247
219
|
|
248
|
-
|
249
|
-
|
250
|
-
|
251
|
-
|
252
|
-
|
253
|
-
|
254
|
-
|
255
|
-
|
256
|
-
|
257
|
-
|
258
|
-
callbacks.diffs
|
220
|
+
class << Diff::LCS
|
221
|
+
def lcs(seq1, seq2, &block) #:yields seq1[i] for each matched:
|
222
|
+
matches = Diff::LCS::Internals.lcs(seq1, seq2)
|
223
|
+
ret = []
|
224
|
+
string = seq1.kind_of? String
|
225
|
+
matches.each_with_index do |e, i|
|
226
|
+
unless matches[i].nil?
|
227
|
+
v = string ? seq1[i, 1] : seq1[i]
|
228
|
+
v = block[v] if block
|
229
|
+
ret << v
|
259
230
|
end
|
260
231
|
end
|
232
|
+
ret
|
233
|
+
end
|
234
|
+
alias_method :LCS, :lcs
|
261
235
|
|
262
|
-
|
263
|
-
|
264
|
-
|
265
|
-
|
266
|
-
|
267
|
-
|
268
|
-
|
269
|
-
|
270
|
-
|
271
|
-
|
272
|
-
|
273
|
-
|
274
|
-
|
275
|
-
# responds to #finish, it will be called.
|
276
|
-
def sdiff(seq1, seq2, callbacks = nil, &block) #:yields diff changes:
|
277
|
-
callbacks ||= Diff::LCS::SDiffCallbacks
|
278
|
-
if callbacks.kind_of?(Class)
|
279
|
-
cb = callbacks.new rescue callbacks
|
280
|
-
callbacks = cb
|
281
|
-
end
|
282
|
-
traverse_balanced(seq1, seq2, callbacks)
|
283
|
-
callbacks.finish if callbacks.respond_to?(:finish)
|
236
|
+
# #diff computes the smallest set of additions and deletions necessary to
|
237
|
+
# turn the first sequence into the second, and returns a description of
|
238
|
+
# these changes.
|
239
|
+
#
|
240
|
+
# See Diff::LCS::DiffCallbacks for the default behaviour. An alternate
|
241
|
+
# behaviour may be implemented with Diff::LCS::ContextDiffCallbacks. If a
|
242
|
+
# Class argument is provided for +callbacks+, #diff will attempt to
|
243
|
+
# initialise it. If the +callbacks+ object (possibly initialised) responds
|
244
|
+
# to #finish, it will be called.
|
245
|
+
def diff(seq1, seq2, callbacks = nil, &block) # :yields diff changes:
|
246
|
+
diff_traversal(:diff, seq1, seq2, callbacks || Diff::LCS::DiffCallbacks,
|
247
|
+
&block)
|
248
|
+
end
|
284
249
|
|
285
|
-
|
286
|
-
|
287
|
-
|
288
|
-
|
289
|
-
|
290
|
-
|
291
|
-
|
250
|
+
# #sdiff computes all necessary components to show two sequences and their
|
251
|
+
# minimized differences side by side, just like the Unix utility
|
252
|
+
# <em>sdiff</em> does:
|
253
|
+
#
|
254
|
+
# old < -
|
255
|
+
# same same
|
256
|
+
# before | after
|
257
|
+
# - > new
|
258
|
+
#
|
259
|
+
# See Diff::LCS::SDiffCallbacks for the default behaviour. An alternate
|
260
|
+
# behaviour may be implemented with Diff::LCS::ContextDiffCallbacks. If a
|
261
|
+
# Class argument is provided for +callbacks+, #diff will attempt to
|
262
|
+
# initialise it. If the +callbacks+ object (possibly initialised) responds
|
263
|
+
# to #finish, it will be called.
|
264
|
+
def sdiff(seq1, seq2, callbacks = nil, &block) #:yields diff changes:
|
265
|
+
diff_traversal(:sdiff, seq1, seq2, callbacks || Diff::LCS::SDiffCallbacks,
|
266
|
+
&block)
|
267
|
+
end
|
268
|
+
|
269
|
+
# #traverse_sequences is the most general facility provided by this
|
270
|
+
# module; #diff and #lcs are implemented as calls to it.
|
271
|
+
#
|
272
|
+
# The arguments to #traverse_sequences are the two sequences to traverse,
|
273
|
+
# and a callback object, like this:
|
274
|
+
#
|
275
|
+
# traverse_sequences(seq1, seq2, Diff::LCS::ContextDiffCallbacks.new)
|
276
|
+
#
|
277
|
+
# == Callback Methods
|
278
|
+
#
|
279
|
+
# Optional callback methods are <em>emphasized</em>.
|
280
|
+
#
|
281
|
+
# callbacks#match:: Called when +a+ and +b+ are pointing to
|
282
|
+
# common elements in +A+ and +B+.
|
283
|
+
# callbacks#discard_a:: Called when +a+ is pointing to an
|
284
|
+
# element not in +B+.
|
285
|
+
# callbacks#discard_b:: Called when +b+ is pointing to an
|
286
|
+
# element not in +A+.
|
287
|
+
# <em>callbacks#finished_a</em>:: Called when +a+ has reached the end of
|
288
|
+
# sequence +A+.
|
289
|
+
# <em>callbacks#finished_b</em>:: Called when +b+ has reached the end of
|
290
|
+
# sequence +B+.
|
291
|
+
#
|
292
|
+
# == Algorithm
|
293
|
+
#
|
294
|
+
# a---+
|
295
|
+
# v
|
296
|
+
# A = a b c e h j l m n p
|
297
|
+
# B = b c d e f j k l m r s t
|
298
|
+
# ^
|
299
|
+
# b---+
|
300
|
+
#
|
301
|
+
# If there are two arrows (+a+ and +b+) pointing to elements of sequences
|
302
|
+
# +A+ and +B+, the arrows will initially point to the first elements of
|
303
|
+
# their respective sequences. #traverse_sequences will advance the arrows
|
304
|
+
# through the sequences one element at a time, calling a method on the
|
305
|
+
# user-specified callback object before each advance. It will advance the
|
306
|
+
# arrows in such a way that if there are elements <tt>A[i]</tt> and
|
307
|
+
# <tt>B[j]</tt> which are both equal and part of the longest common
|
308
|
+
# subsequence, there will be some moment during the execution of
|
309
|
+
# #traverse_sequences when arrow +a+ is pointing to <tt>A[i]</tt> and
|
310
|
+
# arrow +b+ is pointing to <tt>B[j]</tt>. When this happens,
|
311
|
+
# #traverse_sequences will call <tt>callbacks#match</tt> and then it will
|
312
|
+
# advance both arrows.
|
313
|
+
#
|
314
|
+
# Otherwise, one of the arrows is pointing to an element of its sequence
|
315
|
+
# that is not part of the longest common subsequence. #traverse_sequences
|
316
|
+
# will advance that arrow and will call <tt>callbacks#discard_a</tt> or
|
317
|
+
# <tt>callbacks#discard_b</tt>, depending on which arrow it advanced. If
|
318
|
+
# both arrows point to elements that are not part of the longest common
|
319
|
+
# subsequence, then #traverse_sequences will advance one of them and call
|
320
|
+
# the appropriate callback, but it is not specified which it will call.
|
321
|
+
#
|
322
|
+
# The methods for <tt>callbacks#match</tt>, <tt>callbacks#discard_a</tt>,
|
323
|
+
# and <tt>callbacks#discard_b</tt> are invoked with an event comprising
|
324
|
+
# the action ("=", "+", or "-", respectively), the indicies +i+ and +j+,
|
325
|
+
# and the elements <tt>A[i]</tt> and <tt>B[j]</tt>. Return values are
|
326
|
+
# discarded by #traverse_sequences.
|
327
|
+
#
|
328
|
+
# === End of Sequences
|
329
|
+
#
|
330
|
+
# If arrow +a+ reaches the end of its sequence before arrow +b+ does,
|
331
|
+
# #traverse_sequence will try to call <tt>callbacks#finished_a</tt> with
|
332
|
+
# the last index and element of +A+ (<tt>A[-1]</tt>) and the current index
|
333
|
+
# and element of +B+ (<tt>B[j]</tt>). If <tt>callbacks#finished_a</tt>
|
334
|
+
# does not exist, then <tt>callbacks#discard_b</tt> will be called on each
|
335
|
+
# element of +B+ until the end of the sequence is reached (the call will
|
336
|
+
# be done with <tt>A[-1]</tt> and <tt>B[j]</tt> for each element).
|
337
|
+
#
|
338
|
+
# If +b+ reaches the end of +B+ before +a+ reaches the end of +A+,
|
339
|
+
# <tt>callbacks#finished_b</tt> will be called with the current index and
|
340
|
+
# element of +A+ (<tt>A[i]</tt>) and the last index and element of +B+
|
341
|
+
# (<tt>A[-1]</tt>). Again, if <tt>callbacks#finished_b</tt> does not exist
|
342
|
+
# on the callback object, then <tt>callbacks#discard_a</tt> will be called
|
343
|
+
# on each element of +A+ until the end of the sequence is reached
|
344
|
+
# (<tt>A[i]</tt> and <tt>B[-1]</tt>).
|
345
|
+
#
|
346
|
+
# There is a chance that one additional <tt>callbacks#discard_a</tt> or
|
347
|
+
# <tt>callbacks#discard_b</tt> will be called after the end of the
|
348
|
+
# sequence is reached, if +a+ has not yet reached the end of +A+ or +b+
|
349
|
+
# has not yet reached the end of +B+.
|
350
|
+
def traverse_sequences(seq1, seq2, callbacks = Diff::LCS::SequenceCallbacks, &block) #:yields change events:
|
351
|
+
callbacks ||= Diff::LCS::SequenceCallbacks
|
352
|
+
matches = Diff::LCS::Internals.lcs(seq1, seq2)
|
353
|
+
|
354
|
+
run_finished_a = run_finished_b = false
|
355
|
+
string = seq1.kind_of?(String)
|
356
|
+
|
357
|
+
a_size = seq1.size
|
358
|
+
b_size = seq2.size
|
359
|
+
ai = bj = 0
|
360
|
+
|
361
|
+
(0..matches.size).each do |i|
|
362
|
+
b_line = matches[i]
|
363
|
+
|
364
|
+
ax = string ? seq1[i, 1] : seq1[i]
|
365
|
+
bx = string ? seq2[bj, 1] : seq2[bj]
|
366
|
+
|
367
|
+
if b_line.nil?
|
368
|
+
unless ax.nil? or (string and ax.empty?)
|
369
|
+
event = Diff::LCS::ContextChange.new('-', i, ax, bj, bx)
|
370
|
+
event = yield event if block_given?
|
371
|
+
callbacks.discard_a(event)
|
292
372
|
end
|
293
|
-
res
|
294
373
|
else
|
295
|
-
|
374
|
+
loop do
|
375
|
+
break unless bj < b_line
|
376
|
+
bx = string ? seq2[bj, 1] : seq2[bj]
|
377
|
+
event = Diff::LCS::ContextChange.new('+', i, ax, bj, bx)
|
378
|
+
event = yield event if block_given?
|
379
|
+
callbacks.discard_b(event)
|
380
|
+
bj += 1
|
381
|
+
end
|
382
|
+
bx = string ? seq2[bj, 1] : seq2[bj]
|
383
|
+
event = Diff::LCS::ContextChange.new('=', i, ax, bj, bx)
|
384
|
+
event = yield event if block_given?
|
385
|
+
callbacks.match(event)
|
386
|
+
bj += 1
|
296
387
|
end
|
388
|
+
ai = i
|
297
389
|
end
|
298
|
-
|
299
|
-
|
300
|
-
#
|
301
|
-
#
|
302
|
-
|
303
|
-
|
304
|
-
|
305
|
-
|
306
|
-
|
307
|
-
|
308
|
-
|
309
|
-
|
310
|
-
|
311
|
-
|
312
|
-
# callbacks#match:: Called when +a+ and +b+ are pointing
|
313
|
-
# to common elements in +A+ and +B+.
|
314
|
-
# callbacks#discard_a:: Called when +a+ is pointing to an
|
315
|
-
# element not in +B+.
|
316
|
-
# callbacks#discard_b:: Called when +b+ is pointing to an
|
317
|
-
# element not in +A+.
|
318
|
-
# <em>callbacks#finished_a</em>:: Called when +a+ has reached the end of
|
319
|
-
# sequence +A+.
|
320
|
-
# <em>callbacks#finished_b</em>:: Called when +b+ has reached the end of
|
321
|
-
# sequence +B+.
|
322
|
-
#
|
323
|
-
# == Algorithm
|
324
|
-
# a---+
|
325
|
-
# v
|
326
|
-
# A = a b c e h j l m n p
|
327
|
-
# B = b c d e f j k l m r s t
|
328
|
-
# ^
|
329
|
-
# b---+
|
330
|
-
#
|
331
|
-
# If there are two arrows (+a+ and +b+) pointing to elements of
|
332
|
-
# sequences +A+ and +B+, the arrows will initially point to the first
|
333
|
-
# elements of their respective sequences. #traverse_sequences will
|
334
|
-
# advance the arrows through the sequences one element at a time,
|
335
|
-
# calling a method on the user-specified callback object before each
|
336
|
-
# advance. It will advance the arrows in such a way that if there are
|
337
|
-
# elements <tt>A[ii]</tt> and <tt>B[jj]</tt> which are both equal and
|
338
|
-
# part of the longest common subsequence, there will be some moment
|
339
|
-
# during the execution of #traverse_sequences when arrow +a+ is pointing
|
340
|
-
# to <tt>A[ii]</tt> and arrow +b+ is pointing to <tt>B[jj]</tt>. When
|
341
|
-
# this happens, #traverse_sequences will call <tt>callbacks#match</tt>
|
342
|
-
# and then it will advance both arrows.
|
343
|
-
#
|
344
|
-
# Otherwise, one of the arrows is pointing to an element of its sequence
|
345
|
-
# that is not part of the longest common subsequence.
|
346
|
-
# #traverse_sequences will advance that arrow and will call
|
347
|
-
# <tt>callbacks#discard_a</tt> or <tt>callbacks#discard_b</tt>, depending
|
348
|
-
# on which arrow it advanced. If both arrows point to elements that are
|
349
|
-
# not part of the longest common subsequence, then #traverse_sequences
|
350
|
-
# will advance one of them and call the appropriate callback, but it is
|
351
|
-
# not specified which it will call.
|
352
|
-
#
|
353
|
-
# The methods for <tt>callbacks#match</tt>, <tt>callbacks#discard_a</tt>,
|
354
|
-
# and <tt>callbacks#discard_b</tt> are invoked with an event comprising
|
355
|
-
# the action ("=", "+", or "-", respectively), the indicies +ii+ and
|
356
|
-
# +jj+, and the elements <tt>A[ii]</tt> and <tt>B[jj]</tt>. Return
|
357
|
-
# values are discarded by #traverse_sequences.
|
358
|
-
#
|
359
|
-
# === End of Sequences
|
360
|
-
# If arrow +a+ reaches the end of its sequence before arrow +b+ does,
|
361
|
-
# #traverse_sequence will try to call <tt>callbacks#finished_a</tt> with
|
362
|
-
# the last index and element of +A+ (<tt>A[-1]</tt>) and the current
|
363
|
-
# index and element of +B+ (<tt>B[jj]</tt>). If
|
364
|
-
# <tt>callbacks#finished_a</tt> does not exist, then
|
365
|
-
# <tt>callbacks#discard_b</tt> will be called on each element of +B+
|
366
|
-
# until the end of the sequence is reached (the call
|
367
|
-
# will be done with <tt>A[-1]</tt> and <tt>B[jj]</tt> for each element).
|
368
|
-
#
|
369
|
-
# If +b+ reaches the end of +B+ before +a+ reaches the end of +A+,
|
370
|
-
# <tt>callbacks#finished_b</tt> will be called with the current index
|
371
|
-
# and element of +A+ (<tt>A[ii]</tt>) and the last index and element of
|
372
|
-
# +B+ (<tt>A[-1]</tt>). Again, if <tt>callbacks#finished_b</tt> does not
|
373
|
-
# exist on the callback object, then <tt>callbacks#discard_a</tt> will
|
374
|
-
# be called on each element of +A+ until the end of the sequence is
|
375
|
-
# reached (<tt>A[ii]</tt> and <tt>B[-1]</tt>).
|
376
|
-
#
|
377
|
-
# There is a chance that one additional <tt>callbacks#discard_a</tt> or
|
378
|
-
# <tt>callbacks#discard_b</tt> will be called after the end of the
|
379
|
-
# sequence is reached, if +a+ has not yet reached the end of +A+ or +b+
|
380
|
-
# has not yet reached the end of +B+.
|
381
|
-
def traverse_sequences(seq1, seq2, callbacks = Diff::LCS::SequenceCallbacks, &block) #:yields change events:
|
382
|
-
matches = Diff::LCS.__lcs(seq1, seq2)
|
383
|
-
|
384
|
-
run_finished_a = run_finished_b = false
|
385
|
-
string = seq1.kind_of?(String)
|
386
|
-
|
387
|
-
a_size = seq1.size
|
388
|
-
b_size = seq2.size
|
389
|
-
ai = bj = 0
|
390
|
-
|
391
|
-
(0 .. matches.size).each do |ii|
|
392
|
-
b_line = matches[ii]
|
393
|
-
|
394
|
-
ax = string ? seq1[ii, 1] : seq1[ii]
|
395
|
-
bx = string ? seq2[bj, 1] : seq2[bj]
|
396
|
-
|
397
|
-
if b_line.nil?
|
398
|
-
unless ax.nil?
|
399
|
-
event = Diff::LCS::ContextChange.new('-', ii, ax, bj, bx)
|
400
|
-
event = yield event if block_given?
|
401
|
-
callbacks.discard_a(event)
|
402
|
-
end
|
390
|
+
ai += 1
|
391
|
+
|
392
|
+
# The last entry (if any) processed was a match. +ai+ and +bj+ point
|
393
|
+
# just past the last matching lines in their sequences.
|
394
|
+
while (ai < a_size) or (bj < b_size)
|
395
|
+
# last A?
|
396
|
+
if ai == a_size and bj < b_size
|
397
|
+
if callbacks.respond_to?(:finished_a) and not run_finished_a
|
398
|
+
ax = string ? seq1[-1, 1] : seq1[-1]
|
399
|
+
bx = string ? seq2[bj, 1] : seq2[bj]
|
400
|
+
event = Diff::LCS::ContextChange.new('>', (a_size - 1), ax, bj, bx)
|
401
|
+
event = yield event if block_given?
|
402
|
+
callbacks.finished_a(event)
|
403
|
+
run_finished_a = true
|
403
404
|
else
|
405
|
+
ax = string ? seq1[ai, 1] : seq1[ai]
|
404
406
|
loop do
|
405
|
-
break unless bj < b_line
|
406
407
|
bx = string ? seq2[bj, 1] : seq2[bj]
|
407
|
-
event = Diff::LCS::ContextChange.new('+',
|
408
|
+
event = Diff::LCS::ContextChange.new('+', ai, ax, bj, bx)
|
408
409
|
event = yield event if block_given?
|
409
410
|
callbacks.discard_b(event)
|
410
411
|
bj += 1
|
412
|
+
break unless bj < b_size
|
411
413
|
end
|
412
|
-
bx = string ? seq2[bj, 1] : seq2[bj]
|
413
|
-
event = Diff::LCS::ContextChange.new('=', ii, ax, bj, bx)
|
414
|
-
event = yield event if block_given?
|
415
|
-
callbacks.match(event)
|
416
|
-
bj += 1
|
417
414
|
end
|
418
|
-
ai = ii
|
419
415
|
end
|
420
|
-
ai += 1
|
421
|
-
|
422
|
-
# The last entry (if any) processed was a match. +ai+ and +bj+ point
|
423
|
-
# just past the last matching lines in their sequences.
|
424
|
-
while (ai < a_size) or (bj < b_size)
|
425
|
-
# last A?
|
426
|
-
if ai == a_size and bj < b_size
|
427
|
-
if callbacks.respond_to?(:finished_a) and not run_finished_a
|
428
|
-
ax = string ? seq1[-1, 1] : seq1[-1]
|
429
|
-
bx = string ? seq2[bj, 1] : seq2[bj]
|
430
|
-
event = Diff::LCS::ContextChange.new('>', (a_size - 1), ax, bj, bx)
|
431
|
-
event = yield event if block_given?
|
432
|
-
callbacks.finished_a(event)
|
433
|
-
run_finished_a = true
|
434
|
-
else
|
435
|
-
ax = string ? seq1[ai, 1] : seq1[ai]
|
436
|
-
loop do
|
437
|
-
bx = string ? seq2[bj, 1] : seq2[bj]
|
438
|
-
event = Diff::LCS::ContextChange.new('+', ai, ax, bj, bx)
|
439
|
-
event = yield event if block_given?
|
440
|
-
callbacks.discard_b(event)
|
441
|
-
bj += 1
|
442
|
-
break unless bj < b_size
|
443
|
-
end
|
444
|
-
end
|
445
|
-
end
|
446
416
|
|
447
|
-
|
448
|
-
|
449
|
-
|
450
|
-
ax = string ? seq1[ai, 1] : seq1[ai]
|
451
|
-
bx = string ? seq2[-1, 1] : seq2[-1]
|
452
|
-
event = Diff::LCS::ContextChange.new('<', ai, ax, (b_size - 1), bx)
|
453
|
-
event = yield event if block_given?
|
454
|
-
callbacks.finished_b(event)
|
455
|
-
run_finished_b = true
|
456
|
-
else
|
457
|
-
bx = string ? seq2[bj, 1] : seq2[bj]
|
458
|
-
loop do
|
459
|
-
ax = string ? seq1[ai, 1] : seq1[ai]
|
460
|
-
event = Diff::LCS::ContextChange.new('-', ai, ax, bj, bx)
|
461
|
-
event = yield event if block_given?
|
462
|
-
callbacks.discard_a(event)
|
463
|
-
ai += 1
|
464
|
-
break unless bj < b_size
|
465
|
-
end
|
466
|
-
end
|
467
|
-
end
|
468
|
-
|
469
|
-
if ai < a_size
|
470
|
-
ax = string ? seq1[ai, 1] : seq1[ai]
|
471
|
-
bx = string ? seq2[bj, 1] : seq2[bj]
|
472
|
-
event = Diff::LCS::ContextChange.new('-', ai, ax, bj, bx)
|
473
|
-
event = yield event if block_given?
|
474
|
-
callbacks.discard_a(event)
|
475
|
-
ai += 1
|
476
|
-
end
|
477
|
-
|
478
|
-
if bj < b_size
|
417
|
+
# last B?
|
418
|
+
if bj == b_size and ai < a_size
|
419
|
+
if callbacks.respond_to?(:finished_b) and not run_finished_b
|
479
420
|
ax = string ? seq1[ai, 1] : seq1[ai]
|
480
|
-
bx = string ? seq2[
|
481
|
-
event = Diff::LCS::ContextChange.new('
|
421
|
+
bx = string ? seq2[-1, 1] : seq2[-1]
|
422
|
+
event = Diff::LCS::ContextChange.new('<', ai, ax, (b_size - 1), bx)
|
482
423
|
event = yield event if block_given?
|
483
|
-
callbacks.
|
484
|
-
|
485
|
-
|
486
|
-
end
|
487
|
-
end
|
488
|
-
|
489
|
-
# #traverse_balanced is an alternative to #traverse_sequences. It
|
490
|
-
# uses a different algorithm to iterate through the entries in the
|
491
|
-
# computed longest common subsequence. Instead of viewing the changes as
|
492
|
-
# insertions or deletions from one of the sequences, #traverse_balanced
|
493
|
-
# will report <em>changes</em> between the sequences. To represent a
|
494
|
-
#
|
495
|
-
# The arguments to #traverse_balanced are the two sequences to traverse
|
496
|
-
# and a callback object, like this:
|
497
|
-
#
|
498
|
-
# traverse_balanced(seq1, seq2, Diff::LCS::ContextDiffCallbacks.new)
|
499
|
-
#
|
500
|
-
# #sdiff is implemented with #traverse_balanced.
|
501
|
-
#
|
502
|
-
# == Callback Methods
|
503
|
-
# Optional callback methods are <em>emphasized</em>.
|
504
|
-
#
|
505
|
-
# callbacks#match:: Called when +a+ and +b+ are pointing
|
506
|
-
# to common elements in +A+ and +B+.
|
507
|
-
# callbacks#discard_a:: Called when +a+ is pointing to an
|
508
|
-
# element not in +B+.
|
509
|
-
# callbacks#discard_b:: Called when +b+ is pointing to an
|
510
|
-
# element not in +A+.
|
511
|
-
# <em>callbacks#change</em>:: Called when +a+ and +b+ are pointing
|
512
|
-
# to the same relative position, but
|
513
|
-
# <tt>A[a]</tt> and <tt>B[b]</tt> are
|
514
|
-
# not the same; a <em>change</em> has
|
515
|
-
# occurred.
|
516
|
-
#
|
517
|
-
# #traverse_balanced might be a bit slower than #traverse_sequences,
|
518
|
-
# noticable only while processing huge amounts of data.
|
519
|
-
#
|
520
|
-
# The +sdiff+ function of this module is implemented as call to
|
521
|
-
# #traverse_balanced.
|
522
|
-
#
|
523
|
-
# == Algorithm
|
524
|
-
# a---+
|
525
|
-
# v
|
526
|
-
# A = a b c e h j l m n p
|
527
|
-
# B = b c d e f j k l m r s t
|
528
|
-
# ^
|
529
|
-
# b---+
|
530
|
-
#
|
531
|
-
# === Matches
|
532
|
-
# If there are two arrows (+a+ and +b+) pointing to elements of
|
533
|
-
# sequences +A+ and +B+, the arrows will initially point to the first
|
534
|
-
# elements of their respective sequences. #traverse_sequences will
|
535
|
-
# advance the arrows through the sequences one element at a time,
|
536
|
-
# calling a method on the user-specified callback object before each
|
537
|
-
# advance. It will advance the arrows in such a way that if there are
|
538
|
-
# elements <tt>A[ii]</tt> and <tt>B[jj]</tt> which are both equal and
|
539
|
-
# part of the longest common subsequence, there will be some moment
|
540
|
-
# during the execution of #traverse_sequences when arrow +a+ is pointing
|
541
|
-
# to <tt>A[ii]</tt> and arrow +b+ is pointing to <tt>B[jj]</tt>. When
|
542
|
-
# this happens, #traverse_sequences will call <tt>callbacks#match</tt>
|
543
|
-
# and then it will advance both arrows.
|
544
|
-
#
|
545
|
-
# === Discards
|
546
|
-
# Otherwise, one of the arrows is pointing to an element of its sequence
|
547
|
-
# that is not part of the longest common subsequence.
|
548
|
-
# #traverse_sequences will advance that arrow and will call
|
549
|
-
# <tt>callbacks#discard_a</tt> or <tt>callbacks#discard_b</tt>,
|
550
|
-
# depending on which arrow it advanced.
|
551
|
-
#
|
552
|
-
# === Changes
|
553
|
-
# If both +a+ and +b+ point to elements that are not part of the longest
|
554
|
-
# common subsequence, then #traverse_sequences will try to call
|
555
|
-
# <tt>callbacks#change</tt> and advance both arrows. If
|
556
|
-
# <tt>callbacks#change</tt> is not implemented, then
|
557
|
-
# <tt>callbacks#discard_a</tt> and <tt>callbacks#discard_b</tt> will be
|
558
|
-
# called in turn.
|
559
|
-
#
|
560
|
-
# The methods for <tt>callbacks#match</tt>, <tt>callbacks#discard_a</tt>,
|
561
|
-
# <tt>callbacks#discard_b</tt>, and <tt>callbacks#change</tt> are
|
562
|
-
# invoked with an event comprising the action ("=", "+", "-", or "!",
|
563
|
-
# respectively), the indicies +ii+ and +jj+, and the elements
|
564
|
-
# <tt>A[ii]</tt> and <tt>B[jj]</tt>. Return values are discarded by
|
565
|
-
# #traverse_balanced.
|
566
|
-
#
|
567
|
-
# === Context
|
568
|
-
# Note that +ii+ and +jj+ may not be the same index position, even if
|
569
|
-
# +a+ and +b+ are considered to be pointing to matching or changed
|
570
|
-
# elements.
|
571
|
-
def traverse_balanced(seq1, seq2, callbacks = Diff::LCS::BalancedCallbacks)
|
572
|
-
matches = Diff::LCS.__lcs(seq1, seq2)
|
573
|
-
a_size = seq1.size
|
574
|
-
b_size = seq2.size
|
575
|
-
ai = bj = mb = 0
|
576
|
-
ma = -1
|
577
|
-
string = seq1.kind_of?(String)
|
578
|
-
|
579
|
-
# Process all the lines in the match vector.
|
580
|
-
loop do
|
581
|
-
# Find next match indices +ma+ and +mb+
|
582
|
-
loop do
|
583
|
-
ma += 1
|
584
|
-
break unless ma < matches.size and matches[ma].nil?
|
585
|
-
end
|
586
|
-
|
587
|
-
break if ma >= matches.size # end of matches?
|
588
|
-
mb = matches[ma]
|
589
|
-
|
590
|
-
# Change(seq2)
|
591
|
-
while (ai < ma) or (bj < mb)
|
592
|
-
ax = string ? seq1[ai, 1] : seq1[ai]
|
424
|
+
callbacks.finished_b(event)
|
425
|
+
run_finished_b = true
|
426
|
+
else
|
593
427
|
bx = string ? seq2[bj, 1] : seq2[bj]
|
594
|
-
|
595
|
-
|
596
|
-
when [true, true]
|
597
|
-
if callbacks.respond_to?(:change)
|
598
|
-
event = Diff::LCS::ContextChange.new('!', ai, ax, bj, bx)
|
599
|
-
event = yield event if block_given?
|
600
|
-
callbacks.change(event)
|
601
|
-
ai += 1
|
602
|
-
bj += 1
|
603
|
-
else
|
604
|
-
event = Diff::LCS::ContextChange.new('-', ai, ax, bj, bx)
|
605
|
-
event = yield event if block_given?
|
606
|
-
callbacks.discard_a(event)
|
607
|
-
ai += 1
|
608
|
-
ax = string ? seq1[ai, 1] : seq1[ai]
|
609
|
-
event = Diff::LCS::ContextChange.new('+', ai, ax, bj, bx)
|
610
|
-
event = yield event if block_given?
|
611
|
-
callbacks.discard_b(event)
|
612
|
-
bj += 1
|
613
|
-
end
|
614
|
-
when [true, false]
|
428
|
+
loop do
|
429
|
+
ax = string ? seq1[ai, 1] : seq1[ai]
|
615
430
|
event = Diff::LCS::ContextChange.new('-', ai, ax, bj, bx)
|
616
431
|
event = yield event if block_given?
|
617
432
|
callbacks.discard_a(event)
|
618
433
|
ai += 1
|
619
|
-
|
620
|
-
event = Diff::LCS::ContextChange.new('+', ai, ax, bj, bx)
|
621
|
-
event = yield event if block_given?
|
622
|
-
callbacks.discard_b(event)
|
623
|
-
bj += 1
|
434
|
+
break unless bj < b_size
|
624
435
|
end
|
625
436
|
end
|
437
|
+
end
|
626
438
|
|
627
|
-
|
439
|
+
if ai < a_size
|
628
440
|
ax = string ? seq1[ai, 1] : seq1[ai]
|
629
441
|
bx = string ? seq2[bj, 1] : seq2[bj]
|
630
|
-
event = Diff::LCS::ContextChange.new('
|
442
|
+
event = Diff::LCS::ContextChange.new('-', ai, ax, bj, bx)
|
631
443
|
event = yield event if block_given?
|
632
|
-
callbacks.
|
444
|
+
callbacks.discard_a(event)
|
633
445
|
ai += 1
|
446
|
+
end
|
447
|
+
|
448
|
+
if bj < b_size
|
449
|
+
ax = string ? seq1[ai, 1] : seq1[ai]
|
450
|
+
bx = string ? seq2[bj, 1] : seq2[bj]
|
451
|
+
event = Diff::LCS::ContextChange.new('+', ai, ax, bj, bx)
|
452
|
+
event = yield event if block_given?
|
453
|
+
callbacks.discard_b(event)
|
634
454
|
bj += 1
|
635
455
|
end
|
456
|
+
end
|
457
|
+
end
|
636
458
|
|
637
|
-
|
459
|
+
# #traverse_balanced is an alternative to #traverse_sequences. It uses a
|
460
|
+
# different algorithm to iterate through the entries in the computed
|
461
|
+
# longest common subsequence. Instead of viewing the changes as insertions
|
462
|
+
# or deletions from one of the sequences, #traverse_balanced will report
|
463
|
+
# <em>changes</em> between the sequences.
|
464
|
+
#
|
465
|
+
# The arguments to #traverse_balanced are the two sequences to traverse
|
466
|
+
# and a callback object, like this:
|
467
|
+
#
|
468
|
+
# traverse_balanced(seq1, seq2, Diff::LCS::ContextDiffCallbacks.new)
|
469
|
+
#
|
470
|
+
# #sdiff is implemented with #traverse_balanced.
|
471
|
+
#
|
472
|
+
# == Callback Methods
|
473
|
+
#
|
474
|
+
# Optional callback methods are <em>emphasized</em>.
|
475
|
+
#
|
476
|
+
# callbacks#match:: Called when +a+ and +b+ are pointing to
|
477
|
+
# common elements in +A+ and +B+.
|
478
|
+
# callbacks#discard_a:: Called when +a+ is pointing to an
|
479
|
+
# element not in +B+.
|
480
|
+
# callbacks#discard_b:: Called when +b+ is pointing to an
|
481
|
+
# element not in +A+.
|
482
|
+
# <em>callbacks#change</em>:: Called when +a+ and +b+ are pointing to
|
483
|
+
# the same relative position, but
|
484
|
+
# <tt>A[a]</tt> and <tt>B[b]</tt> are not
|
485
|
+
# the same; a <em>change</em> has
|
486
|
+
# occurred.
|
487
|
+
#
|
488
|
+
# #traverse_balanced might be a bit slower than #traverse_sequences,
|
489
|
+
# noticable only while processing huge amounts of data.
|
490
|
+
#
|
491
|
+
# == Algorithm
|
492
|
+
#
|
493
|
+
# a---+
|
494
|
+
# v
|
495
|
+
# A = a b c e h j l m n p
|
496
|
+
# B = b c d e f j k l m r s t
|
497
|
+
# ^
|
498
|
+
# b---+
|
499
|
+
#
|
500
|
+
# === Matches
|
501
|
+
#
|
502
|
+
# If there are two arrows (+a+ and +b+) pointing to elements of sequences
|
503
|
+
# +A+ and +B+, the arrows will initially point to the first elements of
|
504
|
+
# their respective sequences. #traverse_sequences will advance the arrows
|
505
|
+
# through the sequences one element at a time, calling a method on the
|
506
|
+
# user-specified callback object before each advance. It will advance the
|
507
|
+
# arrows in such a way that if there are elements <tt>A[i]</tt> and
|
508
|
+
# <tt>B[j]</tt> which are both equal and part of the longest common
|
509
|
+
# subsequence, there will be some moment during the execution of
|
510
|
+
# #traverse_sequences when arrow +a+ is pointing to <tt>A[i]</tt> and
|
511
|
+
# arrow +b+ is pointing to <tt>B[j]</tt>. When this happens,
|
512
|
+
# #traverse_sequences will call <tt>callbacks#match</tt> and then it will
|
513
|
+
# advance both arrows.
|
514
|
+
#
|
515
|
+
# === Discards
|
516
|
+
#
|
517
|
+
# Otherwise, one of the arrows is pointing to an element of its sequence
|
518
|
+
# that is not part of the longest common subsequence. #traverse_sequences
|
519
|
+
# will advance that arrow and will call <tt>callbacks#discard_a</tt> or
|
520
|
+
# <tt>callbacks#discard_b</tt>, depending on which arrow it advanced.
|
521
|
+
#
|
522
|
+
# === Changes
|
523
|
+
#
|
524
|
+
# If both +a+ and +b+ point to elements that are not part of the longest
|
525
|
+
# common subsequence, then #traverse_sequences will try to call
|
526
|
+
# <tt>callbacks#change</tt> and advance both arrows. If
|
527
|
+
# <tt>callbacks#change</tt> is not implemented, then
|
528
|
+
# <tt>callbacks#discard_a</tt> and <tt>callbacks#discard_b</tt> will be
|
529
|
+
# called in turn.
|
530
|
+
#
|
531
|
+
# The methods for <tt>callbacks#match</tt>, <tt>callbacks#discard_a</tt>,
|
532
|
+
# <tt>callbacks#discard_b</tt>, and <tt>callbacks#change</tt> are invoked
|
533
|
+
# with an event comprising the action ("=", "+", "-", or "!",
|
534
|
+
# respectively), the indicies +i+ and +j+, and the elements
|
535
|
+
# <tt>A[i]</tt> and <tt>B[j]</tt>. Return values are discarded by
|
536
|
+
# #traverse_balanced.
|
537
|
+
#
|
538
|
+
# === Context
|
539
|
+
# Note that +i+ and +j+ may not be the same index position, even if +a+
|
540
|
+
# and +b+ are considered to be pointing to matching or changed elements.
|
541
|
+
def traverse_balanced(seq1, seq2, callbacks = Diff::LCS::BalancedCallbacks)
|
542
|
+
matches = Diff::LCS::Internals.lcs(seq1, seq2)
|
543
|
+
a_size = seq1.size
|
544
|
+
b_size = seq2.size
|
545
|
+
ai = bj = mb = 0
|
546
|
+
ma = -1
|
547
|
+
string = seq1.kind_of?(String)
|
548
|
+
|
549
|
+
# Process all the lines in the match vector.
|
550
|
+
loop do
|
551
|
+
# Find next match indices +ma+ and +mb+
|
552
|
+
loop do
|
553
|
+
ma += 1
|
554
|
+
break unless ma < matches.size and matches[ma].nil?
|
555
|
+
end
|
556
|
+
|
557
|
+
break if ma >= matches.size # end of matches?
|
558
|
+
mb = matches[ma]
|
559
|
+
|
560
|
+
# Change(seq2)
|
561
|
+
while (ai < ma) or (bj < mb)
|
638
562
|
ax = string ? seq1[ai, 1] : seq1[ai]
|
639
563
|
bx = string ? seq2[bj, 1] : seq2[bj]
|
640
564
|
|
641
|
-
case [(ai <
|
565
|
+
case [(ai < ma), (bj < mb)]
|
642
566
|
when [true, true]
|
643
567
|
if callbacks.respond_to?(:change)
|
644
568
|
event = Diff::LCS::ContextChange.new('!', ai, ax, bj, bx)
|
@@ -669,437 +593,213 @@ module Diff::LCS
|
|
669
593
|
bj += 1
|
670
594
|
end
|
671
595
|
end
|
672
|
-
end
|
673
|
-
|
674
|
-
PATCH_MAP = { #:nodoc:
|
675
|
-
:patch => { '+' => '+', '-' => '-', '!' => '!', '=' => '=' },
|
676
|
-
:unpatch => { '+' => '-', '-' => '+', '!' => '!', '=' => '=' }
|
677
|
-
}
|
678
|
-
|
679
|
-
# Given a patchset, convert the current version to the new
|
680
|
-
# version. If +direction+ is not specified (must be
|
681
|
-
# <tt>:patch</tt> or <tt>:unpatch</tt>), then discovery of the
|
682
|
-
# direction of the patch will be attempted.
|
683
|
-
def patch(src, patchset, direction = nil)
|
684
|
-
string = src.kind_of?(String)
|
685
|
-
# Start with a new empty type of the source's class
|
686
|
-
res = src.class.new
|
687
|
-
|
688
|
-
# Normalize the patchset.
|
689
|
-
patchset = __normalize_patchset(patchset)
|
690
|
-
|
691
|
-
direction ||= Diff::LCS.__diff_direction(src, patchset)
|
692
|
-
direction ||= :patch
|
693
|
-
|
694
|
-
ai = bj = 0
|
695
|
-
|
696
|
-
patchset.each do |change|
|
697
|
-
# Both Change and ContextChange support #action
|
698
|
-
action = PATCH_MAP[direction][change.action]
|
699
|
-
|
700
|
-
case change
|
701
|
-
when Diff::LCS::ContextChange
|
702
|
-
case direction
|
703
|
-
when :patch
|
704
|
-
el = change.new_element
|
705
|
-
op = change.old_position
|
706
|
-
np = change.new_position
|
707
|
-
when :unpatch
|
708
|
-
el = change.old_element
|
709
|
-
op = change.new_position
|
710
|
-
np = change.old_position
|
711
|
-
end
|
712
|
-
|
713
|
-
case action
|
714
|
-
when '-' # Remove details from the old string
|
715
|
-
while ai < op
|
716
|
-
res << (string ? src[ai, 1] : src[ai])
|
717
|
-
ai += 1
|
718
|
-
bj += 1
|
719
|
-
end
|
720
|
-
ai += 1
|
721
|
-
when '+'
|
722
|
-
while bj < np
|
723
|
-
res << (string ? src[ai, 1] : src[ai])
|
724
|
-
ai += 1
|
725
|
-
bj += 1
|
726
|
-
end
|
727
|
-
|
728
|
-
res << el
|
729
|
-
bj += 1
|
730
|
-
when '='
|
731
|
-
# This only appears in sdiff output with the SDiff callback.
|
732
|
-
# Therefore, we only need to worry about dealing with a single
|
733
|
-
# element.
|
734
|
-
res << el
|
735
|
-
|
736
|
-
ai += 1
|
737
|
-
bj += 1
|
738
|
-
when '!'
|
739
|
-
while ai < op
|
740
|
-
res << (string ? src[ai, 1] : src[ai])
|
741
|
-
ai += 1
|
742
|
-
bj += 1
|
743
|
-
end
|
744
596
|
|
745
|
-
|
746
|
-
|
747
|
-
|
748
|
-
|
749
|
-
|
750
|
-
|
751
|
-
|
752
|
-
|
753
|
-
|
754
|
-
res << (string ? src[ai, 1] : src[ai])
|
755
|
-
ai += 1
|
756
|
-
bj += 1
|
757
|
-
end
|
758
|
-
ai += 1
|
759
|
-
when '+'
|
760
|
-
while bj < change.position
|
761
|
-
res << (string ? src[ai, 1] : src[ai])
|
762
|
-
ai += 1
|
763
|
-
bj += 1
|
764
|
-
end
|
597
|
+
# Match
|
598
|
+
ax = string ? seq1[ai, 1] : seq1[ai]
|
599
|
+
bx = string ? seq2[bj, 1] : seq2[bj]
|
600
|
+
event = Diff::LCS::ContextChange.new('=', ai, ax, bj, bx)
|
601
|
+
event = yield event if block_given?
|
602
|
+
callbacks.match(event)
|
603
|
+
ai += 1
|
604
|
+
bj += 1
|
605
|
+
end
|
765
606
|
|
766
|
-
|
607
|
+
while (ai < a_size) or (bj < b_size)
|
608
|
+
ax = string ? seq1[ai, 1] : seq1[ai]
|
609
|
+
bx = string ? seq2[bj, 1] : seq2[bj]
|
767
610
|
|
768
|
-
|
769
|
-
|
611
|
+
case [(ai < a_size), (bj < b_size)]
|
612
|
+
when [true, true]
|
613
|
+
if callbacks.respond_to?(:change)
|
614
|
+
event = Diff::LCS::ContextChange.new('!', ai, ax, bj, bx)
|
615
|
+
event = yield event if block_given?
|
616
|
+
callbacks.change(event)
|
617
|
+
ai += 1
|
618
|
+
bj += 1
|
619
|
+
else
|
620
|
+
event = Diff::LCS::ContextChange.new('-', ai, ax, bj, bx)
|
621
|
+
event = yield event if block_given?
|
622
|
+
callbacks.discard_a(event)
|
623
|
+
ai += 1
|
624
|
+
ax = string ? seq1[ai, 1] : seq1[ai]
|
625
|
+
event = Diff::LCS::ContextChange.new('+', ai, ax, bj, bx)
|
626
|
+
event = yield event if block_given?
|
627
|
+
callbacks.discard_b(event)
|
628
|
+
bj += 1
|
770
629
|
end
|
771
|
-
|
772
|
-
|
773
|
-
|
774
|
-
|
630
|
+
when [true, false]
|
631
|
+
event = Diff::LCS::ContextChange.new('-', ai, ax, bj, bx)
|
632
|
+
event = yield event if block_given?
|
633
|
+
callbacks.discard_a(event)
|
775
634
|
ai += 1
|
635
|
+
when [false, true]
|
636
|
+
event = Diff::LCS::ContextChange.new('+', ai, ax, bj, bx)
|
637
|
+
event = yield event if block_given?
|
638
|
+
callbacks.discard_b(event)
|
776
639
|
bj += 1
|
777
640
|
end
|
778
|
-
|
779
|
-
res
|
780
641
|
end
|
642
|
+
end
|
781
643
|
|
782
|
-
|
783
|
-
|
784
|
-
|
785
|
-
|
786
|
-
end
|
644
|
+
PATCH_MAP = { #:nodoc:
|
645
|
+
:patch => { '+' => '+', '-' => '-', '!' => '!', '=' => '=' },
|
646
|
+
:unpatch => { '+' => '-', '-' => '+', '!' => '!', '=' => '=' }
|
647
|
+
}
|
787
648
|
|
788
|
-
|
789
|
-
|
790
|
-
|
791
|
-
|
649
|
+
# Applies a +patchset+ to the sequence +src+ according to the +direction+
|
650
|
+
# (<tt>:patch</tt> or <tt>:unpatch</tt>), producing a new sequence.
|
651
|
+
#
|
652
|
+
# If the +direction+ is not specified, Diff::LCS::patch will attempt to
|
653
|
+
# discover the direction of the +patchset+.
|
654
|
+
#
|
655
|
+
# A +patchset+ can be considered to apply forward (<tt>:patch</tt>) if the
|
656
|
+
# following expression is true:
|
657
|
+
#
|
658
|
+
# patch(s1, diff(s1, s2)) -> s2
|
659
|
+
#
|
660
|
+
# A +patchset+ can be considered to apply backward (<tt>:unpatch</tt>) if
|
661
|
+
# the following expression is true:
|
662
|
+
#
|
663
|
+
# patch(s2, diff(s1, s2)) -> s1
|
664
|
+
#
|
665
|
+
# If the +patchset+ contains no changes, the +src+ value will be returned
|
666
|
+
# as either <tt>src.dup</tt> or +src+. A +patchset+ can be deemed as
|
667
|
+
# having no changes if the following predicate returns true:
|
668
|
+
#
|
669
|
+
# patchset.empty? or
|
670
|
+
# patchset.flatten.all? { |change| change.unchanged? }
|
671
|
+
#
|
672
|
+
# === Patchsets
|
673
|
+
#
|
674
|
+
# A +patchset+ is always an enumerable sequence of changes, hunks of
|
675
|
+
# changes, or a mix of the two. A hunk of changes is an enumerable
|
676
|
+
# sequence of changes:
|
677
|
+
#
|
678
|
+
# [ # patchset
|
679
|
+
# # change
|
680
|
+
# [ # hunk
|
681
|
+
# # change
|
682
|
+
# ]
|
683
|
+
# ]
|
684
|
+
#
|
685
|
+
# The +patch+ method accepts <tt>patchset</tt>s that are enumerable
|
686
|
+
# sequences containing either Diff::LCS::Change objects (or a subclass) or
|
687
|
+
# the array representations of those objects. Prior to application, array
|
688
|
+
# representations of Diff::LCS::Change objects will be reified.
|
689
|
+
def patch(src, patchset, direction = nil)
|
690
|
+
# Normalize the patchset.
|
691
|
+
has_changes, patchset = Diff::LCS::Internals.analyze_patchset(patchset)
|
692
|
+
|
693
|
+
if not has_changes
|
694
|
+
return src.dup if src.respond_to? :dup
|
695
|
+
return src
|
792
696
|
end
|
793
697
|
|
794
|
-
|
795
|
-
#
|
796
|
-
|
797
|
-
# that
|
798
|
-
#
|
799
|
-
# result = Diff::LCS.__lcs(a, b)
|
800
|
-
# result.each_with_index do |e, ii|
|
801
|
-
# assert_equal(a[ii], b[e]) unless e.nil?
|
802
|
-
# end
|
803
|
-
#
|
804
|
-
# Note: This will be deprecated as a public function in a future release.
|
805
|
-
def __lcs(a, b)
|
806
|
-
a_start = b_start = 0
|
807
|
-
a_finish = a.size - 1
|
808
|
-
b_finish = b.size - 1
|
809
|
-
vector = []
|
698
|
+
string = src.kind_of?(String)
|
699
|
+
# Start with a new empty type of the source's class
|
700
|
+
res = src.class.new
|
810
701
|
|
811
|
-
|
812
|
-
while (a_start <= a_finish) and
|
813
|
-
(b_start <= b_finish) and
|
814
|
-
(a[a_start] == b[b_start])
|
815
|
-
vector[a_start] = b_start
|
816
|
-
a_start += 1
|
817
|
-
b_start += 1
|
818
|
-
end
|
702
|
+
direction ||= Diff::LCS::Internals.intuit_diff_direction(src, patchset)
|
819
703
|
|
820
|
-
|
821
|
-
while (a_start <= a_finish) and
|
822
|
-
(b_start <= b_finish) and
|
823
|
-
(a[a_finish] == b[b_finish])
|
824
|
-
vector[a_finish] = b_finish
|
825
|
-
a_finish -= 1
|
826
|
-
b_finish -= 1
|
827
|
-
end
|
704
|
+
ai = bj = 0
|
828
705
|
|
829
|
-
|
830
|
-
b_matches = Diff::LCS.__position_hash(b, b_start .. b_finish)
|
706
|
+
patch_map = PATCH_MAP[direction]
|
831
707
|
|
832
|
-
|
833
|
-
|
708
|
+
patchset.flatten.each do |change|
|
709
|
+
# Both Change and ContextChange support #action
|
710
|
+
action = patch_map[change.action]
|
834
711
|
|
835
|
-
|
836
|
-
|
837
|
-
|
838
|
-
|
839
|
-
|
840
|
-
|
841
|
-
|
842
|
-
|
843
|
-
|
844
|
-
|
845
|
-
|
712
|
+
case change
|
713
|
+
when Diff::LCS::ContextChange
|
714
|
+
case direction
|
715
|
+
when :patch
|
716
|
+
el = change.new_element
|
717
|
+
op = change.old_position
|
718
|
+
np = change.new_position
|
719
|
+
when :unpatch
|
720
|
+
el = change.old_element
|
721
|
+
op = change.new_position
|
722
|
+
np = change.old_position
|
846
723
|
end
|
847
|
-
end
|
848
|
-
|
849
|
-
unless thresh.empty?
|
850
|
-
link = links[thresh.size - 1]
|
851
|
-
while not link.nil?
|
852
|
-
vector[link[1]] = link[2]
|
853
|
-
link = link[0]
|
854
|
-
end
|
855
|
-
end
|
856
724
|
|
857
|
-
|
858
|
-
|
725
|
+
case action
|
726
|
+
when '-' # Remove details from the old string
|
727
|
+
while ai < op
|
728
|
+
res << (string ? src[ai, 1] : src[ai])
|
729
|
+
ai += 1
|
730
|
+
bj += 1
|
731
|
+
end
|
732
|
+
ai += 1
|
733
|
+
when '+'
|
734
|
+
while bj < np
|
735
|
+
res << (string ? src[ai, 1] : src[ai])
|
736
|
+
ai += 1
|
737
|
+
bj += 1
|
738
|
+
end
|
859
739
|
|
860
|
-
|
861
|
-
|
862
|
-
|
863
|
-
|
864
|
-
|
865
|
-
|
866
|
-
|
867
|
-
# This operation preserves the sort order.
|
868
|
-
#
|
869
|
-
# Note: This will be deprecated as a public function in a future release.
|
870
|
-
def __replace_next_larger(enum, value, last_index = nil)
|
871
|
-
# Off the end?
|
872
|
-
if enum.empty? or (value > enum[-1])
|
873
|
-
enum << value
|
874
|
-
return enum.size - 1
|
875
|
-
end
|
740
|
+
res << el
|
741
|
+
bj += 1
|
742
|
+
when '='
|
743
|
+
# This only appears in sdiff output with the SDiff callback.
|
744
|
+
# Therefore, we only need to worry about dealing with a single
|
745
|
+
# element.
|
746
|
+
res << el
|
876
747
|
|
877
|
-
|
878
|
-
|
879
|
-
|
880
|
-
|
881
|
-
|
748
|
+
ai += 1
|
749
|
+
bj += 1
|
750
|
+
when '!'
|
751
|
+
while ai < op
|
752
|
+
res << (string ? src[ai, 1] : src[ai])
|
753
|
+
ai += 1
|
754
|
+
bj += 1
|
755
|
+
end
|
882
756
|
|
883
|
-
|
757
|
+
bj += 1
|
758
|
+
ai += 1
|
884
759
|
|
885
|
-
|
886
|
-
return nil
|
887
|
-
elsif value > found
|
888
|
-
first_index = ii + 1
|
889
|
-
else
|
890
|
-
last_index = ii - 1
|
760
|
+
res << el
|
891
761
|
end
|
892
|
-
|
762
|
+
when Diff::LCS::Change
|
763
|
+
case action
|
764
|
+
when '-'
|
765
|
+
while ai < change.position
|
766
|
+
res << (string ? src[ai, 1] : src[ai])
|
767
|
+
ai += 1
|
768
|
+
bj += 1
|
769
|
+
end
|
770
|
+
ai += 1
|
771
|
+
when '+'
|
772
|
+
while bj < change.position
|
773
|
+
res << (string ? src[ai, 1] : src[ai])
|
774
|
+
ai += 1
|
775
|
+
bj += 1
|
776
|
+
end
|
893
777
|
|
894
|
-
|
895
|
-
# value.
|
896
|
-
enum[first_index] = value
|
897
|
-
return first_index
|
898
|
-
end
|
778
|
+
bj += 1
|
899
779
|
|
900
|
-
|
901
|
-
|
902
|
-
# onto the collection. (Currently unused.)
|
903
|
-
#
|
904
|
-
# Note: This will be deprecated as a public function in a future release.
|
905
|
-
def __inverse_vector(a, vector)
|
906
|
-
inverse = a.dup
|
907
|
-
(0 ... vector.size).each do |ii|
|
908
|
-
inverse[vector[ii]] = ii unless vector[ii].nil?
|
780
|
+
res << change.element
|
781
|
+
end
|
909
782
|
end
|
910
|
-
inverse
|
911
783
|
end
|
912
784
|
|
913
|
-
|
914
|
-
|
915
|
-
|
916
|
-
|
917
|
-
# Note: This will be deprecated as a public function in a future release.
|
918
|
-
def __position_hash(enum, interval = 0 .. -1)
|
919
|
-
hash = Hash.new { |hh, kk| hh[kk] = [] }
|
920
|
-
interval.each do |ii|
|
921
|
-
kk = enum.kind_of?(String) ? enum[ii, 1] : enum[ii]
|
922
|
-
hash[kk] << ii
|
923
|
-
end
|
924
|
-
hash
|
785
|
+
while ai < src.size
|
786
|
+
res << (string ? src[ai, 1] : src[ai])
|
787
|
+
ai += 1
|
788
|
+
bj += 1
|
925
789
|
end
|
926
790
|
|
927
|
-
|
928
|
-
|
929
|
-
#
|
930
|
-
# WARNING: By default, this examines the whole patch, so this could take
|
931
|
-
# some time. This also works better with Diff::LCS::ContextChange or
|
932
|
-
# Diff::LCS::Change as its source, as an array will cause the creation
|
933
|
-
# of one of the above.
|
934
|
-
#
|
935
|
-
# Note: This will be deprecated as a public function in a future release.
|
936
|
-
def __diff_direction(src, patchset, limit = nil)
|
937
|
-
count = left = left_miss = right = right_miss = 0
|
938
|
-
string = src.kind_of?(String)
|
939
|
-
|
940
|
-
patchset.each do |change|
|
941
|
-
count += 1
|
942
|
-
|
943
|
-
case change
|
944
|
-
when Diff::LCS::Change
|
945
|
-
# With a simplistic change, we can't tell the difference between
|
946
|
-
# the left and right on '!' actions, so we ignore those. On '='
|
947
|
-
# actions, if there's a miss, we miss both left and right.
|
948
|
-
element = string ? src[change.position, 1] : src[change.position]
|
949
|
-
|
950
|
-
case change.action
|
951
|
-
when '-'
|
952
|
-
if element == change.element
|
953
|
-
left += 1
|
954
|
-
else
|
955
|
-
left_miss += 1
|
956
|
-
end
|
957
|
-
when '+'
|
958
|
-
if element == change.element
|
959
|
-
right += 1
|
960
|
-
else
|
961
|
-
right_miss += 1
|
962
|
-
end
|
963
|
-
when '='
|
964
|
-
if element != change.element
|
965
|
-
left_miss += 1
|
966
|
-
right_miss += 1
|
967
|
-
end
|
968
|
-
end
|
969
|
-
when Diff::LCS::ContextChange
|
970
|
-
case change.action
|
971
|
-
when '-' # Remove details from the old string
|
972
|
-
element = string ? src[change.old_position, 1] : src[change.old_position]
|
973
|
-
if element == change.old_element
|
974
|
-
left += 1
|
975
|
-
else
|
976
|
-
left_miss += 1
|
977
|
-
end
|
978
|
-
when '+'
|
979
|
-
element = string ? src[change.new_position, 1] : src[change.new_position]
|
980
|
-
if element == change.new_element
|
981
|
-
right += 1
|
982
|
-
else
|
983
|
-
right_miss += 1
|
984
|
-
end
|
985
|
-
when '='
|
986
|
-
le = string ? src[change.old_position, 1] : src[change.old_position]
|
987
|
-
re = string ? src[change.new_position, 1] : src[change.new_position]
|
988
|
-
|
989
|
-
left_miss += 1 if le != change.old_element
|
990
|
-
right_miss += 1 if re != change.new_element
|
991
|
-
when '!'
|
992
|
-
element = string ? src[change.old_position, 1] : src[change.old_position]
|
993
|
-
if element == change.old_element
|
994
|
-
left += 1
|
995
|
-
else
|
996
|
-
element = string ? src[change.new_position, 1] : src[change.new_position]
|
997
|
-
if element == change.new_element
|
998
|
-
right += 1
|
999
|
-
else
|
1000
|
-
left_miss += 1
|
1001
|
-
right_miss += 1
|
1002
|
-
end
|
1003
|
-
end
|
1004
|
-
end
|
1005
|
-
end
|
1006
|
-
|
1007
|
-
break if (not limit.nil?) && (count > limit)
|
1008
|
-
end
|
1009
|
-
|
1010
|
-
no_left = (left == 0) and (left_miss >= 0)
|
1011
|
-
no_right = (right == 0) and (right_miss >= 0)
|
791
|
+
res
|
792
|
+
end
|
1012
793
|
|
1013
|
-
|
1014
|
-
|
1015
|
-
|
1016
|
-
|
1017
|
-
|
1018
|
-
else
|
1019
|
-
raise "The provided patchset does not appear to apply to the provided value as either source or destination value."
|
1020
|
-
end
|
1021
|
-
end
|
794
|
+
# Given a set of patchset, convert the current version to the prior
|
795
|
+
# version. Does no auto-discovery.
|
796
|
+
def unpatch!(src, patchset)
|
797
|
+
patch(src, patchset, :unpatch)
|
798
|
+
end
|
1022
799
|
|
1023
|
-
|
1024
|
-
|
1025
|
-
|
1026
|
-
|
1027
|
-
#
|
1028
|
-
# [ # patchset <- Diff::LCS.diff(a, b)
|
1029
|
-
# [ # one or more hunks
|
1030
|
-
# Diff::LCS::Change # one or more changes
|
1031
|
-
# ] ]
|
1032
|
-
#
|
1033
|
-
# [ # patchset, equivalent to the above
|
1034
|
-
# [ # one or more hunks
|
1035
|
-
# [ action, line, value ] # one or more changes
|
1036
|
-
# ] ]
|
1037
|
-
#
|
1038
|
-
# [ # patchset <- Diff::LCS.diff(a, b, Diff::LCS::ContextDiffCallbacks)
|
1039
|
-
# # OR <- Diff::LCS.sdiff(a, b, Diff::LCS::ContextDiffCallbacks)
|
1040
|
-
# [ # one or more hunks
|
1041
|
-
# Diff::LCS::ContextChange # one or more changes
|
1042
|
-
# ] ]
|
1043
|
-
#
|
1044
|
-
# [ # patchset, equivalent to the above
|
1045
|
-
# [ # one or more hunks
|
1046
|
-
# [ action, [ old line, old value ], [ new line, new value ] ]
|
1047
|
-
# # one or more changes
|
1048
|
-
# ] ]
|
1049
|
-
#
|
1050
|
-
# [ # patchset <- Diff::LCS.sdiff(a, b)
|
1051
|
-
# # OR <- Diff::LCS.diff(a, b, Diff::LCS::SDiffCallbacks)
|
1052
|
-
# Diff::LCS::ContextChange # one or more changes
|
1053
|
-
# ]
|
1054
|
-
#
|
1055
|
-
# [ # patchset, equivalent to the above
|
1056
|
-
# [ action, [ old line, old value ], [ new line, new value ] ]
|
1057
|
-
# # one or more changes
|
1058
|
-
# ]
|
1059
|
-
#
|
1060
|
-
# The result of this will be either of the following.
|
1061
|
-
#
|
1062
|
-
# [ # patchset
|
1063
|
-
# Diff::LCS::ContextChange # one or more changes
|
1064
|
-
# ]
|
1065
|
-
#
|
1066
|
-
# [ # patchset
|
1067
|
-
# Diff::LCS::Change # one or more changes
|
1068
|
-
# ]
|
1069
|
-
#
|
1070
|
-
# If either of the above is provided, it will be returned as such.
|
1071
|
-
#
|
1072
|
-
# Note: This will be deprecated as a public function in a future release.
|
1073
|
-
def __normalize_patchset(patchset)
|
1074
|
-
patchset.map do |hunk|
|
1075
|
-
case hunk
|
1076
|
-
when Diff::LCS::ContextChange, Diff::LCS::Change
|
1077
|
-
hunk
|
1078
|
-
when Array
|
1079
|
-
if (not hunk[0].kind_of?(Array)) and hunk[1].kind_of?(Array) and hunk[2].kind_of?(Array)
|
1080
|
-
Diff::LCS::ContextChange.from_a(hunk)
|
1081
|
-
else
|
1082
|
-
hunk.map do |change|
|
1083
|
-
case change
|
1084
|
-
when Diff::LCS::ContextChange, Diff::LCS::Change
|
1085
|
-
change
|
1086
|
-
when Array
|
1087
|
-
# change[1] will ONLY be an array in a ContextChange#to_a call.
|
1088
|
-
# In Change#to_a, it represents the line (singular).
|
1089
|
-
if change[1].kind_of?(Array)
|
1090
|
-
Diff::LCS::ContextChange.from_a(change)
|
1091
|
-
else
|
1092
|
-
Diff::LCS::Change.from_a(change)
|
1093
|
-
end
|
1094
|
-
end
|
1095
|
-
end
|
1096
|
-
end
|
1097
|
-
else
|
1098
|
-
raise ArgumentError, "Cannot normalise a hunk of class #{hunk.class}."
|
1099
|
-
end
|
1100
|
-
end.flatten
|
1101
|
-
end
|
800
|
+
# Given a set of patchset, convert the current version to the next
|
801
|
+
# version. Does no auto-discovery.
|
802
|
+
def patch!(src, patchset)
|
803
|
+
patch(src, patchset, :patch)
|
1102
804
|
end
|
1103
805
|
end
|
1104
|
-
|
1105
|
-
# vim: ft=ruby
|