summaryrefslogtreecommitdiff
path: root/lib/diff/lcs/callbacks.rb
diff options
context:
space:
mode:
authorAustin Ziegler <austin@halostatue.ca>2011-07-30 19:40:23 -0400
committerAustin Ziegler <austin@halostatue.ca>2011-07-30 19:40:23 -0400
commit9feacf82a4859362662c05ffaaeaf26b40a36018 (patch)
tree57be359c74bcdabd2510835f5568b64ba61f769d /lib/diff/lcs/callbacks.rb
parentca444f81819ee49d3a174271dbca75061a4067f5 (diff)
downloaddiff-lcs-9feacf82a4859362662c05ffaaeaf26b40a36018.tar.gz
Converting diff-lcs from svn to git format.
Diffstat (limited to 'lib/diff/lcs/callbacks.rb')
-rw-r--r--lib/diff/lcs/callbacks.rb322
1 files changed, 322 insertions, 0 deletions
diff --git a/lib/diff/lcs/callbacks.rb b/lib/diff/lcs/callbacks.rb
new file mode 100644
index 0000000..74a1cdc
--- /dev/null
+++ b/lib/diff/lcs/callbacks.rb
@@ -0,0 +1,322 @@
+#!/usr/bin/env ruby
+#--
+# Copyright 2004 Austin Ziegler <diff-lcs@halostatue.ca>
+# adapted from:
+# Algorithm::Diff (Perl) by Ned Konz <perl@bike-nomad.com>
+# Smalltalk by Mario I. Wolczko <mario@wolczko.com>
+# implements McIlroy-Hunt diff algorithm
+#
+# This program is free software. It may be redistributed and/or modified under
+# the terms of the GPL version 2 (or later), the Perl Artistic licence, or the
+# Ruby licence.
+#
+# $Id$
+#++
+# Contains definitions for all default callback objects.
+
+require 'diff/lcs/change'
+
+module Diff::LCS
+ # This callback object implements the default set of callback events, each
+ # of which just returns the event itself. Note that #finished_a and #finished_b
+ # are not implemented -- I haven't yet figured out where they would be useful.
+ #
+ # The class itself is the callback object (.new is private), so pass it as is, e.g.,
+ #
+ # Diff::LCS.LCS(seq1, seq2, Diff::LCS::DefaultCallbacks)
+ class DefaultCallbacks
+ class << self
+ # Called when two items match. Returns +event+ as is.
+ def match(event)
+ event
+ end
+ # Called when the old value is discarded in favour of the new value. Returns +event+ as is.
+ def discard_a(event)
+ event
+ end
+ # Called when the new value is discarded in favour of the old value. Returns +event+ as is.
+ def discard_b(event)
+ event
+ end
+ # Called when both the old and new values have changed. Returns +event+ as is.
+ def change(event)
+ event
+ end
+
+ private :new # makes DefaultCallbacks.new private; the class is not meant to be instantiated
+ end
+ end
+
+ # An alias for DefaultCallbacks that is used in Diff::LCS#traverse_sequences.
+ #
+ # Diff::LCS.LCS(seq1, seq2, Diff::LCS::SequenceCallbacks)
+ SequenceCallbacks = DefaultCallbacks
+ # An alias for DefaultCallbacks that is used in Diff::LCS#traverse_balanced.
+ #
+ # Diff::LCS.LCS(seq1, seq2, Diff::LCS::BalancedCallbacks)
+ BalancedCallbacks = DefaultCallbacks
+end
+
+ # This will produce a compound array of simple diff change objects. Each
+ # element in the #diffs array is a +hunk+ (a +hunk+ array), where each
+ # element in each +hunk+ array is a single Change object representing the
+ # addition or removal of a single element from one of the two tested
+ # sequences. The +hunk+ provides the full context for the changes.
+ #
+ # diffs = Diff::LCS.diff(seq1, seq2)
+ # # This example shows a simplified array format.
+ # # [ [ [ '-', 0, 'a' ] ], # 1
+ # # [ [ '+', 2, 'd' ] ], # 2
+ # # [ [ '-', 4, 'h' ], # 3
+ # # [ '+', 4, 'f' ] ],
+ # # [ [ '+', 6, 'k' ] ], # 4
+ # # [ [ '-', 8, 'n' ], # 5
+ # # [ '-', 9, 'p' ],
+ # # [ '+', 9, 'r' ],
+ # # [ '+', 10, 's' ],
+ # # [ '+', 11, 't' ] ] ]
+ #
+ # There are five hunks here. The first hunk says that the +a+ at position 0
+ # of the first sequence should be deleted (<tt>'-'</tt>). The second hunk
+ # says that the +d+ at position 2 of the second sequence should be inserted
+ # (<tt>'+'</tt>). The third hunk says that the +h+ at position 4 of the
+ # first sequence should be removed and replaced with the +f+ from position 4
+ # of the second sequence. The other two hunks are described similarly.
+ #
+ # === Use
+ # This callback object must be initialised and is used by the Diff::LCS#diff
+ # method.
+ #
+ # cbo = Diff::LCS::DiffCallbacks.new
+ # Diff::LCS.LCS(seq1, seq2, cbo)
+ # cbo.finish
+ #
+ # Note that the call to #finish is absolutely necessary, or the last set of
+ # changes will not be visible. Alternatively, it can be used as:
+ #
+ # cbo = Diff::LCS::DiffCallbacks.new { |tcbo| Diff::LCS.LCS(seq1, seq2, tcbo) }
+ #
+ # The necessary #finish call will be made.
+ #
+ # === Simplified Array Format
+ # The simplified array format used in the example above can be obtained
+ # with:
+ #
+ # require 'pp'
+ # pp diffs.map { |e| e.map { |f| f.to_a } }
+class Diff::LCS::DiffCallbacks
+ # Returns the collected difference set: an array of hunks (arrays of Change objects).
+ attr_reader :diffs
+
+ def initialize # :yields self:
+ @hunk = [] # changes accumulated since the last match (the working hunk)
+ @diffs = [] # completed hunks
+
+ if block_given?
+ begin
+ yield self
+ ensure
+ self.finish # runs even if the block raises, so the last hunk is not lost
+ end
+ end
+ end
+
+ # Finalizes the diff process. If an unprocessed (non-empty) hunk still exists,
+ # it is appended to #diffs; the working hunk is then reset.
+ def finish
+ add_nonempty_hunk
+ end
+
+ def match(event)
+ add_nonempty_hunk # a match ends the current run of changes (+event+ is unused)
+ end
+
+ def discard_a(event)
+ @hunk << Diff::LCS::Change.new('-', event.old_position, event.old_element)
+ end
+
+ def discard_b(event)
+ @hunk << Diff::LCS::Change.new('+', event.new_position, event.new_element)
+ end
+
+private
+ def add_nonempty_hunk
+ @diffs << @hunk unless @hunk.empty? # empty hunks are never recorded
+ @hunk = [] # a new array, because the old one may now be referenced from @diffs
+ end
+end
+
+ # This will produce a compound array of contextual diff change objects. Each
+ # element in the #diffs array is a "hunk" array, where each element in each
+ # "hunk" array is a single change. Each change is a Diff::LCS::ContextChange
+ # that contains both the old index and new index values for the change. The
+ # "hunk" provides the full context for the changes. Both old and new objects
+ # will be presented for changed objects. +nil+ will be substituted for a
+ # discarded object.
+ #
+ # seq1 = %w(a b c e h j l m n p)
+ # seq2 = %w(b c d e f j k l m r s t)
+ #
+ # diffs = Diff::LCS.diff(seq1, seq2, Diff::LCS::ContextDiffCallbacks)
+ # # This example shows a simplified array format.
+ # # [ [ [ '-', [ 0, 'a' ], [ 0, nil ] ] ], # 1
+ # # [ [ '+', [ 3, nil ], [ 2, 'd' ] ] ], # 2
+ # # [ [ '-', [ 4, 'h' ], [ 4, nil ] ], # 3
+ # # [ '+', [ 5, nil ], [ 4, 'f' ] ] ],
+ # # [ [ '+', [ 6, nil ], [ 6, 'k' ] ] ], # 4
+ # # [ [ '-', [ 8, 'n' ], [ 9, nil ] ], # 5
+ # # [ '+', [ 9, nil ], [ 9, 'r' ] ],
+ # # [ '-', [ 9, 'p' ], [ 10, nil ] ],
+ # # [ '+', [ 10, nil ], [ 10, 's' ] ],
+ # # [ '+', [ 10, nil ], [ 11, 't' ] ] ] ]
+ #
+ # The five hunks shown are comprised of individual changes; if there is a
+ # related set of changes, they are still shown individually.
+ #
+ # This callback can also be used with Diff::LCS#sdiff, which will produce
+ # results like:
+ #
+ # diffs = Diff::LCS.sdiff(seq1, seq2, Diff::LCS::ContextDiffCallbacks)
+ # # This example shows a simplified array format.
+ # # [ [ [ "-", [ 0, "a" ], [ 0, nil ] ] ], # 1
+ # # [ [ "+", [ 3, nil ], [ 2, "d" ] ] ], # 2
+ # # [ [ "!", [ 4, "h" ], [ 4, "f" ] ] ], # 3
+ # # [ [ "+", [ 6, nil ], [ 6, "k" ] ] ], # 4
+ # # [ [ "!", [ 8, "n" ], [ 9, "r" ] ], # 5
+ # # [ "!", [ 9, "p" ], [ 10, "s" ] ],
+ # # [ "+", [ 10, nil ], [ 11, "t" ] ] ] ]
+ #
+ # The five hunks are still present, but are significantly shorter in total
+ # presentation, because changed items are shown as changes ("!") instead of
+ # potentially "mismatched" pairs of additions and deletions.
+ #
+ # The result of this operation is similar to that of
+ # Diff::LCS::SDiffCallbacks. They may be compared as:
+ #
+ # s = Diff::LCS.sdiff(seq1, seq2).reject { |e| e.action == "=" }
+ # c = Diff::LCS.sdiff(seq1, seq2, Diff::LCS::ContextDiffCallbacks).flatten
+ #
+ # s == c # -> true
+ #
+ # === Use
+ # This callback object must be initialised and can be used by the
+ # Diff::LCS#diff or Diff::LCS#sdiff methods.
+ #
+ # cbo = Diff::LCS::ContextDiffCallbacks.new
+ # Diff::LCS.LCS(seq1, seq2, cbo)
+ # cbo.finish
+ #
+ # Note that the call to #finish is absolutely necessary, or the last set of
+ # changes will not be visible. Alternatively, it can be used as:
+ #
+ # cbo = Diff::LCS::ContextDiffCallbacks.new { |tcbo| Diff::LCS.LCS(seq1, seq2, tcbo) }
+ #
+ # The necessary #finish call will be made.
+ #
+ # === Simplified Array Format
+ # The simplified array format used in the example above can be obtained
+ # with:
+ #
+ # require 'pp'
+ # pp diffs.map { |e| e.map { |f| f.to_a } }
+class Diff::LCS::ContextDiffCallbacks < Diff::LCS::DiffCallbacks # inherits #diffs, #finish and #match
+ def discard_a(event) # overrides the parent, which stores a '-' Change instead
+ @hunk << Diff::LCS::ContextChange.simplify(event)
+ end
+
+ def discard_b(event) # overrides the parent, which stores a '+' Change instead
+ @hunk << Diff::LCS::ContextChange.simplify(event)
+ end
+
+ def change(event) # not defined by the parent DiffCallbacks
+ @hunk << Diff::LCS::ContextChange.simplify(event)
+ end
+end
+
+ # This will produce a simple array of diff change objects. Each element in
+ # the #diffs array is a single ContextChange. In the set of #diffs provided
+ # by SDiffCallbacks, both old and new objects will be presented for both
+ # changed <strong>and unchanged</strong> objects. +nil+ will be substituted
+ # for a discarded object.
+ #
+ # The diffset produced by this callback, when provided to Diff::LCS#sdiff,
+ # will compute and display the necessary components to show two sequences
+ # and their minimized differences side by side, just like the Unix utility
+ # +sdiff+.
+ #
+ # same same
+ # before | after
+ # old < -
+ # - > new
+ #
+ # seq1 = %w(a b c e h j l m n p)
+ # seq2 = %w(b c d e f j k l m r s t)
+ #
+ # diffs = Diff::LCS.sdiff(seq1, seq2)
+ # # This example shows a simplified array format.
+ # # [ [ "-", [ 0, "a"], [ 0, nil ] ],
+ # # [ "=", [ 1, "b"], [ 0, "b" ] ],
+ # # [ "=", [ 2, "c"], [ 1, "c" ] ],
+ # # [ "+", [ 3, nil], [ 2, "d" ] ],
+ # # [ "=", [ 3, "e"], [ 3, "e" ] ],
+ # # [ "!", [ 4, "h"], [ 4, "f" ] ],
+ # # [ "=", [ 5, "j"], [ 5, "j" ] ],
+ # # [ "+", [ 6, nil], [ 6, "k" ] ],
+ # # [ "=", [ 6, "l"], [ 7, "l" ] ],
+ # # [ "=", [ 7, "m"], [ 8, "m" ] ],
+ # # [ "!", [ 8, "n"], [ 9, "r" ] ],
+ # # [ "!", [ 9, "p"], [ 10, "s" ] ],
+ # # [ "+", [ 10, nil], [ 11, "t" ] ] ]
+ #
+ # The result of this operation is similar to that of
+ # Diff::LCS::ContextDiffCallbacks. They may be compared as:
+ #
+ # s = Diff::LCS.sdiff(seq1, seq2).reject { |e| e.action == "=" }
+ # c = Diff::LCS.sdiff(seq1, seq2, Diff::LCS::ContextDiffCallbacks).flatten
+ #
+ # s == c # -> true
+ #
+ # === Use
+ # This callback object must be initialised and is used by the Diff::LCS#sdiff
+ # method.
+ #
+ # cbo = Diff::LCS::SDiffCallbacks.new
+ # Diff::LCS.LCS(seq1, seq2, cbo)
+ #
+ # As with the other initialisable callback objects, Diff::LCS::SDiffCallbacks
+ # can be initialised with a block. As there is no "finishing" to be done,
+ # this has no effect on the state of the object.
+ #
+ # cbo = Diff::LCS::SDiffCallbacks.new { |tcbo| Diff::LCS.LCS(seq1, seq2, tcbo) }
+ #
+ # === Simplified Array Format
+ # The simplified array format used in the example above can be obtained
+ # with:
+ #
+ # require 'pp'
+ # pp diffs.map { |e| e.to_a }
+class Diff::LCS::SDiffCallbacks
+ # Returns the flat array of entries collected so far, one per callback event (matches included).
+ attr_reader :diffs
+
+ def initialize #:yields self:
+ @diffs = []
+ yield self if block_given? # no finish step follows; events are stored as they arrive
+ end
+
+ def match(event) # unlike DiffCallbacks#match, the matching event is recorded too
+ @diffs << Diff::LCS::ContextChange.simplify(event)
+ end
+
+ def discard_a(event)
+ @diffs << Diff::LCS::ContextChange.simplify(event)
+ end
+
+ def discard_b(event)
+ @diffs << Diff::LCS::ContextChange.simplify(event)
+ end
+
+ def change(event)
+ @diffs << Diff::LCS::ContextChange.simplify(event)
+ end
+end