1 | <?php |
||
2 | /** |
||
3 | * (c) Steve Nebes <[email protected]> |
||
4 | * |
||
5 | * For the full copyright and license information, please view the LICENSE |
||
6 | * file that was distributed with this source code. |
||
7 | */ |
||
8 | |||
9 | declare(strict_types=1); |
||
10 | |||
11 | namespace SN\DaisyDiff\RangeDifferencer; |
||
12 | |||
13 | /** |
||
14 | * The algorithm used is an objectified version of one described in: A File Comparison Program, by Webb Miller and |
||
15 | * Eugene W. Myers, Software Practice and Experience, Vol. 15, Nov. 1985. |
||
16 | */ |
||
17 | final class OldDifferencer |
||
18 | { |
||
19 | /** |
||
20 | * Prevent class instantiation. |
||
21 | * |
||
22 | * @codeCoverageIgnore |
||
23 | */ |
||
24 | private function __construct() |
||
25 | { |
||
26 | } |
||
27 | |||
28 | /** |
||
29 | * Finds the differences between two RangeComparatorInterfaces. The differences are returned as an array of |
||
30 | * RangeDifferences. If no differences are detected an empty array is returned. |
||
31 | * |
||
32 | * @param RangeComparatorInterface $left |
||
33 | * @param RangeComparatorInterface $right |
||
34 | * @return RangeDifference[] |
||
35 | */ |
||
36 | 66 | public static function findDifferences(RangeComparatorInterface $left, RangeComparatorInterface $right): array |
|
37 | { |
||
38 | // Assert that both RangeComparatorInterface are of the same class. |
||
39 | 66 | \assert(\get_class($right) === \get_class($left)); |
|
40 | |||
41 | 66 | $rightSize = $right->getRangeCount(); |
|
42 | 66 | $leftSize = $left->getRangeCount(); |
|
43 | |||
44 | // Differences matrix: |
||
45 | // Only the last d of each diagonal is stored, i.e., $lastDiagonal[$k] = row of d |
||
46 | 66 | $diagLen = (int) (2 * \max($rightSize, $leftSize)); |
|
47 | 66 | $maxDiagonal = $diagLen; |
|
48 | |||
49 | /** @var int[] The row containing the last d */ |
||
50 | 66 | $lastDiagonal = \array_fill(0, $diagLen + 1, 0); |
|
51 | |||
52 | // On diagonal $k ($lastDiagonal[$k] = $row |
||
53 | 66 | $origin = (int) ($diagLen / 2); |
|
54 | |||
55 | // Script corresponding to $d[$k] |
||
56 | /** @var LinkedRangeDifference[] $script */ |
||
57 | 66 | $script = \array_fill(0, $diagLen + 1, null); |
|
58 | 66 | $row = 0; |
|
59 | |||
60 | // Find common prefix. |
||
61 | 66 | for (;$row < $rightSize && $row < $leftSize && self::rangesEqual($right, $row, $left, $row);) { |
|
62 | 58 | $row++; |
|
63 | } |
||
64 | |||
65 | 66 | $lastDiagonal[$origin] = $row; |
|
66 | 66 | $script[$origin] = null; |
|
67 | |||
68 | 66 | $lower = ($row === $rightSize) ? $origin + 1 : $origin - 1; |
|
69 | 66 | $upper = ($row === $leftSize) ? $origin - 1 : $origin + 1; |
|
70 | |||
71 | 66 | if ($lower > $upper) { |
|
72 | 42 | return []; |
|
73 | } |
||
74 | |||
75 | // For each value of the edit distance. |
||
76 | 63 | for ($d = 1; $d <= $maxDiagonal; $d++) { |
|
77 | // $d is the current edit distance. |
||
78 | |||
79 | 63 | if ($right->skipRangeComparison($d, $maxDiagonal, $left)) { |
|
80 | // This condition always returns false, so the following code is never executed. |
||
81 | // It should be something we already found. |
||
82 | return []; // @codeCoverageIgnore |
||
83 | } |
||
84 | |||
85 | // For each relevant diagonal (-d, -d+2, ... d-2, d) |
||
86 | 63 | for ($k = $lower; $k <= $upper; $k += 2) { |
|
87 | // $k is the current diagonal. |
||
88 | 63 | if ($k === $origin - $d || $k !== $origin + $d && $lastDiagonal[$k + 1] >= $lastDiagonal[$k - 1]) { |
|
89 | // Move down. |
||
90 | 59 | $row = $lastDiagonal[$k + 1] + 1; |
|
91 | 59 | $edit = new LinkedRangeDifference($script[$k + 1], LinkedRangeDifference::DELETE); |
|
92 | } else { |
||
93 | // Move right. |
||
94 | 54 | $row = $lastDiagonal[$k - 1]; |
|
95 | 54 | $edit = new LinkedRangeDifference($script[$k - 1], LinkedRangeDifference::INSERT); |
|
96 | } |
||
97 | |||
98 | 63 | $col = $row + $k - $origin; |
|
99 | |||
100 | 63 | $edit->setRightStart($row); |
|
101 | 63 | $edit->setLeftStart($col); |
|
102 | |||
103 | 63 | \assert($k >= 0 && $k <= $maxDiagonal); |
|
104 | 63 | $script[$k] = $edit; |
|
105 | |||
106 | // Slide down the diagonal as far as possible. |
||
107 | 63 | while ($row < $rightSize && $col < $leftSize && self::rangesEqual($right, $row, $left, $col)) { |
|
108 | 38 | $row++; |
|
109 | 38 | $col++; |
|
110 | } |
||
111 | |||
112 | // Unreasonable value for diagonal index. |
||
113 | 63 | \assert($k >= 0 && $k <= $maxDiagonal); |
|
114 | 63 | $lastDiagonal[$k] = $row; |
|
115 | |||
116 | 63 | if ($row === $rightSize && $col === $leftSize) { |
|
117 | 63 | return self::createRangeDifferences($script[$k]); |
|
118 | } |
||
119 | |||
120 | 54 | if ($row === $rightSize) { |
|
121 | 30 | $lower = $k + 2; |
|
122 | } |
||
123 | |||
124 | 54 | if ($col === $leftSize) { |
|
125 | 25 | $upper = $k - 2; |
|
126 | } |
||
127 | } |
||
128 | |||
129 | 48 | $lower--; |
|
130 | 48 | $upper++; |
|
131 | } |
||
132 | |||
133 | // Too many differences. |
||
134 | throw new \RuntimeException(); // @codeCoverageIgnore |
||
135 | } |
||
136 | |||
137 | /** |
||
138 | * Tests if two ranges are equal |
||
139 | * |
||
140 | * @param RangeComparatorInterface $a |
||
141 | * @param int $ai |
||
142 | * @param RangeComparatorInterface $b |
||
143 | * @param int $bi |
||
144 | * @return bool |
||
145 | */ |
||
146 | 62 | private static function rangesEqual( |
|
147 | RangeComparatorInterface $a, |
||
148 | int $ai, |
||
149 | RangeComparatorInterface $b, |
||
150 | int $bi |
||
151 | ): bool { |
||
152 | 62 | return $a->rangesEqual($ai, $b, $bi); |
|
153 | } |
||
154 | |||
155 | /** |
||
156 | * Creates a Vector of DifferencesRanges out of the LinkedRangeDifference. It coalesces adjacent changes. In |
||
157 | * addition, indices are changed such that the ranges are 1) open, i.e, the end of the range is not included, and 2) |
||
158 | * are zero based. |
||
159 | * |
||
160 | * @param LinkedRangeDifference $start |
||
161 | * @return RangeDifference[] |
||
162 | */ |
||
163 | 63 | private static function createRangeDifferences(LinkedRangeDifference $start): array |
|
164 | { |
||
165 | 63 | $ep = self::reverseDifferences($start); |
|
166 | 63 | $result = []; |
|
167 | |||
168 | 63 | while (null !== $ep) { |
|
169 | 63 | $es = new RangeDifference(RangeDifference::CHANGE); |
|
170 | |||
171 | 63 | if ($ep->isInsert()) { |
|
172 | 22 | $es->setRightStart($ep->getRightStart() + 1); |
|
173 | 22 | $es->setLeftStart($ep->getLeftStart()); |
|
174 | 22 | $b = $ep; |
|
175 | |||
176 | do { |
||
177 | 22 | $ep = $ep->getNext(); |
|
178 | 22 | $es->setLeftLength($es->getLeftLength() + 1); |
|
179 | 22 | } while (null !== $ep && $ep->isInsert() && $ep->getRightStart() === $b->getRightStart()); |
|
180 | } else { |
||
181 | 50 | $es->setRightStart($ep->getRightStart()); |
|
182 | 50 | $es->setLeftStart($ep->getLeftStart()); |
|
183 | |||
184 | // Deleted lines. |
||
185 | do { |
||
186 | 50 | $a = $ep; |
|
187 | 50 | $ep = $ep->getNext(); |
|
188 | 50 | $es->setRightLength($es->getRightLength() + 1); |
|
189 | 50 | } while (null !== $ep && $ep->isDelete() && $ep->getRightStart() === $a->getRightStart() + 1); |
|
190 | |||
191 | 50 | $change = (null !== $ep && $ep->isInsert() && $ep->getRightStart() === $a->getRightStart()); |
|
192 | |||
193 | 50 | if ($change) { |
|
194 | 27 | $b = $ep; |
|
195 | |||
196 | // Replacement lines. |
||
197 | do { |
||
198 | 27 | $ep = $ep->getNext(); |
|
199 | 27 | $es->setLeftLength($es->getLeftLength() + 1); |
|
200 | 27 | } while (null !== $ep && $ep->isInsert() && $ep->getRightStart() === $b->getRightStart()); |
|
201 | } else { |
||
202 | 31 | $es->setLeftLength(0); |
|
203 | } |
||
204 | |||
205 | // Meaning of range changes from "insert after", to "replace with". |
||
206 | 50 | $es->setLeftStart($es->getLeftStart() + 1); |
|
207 | } |
||
208 | |||
209 | // The script commands are 1 based, subtract one to make them zero based. |
||
210 | 63 | $es->setRightStart($es->getRightStart() - 1); |
|
211 | 63 | $es->setLeftStart($es->getLeftStart() - 1); |
|
212 | |||
213 | 63 | $result[] = $es; |
|
214 | } |
||
215 | |||
216 | 63 | return $result; |
|
217 | } |
||
218 | |||
219 | /** |
||
220 | * Reverses the range differences. |
||
221 | * |
||
222 | * @param LinkedRangeDifference $start |
||
223 | * @return LinkedRangeDifference |
||
224 | */ |
||
225 | 63 | private static function reverseDifferences(LinkedRangeDifference $start): LinkedRangeDifference |
|
226 | { |
||
227 | 63 | $ahead = $start; |
|
228 | 63 | $ep = null; |
|
229 | |||
230 | 63 | while (null !== $ahead) { |
|
231 | 63 | $behind = $ep; |
|
232 | 63 | $ep = $ahead; |
|
233 | 63 | $ahead = $ahead->getNext(); |
|
234 | 63 | $ep->setNext($behind); |
|
235 | } |
||
236 | |||
237 | 63 | return $ep; |
|
0 ignored issues
–
show
Bug
Best Practice
introduced
by
![]() |
|||
238 | } |
||
239 | } |
||
240 |