Viewing file: Differ.php (6.96 KB) -rw-r--r-- Select action/file-type: (+) | (+) | (+) | Code (+) | Session (+) | (+) | SDB (+) | (+) | (+) | (+) | (+) | (+) |
<?php /* * This file is part of the Diff package. * * (c) Sebastian Bergmann <sebastian@phpunit.de> * * For the full copyright and license information, please view the LICENSE * file that was distributed with this source code. */
namespace SebastianBergmann\Diff;
use SebastianBergmann\Diff\LCS\LongestCommonSubsequence; use SebastianBergmann\Diff\LCS\TimeEfficientImplementation; use SebastianBergmann\Diff\LCS\MemoryEfficientImplementation;
/** * Diff implementation. */ class Differ { /** * @var string */ private $header;
/** * @var bool */ private $showNonDiffLines;
/** * @param string $header */ public function __construct($header = "--- Original\n+++ New\n", $showNonDiffLines = true) { $this->header = $header; $this->showNonDiffLines = $showNonDiffLines; }
/** * Returns the diff between two arrays or strings as string. * * @param array|string $from * @param array|string $to * @param LongestCommonSubsequence $lcs * * @return string */ public function diff($from, $to, LongestCommonSubsequence $lcs = null) { if (!is_array($from) && !is_string($from)) { $from = (string) $from; }
if (!is_array($to) && !is_string($to)) { $to = (string) $to; }
$buffer = $this->header; $diff = $this->diffToArray($from, $to, $lcs);
$inOld = false; $i = 0; $old = array();
foreach ($diff as $line) { if ($line[1] === 0 /* OLD */) { if ($inOld === false) { $inOld = $i; } } elseif ($inOld !== false) { if (($i - $inOld) > 5) { $old[$inOld] = $i - 1; }
$inOld = false; }
++$i; }
$start = isset($old[0]) ? $old[0] : 0; $end = count($diff);
if ($tmp = array_search($end, $old)) { $end = $tmp; }
$newChunk = true;
for ($i = $start; $i < $end; $i++) { if (isset($old[$i])) { $buffer .= "\n"; $newChunk = true; $i = $old[$i]; }
if ($newChunk) { if ($this->showNonDiffLines === true) { $buffer .= "@@ @@\n"; } $newChunk = false; }
if ($diff[$i][1] === 1 /* ADDED */) { $buffer .= '+' . $diff[$i][0] . "\n"; } elseif ($diff[$i][1] === 2 /* REMOVED */) { $buffer .= '-' . $diff[$i][0] . "\n"; } elseif ($this->showNonDiffLines === true) { $buffer .= ' ' . $diff[$i][0] . "\n"; } }
return $buffer; }
/** * Returns the diff between two arrays or strings as array. * * Each array element contains two elements: * - [0] => string $token * - [1] => 2|1|0 * * - 2: REMOVED: $token was removed from $from * - 1: ADDED: $token was added to $from * - 0: OLD: $token is not changed in $to * * @param array|string $from * @param array|string $to * @param LongestCommonSubsequence $lcs * * @return array */ public function diffToArray($from, $to, LongestCommonSubsequence $lcs = null) { preg_match_all('(\r\n|\r|\n)', $from, $fromMatches); preg_match_all('(\r\n|\r|\n)', $to, $toMatches);
if (is_string($from)) { $from = preg_split('(\r\n|\r|\n)', $from); }
if (is_string($to)) { $to = preg_split('(\r\n|\r|\n)', $to); }
$start = array(); $end = array(); $fromLength = count($from); $toLength = count($to); $length = min($fromLength, $toLength);
for ($i = 0; $i < $length; ++$i) { if ($from[$i] === $to[$i]) { $start[] = $from[$i]; unset($from[$i], $to[$i]); } else { break; } }
$length -= $i;
for ($i = 1; $i < $length; ++$i) { if ($from[$fromLength - $i] === $to[$toLength - $i]) { array_unshift($end, $from[$fromLength - $i]); unset($from[$fromLength - $i], $to[$toLength - $i]); } else { break; } }
if ($lcs === null) { $lcs = $this->selectLcsImplementation($from, $to); }
$common = $lcs->calculate(array_values($from), array_values($to)); $diff = array();
if (isset($fromMatches[0]) && $toMatches[0] && count($fromMatches[0]) === count($toMatches[0]) && $fromMatches[0] !== $toMatches[0]) { $diff[] = array( '#Warning: Strings contain different line endings!', 0 ); }
foreach ($start as $token) { $diff[] = array($token, 0 /* OLD */); }
reset($from); reset($to);
foreach ($common as $token) { while ((($fromToken = reset($from)) !== $token)) { $diff[] = array(array_shift($from), 2 /* REMOVED */); }
while ((($toToken = reset($to)) !== $token)) { $diff[] = array(array_shift($to), 1 /* ADDED */); }
$diff[] = array($token, 0 /* OLD */);
array_shift($from); array_shift($to); }
while (($token = array_shift($from)) !== null) { $diff[] = array($token, 2 /* REMOVED */); }
while (($token = array_shift($to)) !== null) { $diff[] = array($token, 1 /* ADDED */); }
foreach ($end as $token) { $diff[] = array($token, 0 /* OLD */); }
return $diff; }
/** * @param array $from * @param array $to * * @return LongestCommonSubsequence */ private function selectLcsImplementation(array $from, array $to) { // We do not want to use the time-efficient implementation if its memory // footprint will probably exceed this value. Note that the footprint // calculation is only an estimation for the matrix and the LCS method // will typically allocate a bit more memory than this. $memoryLimit = 100 * 1024 * 1024;
if ($this->calculateEstimatedFootprint($from, $to) > $memoryLimit) { return new MemoryEfficientImplementation; }
return new TimeEfficientImplementation; }
/** * Calculates the estimated memory footprint for the DP-based method. * * @param array $from * @param array $to * * @return int */ private function calculateEstimatedFootprint(array $from, array $to) { $itemSize = PHP_INT_SIZE == 4 ? 76 : 144;
return $itemSize * pow(min(count($from), count($to)), 2); } }
|