getChangeSetFromEmptyLeft( $right ); } $diffs = new Diff( explode( "\n", $left ), explode( "\n", $right ) ); $format = new UnifiedDiffFormatter(); $diff = $format->format( $diffs ); return $this->parse( $diff, $left, $right ); } /** * If we add content to an empty page the changeSet can be composed straightaway * * @param string $right * @return array[] see getChangeSet() */ private function getChangeSetFromEmptyLeft( $right ) { $rightLines = explode( "\n", $right ); return [ '_info' => [ 'lhs-length' => 1, 'rhs-length' => count( $rightLines ), 'lhs' => [ '' ], 'rhs' => $rightLines ], [ 'right-pos' => 1, 'left-pos' => 1, 'action' => 'add', 'content' => $right, ] ]; } /** * Duplicates the check from the global wfDiff function to determine * if we are using internal or external diff utilities * * @deprecated since 1.29, the internal diff parser is always used */ protected static function usingInternalDiff() { return true; } /** * Parse the unified diff output into an array of changes to individual groups of the text * * @param string $diff The unified diff output * @param string $left The left side of the diff used for sanity checks * @param string $right The right side of the diff used for sanity checks * * @return array[] */ protected function parse( $diff, $left, $right ) { $this->left = explode( "\n", $left ); $this->right = explode( "\n", $right ); $diff = explode( "\n", $diff ); $this->leftPos = 0; $this->rightPos = 0; $this->changeSet = [ '_info' => [ 'lhs-length' => count( $this->left ), 'rhs-length' => count( $this->right ), 'lhs' => $this->left, 'rhs' => $this->right, ], ]; $change = null; foreach ( $diff as $line ) { $change = $this->parseLine( $line, $change ); } if ( $change === null ) { return $this->changeSet; } else { return array_merge( $this->changeSet, $change->getChangeSet() ); } } /** * Parse the next line of the unified diff output * * @param string $line The next line of the unified diff * @param EchoDiffGroup $change Changes the the immediately previous lines * * @throws MWException * @return EchoDiffGroup Changes to this line and any changed lines immediately previous */ protected function parseLine( $line, EchoDiffGroup $change = null ) { if ( $line ) { $op = $line[0]; if ( strlen( $line ) > $this->prefixLength ) { $line = substr( $line, $this->prefixLength ); } else { $line = ''; } } else { $op = ' '; } switch ( $op ) { case '@': // metadata if ( $change !== null ) { $this->changeSet = array_merge( $this->changeSet, $change->getChangeSet() ); $change = null; } // @@ -start,numLines +start,numLines @@ list( , $left, $right ) = explode( ' ', $line ); list( $this->leftPos ) = explode( ',', substr( $left, 1 ) ); list( $this->rightPos ) = explode( ',', substr( $right, 1 ) ); // -1 because diff is 1 indexed and we are 0 indexed $this->leftPos--; $this->rightPos--; break; case ' ': // No changes if ( $change !== null ) { $this->changeSet = array_merge( $this->changeSet, $change->getChangeSet() ); $change = null; } $this->leftPos++; $this->rightPos++; break; case '-': // subtract if ( $this->left[$this->leftPos] !== $line ) { throw new MWException( 'Positional error: left' ); } if ( $change === null ) { $change = new EchoDiffGroup( $this->leftPos, $this->rightPos ); } $change->subtract( $line ); $this->leftPos++; break; case '+': // add if ( $this->right[$this->rightPos] !== $line ) { throw new MWException( 'Positional error: right' ); } if ( $change === null ) { $change = new EchoDiffGroup( $this->leftPos, $this->rightPos ); } $change->add( $line ); $this->rightPos++; break; default: throw new MWException( 'Unknown Diff Operation: ' . $op ); } return $change; } } /** * Represents a single set of changes all effecting neighboring lines */ class EchoDiffGroup { /** * @var array The left and right position this change starts at */ protected $position; /** * @var array The lines that have been added */ protected $new = []; /** * @var array The lines that have been removed */ protected $old = []; /** * @param integer $leftPos The starting line number in the left text * @param integer $rightPos The starting line number in the right text */ public function __construct( $leftPos, $rightPos ) { // +1 due to the origional code use 1 indexing for this result $this->position = [ 'right-pos' => $rightPos + 1, 'left-pos' => $leftPos + 1, ]; } /** * @param string $line Line in the right text but not in the left */ public function add( $line ) { $this->new[] = $line; } /** * @param string $line Line in the left text but not in the right */ public function subtract( $line ) { $this->old[] = $line; } /** * @return array[] set of changes * Each change consists of: * An 'action', one of: * - add * - subtract * - change * 'content' that was added or removed, or in the case * of a change, 'old_content' and 'new_content' * 'left_pos' and 'right_pos' (in 1-indexed lines) of the change. */ public function getChangeSet() { $old = implode( "\n", $this->old ); $new = implode( "\n", $this->new ); $position = $this->position; $changeSet = []; // The implodes must come first because we consider array( '' ) to also be false // meaning a blank link replaced with content is an addition if ( $old && $new ) { $min = min( count( $this->old ), count( $this->new ) ); $changeSet[] = $position + [ 'action' => 'change', 'old_content' => implode( "\n", array_slice( $this->old, 0, $min ) ), 'new_content' => implode( "\n", array_slice( $this->new, 0, $min ) ), ]; $position['left-pos'] += $min; $position['right-pos'] += $min; $old = implode( "\n", array_slice( $this->old, $min ) ); $new = implode( "\n", array_slice( $this->new, $min ) ); } if ( $new ) { $changeSet[] = $position + [ 'action' => 'add', 'content' => $new, ]; } elseif ( $old ) { $changeSet[] = $position + [ 'action' => 'subtract', 'content' => $old, ]; } return $changeSet; } }