MediaWiki REL1_39
TextSlotDiffRenderer.php
Go to the documentation of this file.
1<?php
26use Wikimedia\Assert\Assert;
27
39
/** Use the PHP diff implementation (DiffEngine). */
41 public const ENGINE_PHP = 'php';
42
/** Use the wikidiff2 PHP module. */
44 public const ENGINE_WIKIDIFF2 = 'wikidiff2';
45
/** Use the wikidiff2 PHP module's inline output (wikidiff2_inline_diff). */
47 public const ENGINE_WIKIDIFF2_INLINE = 'wikidiff2inline';
48
/** Use an external executable. */
50 public const ENGINE_EXTERNAL = 'external';
51
/** @var IBufferingStatsdDataFactory|null Receives 'diff_time' timings; unset until setStatsdDataFactory() is called */
53 private $statsdDataFactory;
54
/** @var Language|null Used by the PHP engine to segment/unsegment text; unset until setLanguage() is called */
56 private $language;
57
/** @var string One of the ENGINE_* constants; the PHP engine is the default */
59 private $engine = self::ENGINE_PHP;
60
/** @var string|null Executable path stored by setEngine(); only non-null for ENGINE_EXTERNAL */
62 private $externalEngine;
63
/**
 * Return any extra keys to split the diff cache by.
 *
 * @return string[] Empty unless the inline wikidiff2 engine is selected.
 */
public function getExtraCacheKeys() {
	if ( $this->engine !== self::ENGINE_WIKIDIFF2_INLINE ) {
		return [];
	}

	// Tell DifferenceEngine this is a different variant from the standard wikidiff2 variant
	return [ phpversion( 'wikidiff2' ), 'inline' ];
}
71
/**
 * Convenience helper to use getTextDiff without an instance.
 *
 * Looks up the slot diff renderer of the plain-text content handler for the
 * main request context and delegates to its getTextDiff().
 *
 * @param string $oldText
 * @param string $newText
 * @return string Whatever getTextDiff() produces for the two texts
 */
public static function diff( $oldText, $newText ) {
	$textHandler = MediaWikiServices::getInstance()
		->getContentHandlerFactory()
		->getContentHandler( CONTENT_MODEL_TEXT );
	$slotDiffRenderer = $textHandler->getSlotDiffRenderer( RequestContext::getMain() );
	'@phan-var TextSlotDiffRenderer $slotDiffRenderer';

	return $slotDiffRenderer->getTextDiff( $oldText, $newText );
}
87
/**
 * Inject the stats factory that getTextDiff() reports 'diff_time' timings to.
 *
 * @param IBufferingStatsdDataFactory $statsdDataFactory
 */
public function setStatsdDataFactory( IBufferingStatsdDataFactory $statsdDataFactory ) {
	$this->statsdDataFactory = $statsdDataFactory;
}
94
/**
 * Inject the language object the PHP engine uses to segment text before
 * diffing and to unsegment the formatted result.
 *
 * @param Language $language
 */
public function setLanguage( Language $language ) {
	$this->language = $language;
}
101
/**
 * Set which diff engine to use.
 *
 * @param string $type One of the ENGINE_* constants.
 * @param string|null $executable Path to an external executable; required when
 *   $type is ENGINE_EXTERNAL and must be null otherwise.
 */
public function setEngine( $type, $executable = null ) {
	// The whitelist must be defined locally: in_array() on an undefined
	// variable can never validate $type.
	$engines = [
		self::ENGINE_PHP,
		self::ENGINE_WIKIDIFF2,
		self::ENGINE_WIKIDIFF2_INLINE,
		self::ENGINE_EXTERNAL,
	];
	Assert::parameter( in_array( $type, $engines, true ), '$type',
		'must be one of the TextSlotDiffRenderer::ENGINE_* constants' );
	if ( $type === self::ENGINE_EXTERNAL ) {
		Assert::parameter( is_string( $executable ) && is_executable( $executable ), '$executable',
			'must be a path to a valid executable' );
	} else {
		Assert::parameter( $executable === null, '$executable',
			'must not be set unless $type is ENGINE_EXTERNAL' );
	}
	$this->engine = $type;
	$this->externalEngine = $executable;
}
122
/**
 * Get a diff between two content objects.
 *
 * Both arguments are first passed through normalizeContents() (restricted to
 * TextContent), then serialized and handed to getTextDiff().
 *
 * @param Content|null $oldContent
 * @param Content|null $newContent
 * @return string Whatever getTextDiff() produces for the serialized texts
 */
public function getDiff( Content $oldContent = null, Content $newContent = null ) {
	$this->normalizeContents( $oldContent, $newContent, TextContent::class );

	return $this->getTextDiff(
		$oldContent->serialize(),
		$newContent->serialize()
	);
}
132
/**
 * Diff the text representations of two content objects (or just two pieces of text in general).
 *
 * The diff is timed and, when a stats factory has been injected, the elapsed
 * milliseconds are reported as 'diff_time'. Inputs whose combined byte length
 * exceeds 20000 are run through a 'diff' PoolCounter keyed on the md5 of both texts.
 *
 * @param string $oldText
 * @param string $newText
 * @return string The diff as produced by getTextDiffInternal(), or the pool work result
 */
public function getTextDiff( string $oldText, string $newText ) {
	$timedDiff = function () use ( $oldText, $newText ) {
		$startedAt = microtime( true );
		$output = $this->getTextDiffInternal( $oldText, $newText );
		$elapsedMs = intval( ( microtime( true ) - $startedAt ) * 1000 );

		if ( $this->statsdDataFactory ) {
			$this->statsdDataFactory->timing( 'diff_time', $elapsedMs );
		}

		// TODO reimplement this using T142313
		/*
		// Log requests slower than 99th percentile
		if ( $time > 100 && $this->mOldPage && $this->mNewPage ) {
			wfDebugLog( 'diff',
				"$time ms diff: {$this->mOldid} -> {$this->mNewid} {$this->mNewPage}" );
		}
		*/

		return $output;
	};

	// Cheap case: small inputs are diffed directly, without a PoolCounter
	if ( strlen( $oldText ) + strlen( $newText ) <= 20000 ) {
		return $timedDiff();
	}

	// Pool errors are turned into a FatalError carrying the status wikitext
	$onPoolError = static function ( $status ) {
		throw new FatalError( $status->getWikiText() );
	};

	// Use PoolCounter if the diff looks like it can be expensive
	$poolKey = md5( $oldText ) . md5( $newText );
	$work = new PoolCounterWorkViaCallback(
		'diff',
		$poolKey,
		[ 'doWork' => $timedDiff, 'error' => $onPoolError ]
	);

	return $work->execute();
}
182
/**
 * Diff the text representations of two content objects (or just two pieces of text in general).
 *
 * Windows line endings are normalized to "\n" before the configured engine runs.
 *
 * @param string $oldText
 * @param string $newText
 * @return string Diff output of the selected engine
 * @throws Exception If the external engine's temporary files cannot be created
 *   or the external command exits with a non-zero code
 * @throws LogicException If the configured engine is not one of the ENGINE_* constants
 */
protected function getTextDiffInternal( $oldText, $newText ) {
	// TODO move most of this into three parallel implementations of a text diff generator
	// class, choose which one to use via dependency injection

	$oldText = str_replace( "\r\n", "\n", $oldText );
	$newText = str_replace( "\r\n", "\n", $newText );

	// Better external diff engine, the 2 may some day be dropped
	// This one does the escaping and segmenting itself
	if ( $this->engine === self::ENGINE_WIKIDIFF2 ) {
		$wikidiff2Version = phpversion( 'wikidiff2' );
		if (
			$wikidiff2Version !== false &&
			version_compare( $wikidiff2Version, '1.5.0', '>=' ) &&
			version_compare( $wikidiff2Version, '1.8.0', '<' )
		) {
			return wikidiff2_do_diff( $oldText, $newText, 2, 0 );
		}

		// Don't pass the 4th parameter introduced in version 1.5.0 and removed in version 1.8.0
		return wikidiff2_do_diff( $oldText, $newText, 2 );
	}

	if ( $this->engine === self::ENGINE_EXTERNAL ) {
		# Diff via the shell
		$tmpDir = wfTempDir();
		$tempNames = [];
		try {
			foreach ( [ $oldText, $newText ] as $text ) {
				$tempName = tempnam( $tmpDir, 'diff_' );
				if ( $tempName === false ) {
					throw new Exception( "Could not create temporary file in $tmpDir for external diffing" );
				}
				// Record the name before opening so the finally block removes
				// the file even when a later step fails.
				$tempNames[] = $tempName;

				$tempFile = fopen( $tempName, "w" );
				if ( !$tempFile ) {
					throw new Exception( "Could not create temporary file $tempName for external diffing" );
				}
				fwrite( $tempFile, $text );
				fclose( $tempFile );
			}

			$cmd = [ $this->externalEngine, $tempNames[0], $tempNames[1] ];
			$result = Shell::command( $cmd )
				->execute();
			$exitCode = $result->getExitCode();
			if ( $exitCode !== 0 ) {
				throw new Exception( "External diff command returned code {$exitCode}. Stderr: "
					. wfEscapeWikiText( $result->getStderr() )
				);
			}

			return $result->getStdout();
		} finally {
			// Always clean up, including on the exception paths above
			foreach ( $tempNames as $tempName ) {
				unlink( $tempName );
			}
		}
	}

	if ( $this->engine === self::ENGINE_PHP ) {
		if ( $this->language ) {
			$oldText = $this->language->segmentForDiff( $oldText );
			$newText = $this->language->segmentForDiff( $newText );
		}
		$ota = explode( "\n", $oldText );
		$nta = explode( "\n", $newText );
		$diffs = new Diff( $ota, $nta );
		$formatter = new TableDiffFormatter();
		$difftext = $formatter->format( $diffs );
		if ( $this->language ) {
			$difftext = $this->language->unsegmentForDiff( $difftext );
		}

		return $difftext;
	}

	if ( $this->engine === self::ENGINE_WIKIDIFF2_INLINE ) {
		// Note wikidiff2_inline_diff returns an element sans table.
		// Due to the way other diffs work (return a table with before and after), we need to wrap
		// the output in a row that spans the 4 columns that are expected, so that our diff appears in
		// the correct place!
		return '<tr><td colspan="4">' . wikidiff2_inline_diff( $oldText, $newText, 2 ) . '</td></tr>';
	}

	throw new LogicException( 'Invalid engine: ' . $this->engine );
}
280
281}
const CONTENT_MODEL_TEXT
Definition Defines.php:214
wfTempDir()
Tries to get the system directory for temporary files.
wfEscapeWikiText( $text)
Escapes the given text so that it may be output using addWikiText() without any linking,...
Class representing a 'diff' between two sequences of strings.
Definition Diff.php:32
Abort the web request with a custom HTML string that will represent the entire response.
Base class for language-specific code.
Definition Language.php:53
Service locator for MediaWiki core services.
Executes shell commands.
Definition Shell.php:46
Convenience class for dealing with PoolCounters using callbacks.
Renders a diff for a single slot (that is, a diff between two content objects).
normalizeContents(Content &$oldContent=null, Content &$newContent=null, $allowedClasses=null)
Helper method to normalize the input of getDiff().
MediaWiki default table style diff formatter.
Renders a slot diff by doing a text diff on the native representation.
setStatsdDataFactory(IBufferingStatsdDataFactory $statsdDataFactory)
setEngine( $type, $executable=null)
Set which diff engine to use.
const ENGINE_PHP
Use the PHP diff implementation (DiffEngine).
const ENGINE_EXTERNAL
Use an external executable.
getTextDiffInternal( $oldText, $newText)
Diff the text representations of two content objects (or just two pieces of text in general).
const ENGINE_WIKIDIFF2
Use the wikidiff2 PHP module.
getDiff(Content $oldContent=null, Content $newContent=null)
Get a diff between two content objects. One of them might be null (meaning a slot was created or remov...
setLanguage(Language $language)
getExtraCacheKeys()
Return any extra keys to split the diff cache by. Stable to override. Returns string[].
getTextDiff(string $oldText, string $newText)
Diff the text representations of two content objects (or just two pieces of text in general).
const ENGINE_WIKIDIFF2_INLINE
Use the wikidiff2 PHP module.
static diff( $oldText, $newText)
Convenience helper to use getTextDiff without an instance.
Base interface for content objects.
Definition Content.php:35
MediaWiki adaptation of StatsdDataFactory that provides buffering functionality.