MediaWiki REL1_33
Go to the documentation of this file.
/** @var DOMDocument Document that the wrapped input text is parsed into by the constructor */
protected $doc;

/** @var DOMXPath XPath evaluator bound to $doc */
protected $xpath;

/** @var bool|null Truthy when the input text could not be parsed as XML */
protected $invalid;

/**
 * @var DOMNode|null First element matched by '//body' in $doc, or null if there is none.
 *
 * Declared explicitly because the constructor assigns it; relying on an
 * undeclared (dynamic) property is deprecated as of PHP 8.2.
 */
protected $body;
/**
 * Parse a fragment, run the requested normalization passes over it and
 * return the serialized result.
 *
 * @param string $text Markup fragment to normalize
 * @param string[] $funcs Names of methods of this class, each invoked in
 *   order with no arguments
 * @return string The serialized result, or $text unchanged when it could
 *   not be parsed
 */
public static function normalize( $text, $funcs ) {
	$normalizer = new self( $text );

	if ( !$normalizer->invalid ) {
		foreach ( $funcs as $methodName ) {
			$normalizer->{$methodName}();
		}
		return $normalizer->serialize();
	}

	// Unparseable input is handed back untouched.
	return $text;
}
/**
 * Parse the fragment into a DOM and locate its <body> wrapper.
 *
 * The text is wrapped in <html><body>...</body></html> before parsing, so
 * the document handed to the XML parser always has a single root element.
 * On a parse failure $this->invalid is set to true; the XPath evaluator is
 * still created so the object is in a consistent state.
 *
 * @param string $text Markup fragment to parse
 */
protected function __construct( $text ) {
	$this->doc = new DOMDocument( '1.0', 'utf-8' );

	// Note: parsing a supposedly XHTML document with an XML parser is not
	// guaranteed to give accurate results. For example, it may introduce
	// differences in the number of line breaks in <pre> tags.

	// Malformed input is an expected case here (it is reported through
	// $this->invalid), so have libxml collect its parse errors internally
	// instead of raising them as PHP warnings.
	$previousSetting = libxml_use_internal_errors( true );
	$loaded = $this->doc->loadXML( '<html><body>' . $text . '</body></html>' );
	if ( !$previousSetting ) {
		// Only discard the buffer when we were the ones who enabled it, so a
		// caller that collects libxml errors itself does not lose them.
		libxml_clear_errors();
	}
	libxml_use_internal_errors( $previousSetting );

	// Always store a real boolean rather than leaving the flag unset on success.
	$this->invalid = !$loaded;

	$this->xpath = new DOMXPath( $this->doc );
	$this->body = $this->xpath->query( '//body' )->item( 0 );
}
/**
 * Unwrap every <tbody> element: its children are moved, in order, to sit
 * directly in its parent at the position the <tbody> occupied, and the
 * emptied <tbody> is then removed.
 */
protected function removeTbody() {
	$sections = $this->xpath->query( '//tbody' );

	foreach ( $sections as $section ) {
		$container = $section->parentNode;

		// Keep hoisting the first remaining child until the section is empty.
		for ( $node = $section->firstChild; $node !== null; $node = $section->firstChild ) {
			$detached = $section->removeChild( $node );
			$container->insertBefore( $detached, $section );
		}

		$container->removeChild( $section );
	}
}
/**
 * Strip insignificant whitespace from every text node in the document.
 *
 * Text whose direct parent is a <pre> element loses at most one leading and
 * one trailing line break; all other text is fully trimmed. Text nodes that
 * end up empty are removed from the tree.
 */
protected function trimWhitespace() {
	foreach ( $this->xpath->query( '//text()' ) as $child ) {
		$data = $child->data;

		if ( strtolower( $child->parentNode->nodeName ) === 'pre' ) {
			// Just trim one line break from the start and end.
			// Each end is tested against exactly one character. Note that
			// substr_compare() without a length argument compares through to
			// the end of the string, so it cannot be used for a prefix test.
			if ( $data !== '' && $data[0] === "\n" ) {
				$data = (string)substr( $data, 1 );
			}
			if ( substr( $data, -1 ) === "\n" ) {
				$data = (string)substr( $data, 0, -1 );
			}
		} else {
			// Trim all whitespace
			$data = trim( $data );
		}

		if ( $data === '' ) {
			$child->parentNode->removeChild( $child );
		} else {
			$child->data = $data;
		}
	}
}
/**
 * Serialize the XML DOM for comparison purposes.
 *
 * The <body> element is serialized and its own tags are stripped from the
 * result, leaving only the markup of its contents.
 *
 * @return string
 */
protected function serialize() {
	return strtr(
		$this->doc->saveXML( $this->body ),
		[
			'<body>' => '',
			'</body>' => '',
			// A body with no children is written as a self-closing tag, which
			// the two entries above do not match.
			'<body/>' => '',
		]
	);
}
and that you know you can do these things. To protect your rights, we need to make restrictions that forbid anyone to deny you these rights or to ask you to surrender the rights. These restrictions translate to certain responsibilities for you if you distribute copies of the software, or if you modify it. For example, if you distribute copies of such a program, whether gratis or for a fee, you must give the recipients all the rights that you have. You must make sure that they, too, receive or can get the source code. And you must show them these terms so they know their rights. We protect your rights with two steps: (1) copyright the software, and (2) offer you this license which gives you legal permission to copy, distribute and/or modify the software.
Serialize the XML DOM for comparison purposes.
The point of this function is to produce a normalized DOM in which Tidy's output matches the output o...