silverstripe
diff --git a/code/HTML5Value.php b/code/HTML5Value.php
Lines changed: 1 addition & 1 deletion
diff --git a/thirdparty/html5lib-php/bin/html5-parse.php b/thirdparty/html5lib-php/bin/html5-parse.php
Lines changed: 1 addition & 1 deletion
diff --git a/thirdparty/html5lib-php/library/HTML5/Data.php b/thirdparty/html5lib-php/library/HTML5/Data.php
Lines changed: 5 additions & 5 deletions
diff --git a/thirdparty/html5lib-php/library/HTML5/InputStream.php b/thirdparty/html5lib-php/library/HTML5/InputStream.php
Lines changed: 23 additions & 23 deletions
diff --git a/thirdparty/html5lib-php/library/HTML5/Tokenizer.php b/thirdparty/html5lib-php/library/HTML5/Tokenizer.php
Lines changed: 25 additions & 25 deletions
@@ -19,7 +19,7 @@ function ($no, $str) {
 
         // Use HTML5 parser to parse the HTML fragment
         try {
-            $content = str_replace("\r\n", "\n", $content);
+            $content = str_replace("\r\n", "\n", $content ?? '');
             $parserPath = implode(
                 DIRECTORY_SEPARATOR,
                 [
 
@@ -6,5 +6,5 @@
 } else {
     $file = $argv[1];
 }
-$result = HTML5_Parser::parse(file_get_contents($file));
+$result = HTML5_Parser::parse(file_get_contents($file ?? ''));
 // nop
@@ -63,7 +63,7 @@ public static function getRealCodepoint($ref) {
     public static function getNamedCharacterReferences() {
         if (!self::$namedCharacterReferences) {
             self::$namedCharacterReferences = unserialize(
-                file_get_contents(dirname(__FILE__) . '/named-character-references.ser'));
+                file_get_contents(dirname(__FILE__) . '/named-character-references.ser') ?: ''); // failure yields false, not null, so ?? never fires
         }
         return self::$namedCharacterReferences;
     }
@@ -103,10 +103,10 @@ public static function utf8chr($code) {
         }
         // set up the actual character
         $ret = '';
-        if($w) $ret .= chr($w);
-        if($z) $ret .= chr($z);
-        if($y) $ret .= chr($y);
-        $ret .= chr($x);
+        if($w) $ret .= chr($w ?? 0);
+        if($z) $ret .= chr($z ?? 0);
+        if($y) $ret .= chr($y ?? 0);
+        $ret .= chr($x ?? 0);
 
         return $ret;
     }
 
@@ -73,16 +73,16 @@ public function __construct($data) {
         // omitted.
         if (extension_loaded('iconv')) {
             // non-conforming
-            $data = @iconv('UTF-8', 'UTF-8//IGNORE', $data);
+            $data = @iconv('UTF-8', 'UTF-8//IGNORE', $data ?? '');
         } else {
             // we can make a conforming native implementation
             throw new Exception('Not implemented, please install mbstring or iconv');
         }
 
         /* One leading U+FEFF BYTE ORDER MARK character must be
         ignored if any are present. */
-        if (substr($data, 0, 3) === "\xEF\xBB\xBF") {
-            $data = substr($data, 3);
+        if (substr($data ?? '', 0, 3) === "\xEF\xBB\xBF") {
+            $data = substr($data ?? '', 3);
         }
 
         /* All U+0000 NULL characters in the input must be replaced
@@ -112,7 +112,7 @@ public function __construct($data) {
                 "\n",
                 "\n"
             ),
-            $data
+            $data ?? ''
         );
 
         /* Any occurrences of any characters in the ranges U+0001 to
@@ -141,7 +141,7 @@ public function __construct($data) {
                 |
                     [\xF0-\xF4][\x8F-\xBF]\xBF[\xBE\xBF] # U+nFFFE and U+nFFFF (1 <= n <= 10_{16})
                 )/x',
-                $data,
+                $data ?? '',
                 $matches
             );
             for ($i = 0; $i < $count; $i++) {
@@ -156,7 +156,7 @@ public function __construct($data) {
 
         $this->data = $data;
         $this->char = 0;
-        $this->EOF  = strlen($data);
+        $this->EOF  = strlen($data ?? '');
     }
 
     /**
@@ -167,7 +167,7 @@ public function getCurrentLine() {
         if($this->EOF) {
             // Add one to $this->char because we want the number for the next
             // byte to be processed.
-            return substr_count($this->data, "\n", 0, min($this->char, $this->EOF)) + 1;
+            return substr_count($this->data ?? '', "\n", 0, min($this->char, $this->EOF)) + 1;
         } else {
             // If the string is empty, we are on the first line (sorta).
             return 1;
@@ -183,29 +183,29 @@ public function getColumnOffset() {
         // one (to make it point to the next character, the one we want the
         // position of) added to it because strrpos's behaviour includes the
         // final offset byte.
-        $lastLine = strrpos($this->data, "\n", $this->char - 1 - strlen($this->data));
+        $lastLine = strrpos($this->data ?? '', "\n", $this->char - 1 - strlen($this->data ?? ''));
 
         // However, for here we want the length up until the next byte to be
         // processed, so add one to the current byte ($this->char).
         if($lastLine !== false) {
-            $findLengthOf = substr($this->data, $lastLine + 1, $this->char - 1 - $lastLine);
+            $findLengthOf = substr($this->data ?? '', $lastLine + 1, $this->char - 1 - $lastLine);
         } else {
-            $findLengthOf = substr($this->data, 0, $this->char);
+            $findLengthOf = substr($this->data ?? '', 0, $this->char);
         }
 
         // Get the length for the string we need.
         if(extension_loaded('iconv')) {
-            return iconv_strlen($findLengthOf, 'utf-8');
+            return iconv_strlen($findLengthOf ?? '', 'utf-8');
         } elseif(extension_loaded('mbstring')) {
-            return mb_strlen($findLengthOf, 'utf-8');
+            return mb_strlen($findLengthOf ?? '', 'utf-8');
         } elseif(extension_loaded('xml')) {
-            return strlen(utf8_decode($findLengthOf));
+            return strlen(utf8_decode($findLengthOf ?? ''));
         } else {
-            $count = count_chars($findLengthOf);
+            $count = count_chars($findLengthOf ?? '');
             // 0x80 = 0x7F - 0 + 1 (one added to get inclusive range)
             // 0x33 = 0xF4 - 0x2C + 1 (one added to get inclusive range)
-            return array_sum(array_slice($count, 0, 0x80)) +
-                   array_sum(array_slice($count, 0xC2, 0x33));
+            return array_sum(array_slice($count ?? [], 0, 0x80)) +
+                   array_sum(array_slice($count ?? [], 0xC2, 0x33));
         }
     }
 
@@ -225,7 +225,7 @@ public function char() {
      */
     public function remainingChars() {
         if($this->char < $this->EOF) {
-            $data = substr($this->data, $this->char);
+            $data = substr($this->data ?? '', $this->char ?? 0);
             $this->char = $this->EOF;
             return $data;
         } else {
@@ -241,11 +241,11 @@ public function remainingChars() {
     public function charsUntil($bytes, $max = null) {
         if ($this->char < $this->EOF) {
             if ($max === 0 || $max) {
-                $len = strcspn($this->data, $bytes, $this->char, $max);
+                $len = strcspn($this->data ?? '', $bytes ?? '', $this->char ?? 0, $max);
             } else {
-                $len = strcspn($this->data, $bytes, $this->char);
+                $len = strcspn($this->data ?? '', $bytes ?? '', $this->char ?? 0);
             }
-            $string = (string) substr($this->data, $this->char, $len);
+            $string = (string) substr($this->data ?? '', $this->char ?? 0, $len);
             $this->char += $len;
             return $string;
         } else {
@@ -261,11 +261,11 @@ public function charsUntil($bytes, $max = null) {
     public function charsWhile($bytes, $max = null) {
         if ($this->char < $this->EOF) {
             if ($max === 0 || $max) {
-                $len = strspn($this->data, $bytes, $this->char, $max);
+                $len = strspn($this->data ?? '', $bytes ?? '', $this->char ?? 0, $max);
             } else {
-                $len = strspn($this->data, $bytes, $this->char);
+                $len = strspn($this->data ?? '', $bytes ?? '', $this->char ?? 0);
             }
-            $string = (string) substr($this->data, $this->char, $len);
+            $string = (string) substr($this->data ?? '', $this->char ?? 0, $len);
             $this->char += $len;
             return $string;
         } else {
 
@@ -135,7 +135,7 @@ public function parse() {
                     /* Consume the next input character */
                     $char = $this->stream->char();
                     $lastFourChars .= $char;
-                    if (strlen($lastFourChars) > 4) $lastFourChars = substr($lastFourChars, -4);
+                    if (strlen($lastFourChars ?? '') > 4) $lastFourChars = substr($lastFourChars ?? '', -4);
 
                     // see below for meaning
                     $hyp_cond = 
@@ -213,7 +213,7 @@ public function parse() {
                     } elseif(
                         $char === '>' &&
                         $gt_cond &&
-                        substr($lastFourChars, 1) === '-->'
+                        substr($lastFourChars ?? '', 1) === '-->'
                     ) {
                         /* If the content model flag is set to either the RCDATA state or
                         the CDATA state, and the escape flag is true, and the last three
@@ -248,7 +248,7 @@ public function parse() {
                             'data' => $char . $chars
                         ));
                         $lastFourChars .= $chars;
-                        if (strlen($lastFourChars) > 4) $lastFourChars = substr($lastFourChars, -4);
+                        if (strlen($lastFourChars ?? '') > 4) $lastFourChars = substr($lastFourChars ?? '', -4);
 
                     } else {
                         /* Anything else
@@ -274,7 +274,7 @@ public function parse() {
                         ));
 
                         $lastFourChars .= $chars;
-                        if (strlen($lastFourChars) > 4) $lastFourChars = substr($lastFourChars, -4);
+                        if (strlen($lastFourChars ?? '') > 4) $lastFourChars = substr($lastFourChars ?? '', -4);
 
                         $state = 'data';
                     }
@@ -351,7 +351,7 @@ public function parse() {
                                 point), then switch to the tag name state. (Don't emit the token
                                 yet; further details will be filled in before it is emitted.) */
                                 $this->token = array(
-                                    'name'  => strtolower($char),
+                                    'name'  => strtolower($char ?? ''),
                                     'type'  => self::STARTTAG,
                                     'attr'  => array()
                                 );
@@ -427,7 +427,7 @@ public function parse() {
                     ) {
                         /* If the content model flag is set to the RCDATA or CDATA
                         states... */
-                        $name = strtolower($this->stream->charsWhile(self::ALPHA));
+                        $name = strtolower($this->stream->charsWhile(self::ALPHA) ?? '');
                         $following = $this->stream->char();
                         $this->stream->unget();
                         if (
@@ -489,7 +489,7 @@ public function parse() {
                             switch to the tag name state. (Don't emit the token yet; further details
                             will be filled in before it is emitted.) */
                             $this->token = array(
-                                'name'  => strtolower($char),
+                                'name'  => strtolower($char ?? ''),
                                 'type'  => self::ENDTAG
                             );
 
@@ -635,7 +635,7 @@ public function parse() {
                         point), and its value to the empty string. Switch to the
                         attribute name state.*/
                         $this->token['attr'][] = array(
-                            'name'  => strtolower($char),
+                            'name'  => strtolower($char ?? ''),
                             'value' => ''
                         );
 
@@ -716,7 +716,7 @@ public function parse() {
                         state. */
                         $chars = $this->stream->charsWhile(self::UPPER_ALPHA);
 
-                        $last = count($this->token['attr']) - 1;
+                        $last = count($this->token['attr'] ?? []) - 1;
                         $this->token['attr'][$last]['name'] .= strtolower($char . $chars);
 
                         $state = 'attribute name';
@@ -750,7 +750,7 @@ public function parse() {
                         Stay in the attribute name state. */
                         $chars = $this->stream->charsUntil("\t\n\x0C /=>\"'" . self::UPPER_ALPHA);
 
-                        $last = count($this->token['attr']) - 1;
+                        $last = count($this->token['attr'] ?? []) - 1;
                         $this->token['attr'][$last]['name'] .= $char . $chars;
 
                         $state = 'attribute name';
@@ -803,7 +803,7 @@ public function parse() {
                         point), and its value to the empty string. Switch to the
                         attribute name state. */
                         $this->token['attr'][] = array(
-                            'name'  => strtolower($char),
+                            'name'  => strtolower($char ?? ''),
                             'value' => ''
                         );
 
@@ -910,7 +910,7 @@ public function parse() {
                         /* Anything else
                         Append the current input character to the current attribute's value.
                         Switch to the attribute value (unquoted) state. */
-                        $last = count($this->token['attr']) - 1;
+                        $last = count($this->token['attr'] ?? []) - 1;
                         $this->token['attr'][$last]['value'] .= $char;
 
                         $state = 'attribute value (unquoted)';
@@ -950,7 +950,7 @@ public function parse() {
                         Stay in the attribute value (double-quoted) state. */
                         $chars = $this->stream->charsUntil('"&');
 
-                        $last = count($this->token['attr']) - 1;
+                        $last = count($this->token['attr'] ?? []) - 1;
                         $this->token['attr'][$last]['value'] .= $char . $chars;
 
                         $state = 'attribute value (double-quoted)';
@@ -988,7 +988,7 @@ public function parse() {
                         Stay in the attribute value (single-quoted) state. */
                         $chars = $this->stream->charsUntil("'&");
 
-                        $last = count($this->token['attr']) - 1;
+                        $last = count($this->token['attr'] ?? []) - 1;
                         $this->token['attr'][$last]['value'] .= $char . $chars;
 
                         $state = 'attribute value (single-quoted)';
@@ -1049,7 +1049,7 @@ public function parse() {
                         Stay in the attribute value (unquoted) state. */
                         $chars = $this->stream->charsUntil("\t\n\x0c &>\"'=");
 
-                        $last = count($this->token['attr']) - 1;
+                        $last = count($this->token['attr'] ?? []) - 1;
                         $this->token['attr'][$last]['value'] .= $char . $chars;
 
                         $state = 'attribute value (unquoted)';
@@ -1179,7 +1179,7 @@ public function parse() {
                     /* Otherwise if the next seven characters are a case-insensitive match
                     for the word "DOCTYPE", then consume those characters and switch to the
                     DOCTYPE state. */
-                    } elseif(strtoupper($alpha) === 'DOCTYPE') {
+                    } elseif(strtoupper($alpha ?? '') === 'DOCTYPE') {
                         $state = 'DOCTYPE';
 
                     // XXX not implemented
@@ -1526,7 +1526,7 @@ public function parse() {
                         the character's code point). Switch to the DOCTYPE name
                         state. */
                         $this->token = array(
-                            'name' => strtolower($char),
+                            'name' => strtolower($char ?? ''),
                             'type' => self::DOCTYPE,
                             'error' => true
                         );
@@ -1589,7 +1589,7 @@ public function parse() {
                         Append the lowercase version of the input character
                         (add 0x0020 to the character's code point) to the current
                         DOCTYPE token's name. Stay in the DOCTYPE name state. */
-                        $this->token['name'] .= strtolower($char);
+                        $this->token['name'] .= strtolower($char ?? '');
 
                     } elseif($char === false) {
                         /* EOF
@@ -2289,7 +2289,7 @@ private function consumeCharacterReference($allowed = false, $inattr = false) {
             // alphanumeric so we can just concat it to whatever we get later).
             $this->stream->unget();
             if ($char !== false) {
-                $chars = substr($chars, 0, -1);
+                $chars = substr($chars ?? '', 0, -1);
             }
 
             /* If no match can be made, then this is a parse error.
@@ -2305,7 +2305,7 @@ private function consumeCharacterReference($allowed = false, $inattr = false) {
             /* If the last character matched is not a U+003B SEMICOLON
             (;), there is a parse error. */
             $semicolon = true;
-            if (substr($id, -1) !== ';') {
+            if (substr($id ?? '', -1) !== ';') {
                 $this->emitToken(array(
                     'type' => self::PARSEERROR,
                     'data' => 'named-entity-without-semicolon'
@@ -2324,8 +2324,8 @@ private function consumeCharacterReference($allowed = false, $inattr = false) {
             and nothing is returned. */
             if ($inattr && !$semicolon) {
                 // The next character is either the next character in $chars or in the stream.
-                if (strlen($chars) > strlen($id)) {
-                    $next = substr($chars, strlen($id), 1);
+                if (strlen($chars ?? '') > strlen($id ?? '')) {
+                    $next = substr($chars ?? '', strlen($id ?? ''), 1);
                 } else {
                     $next = $this->stream->char();
                     $this->stream->unget();
@@ -2342,7 +2342,7 @@ private function consumeCharacterReference($allowed = false, $inattr = false) {
             /* Otherwise, return a character token for the character
             corresponding to the character reference name (as given
             by the second column of the named character references table). */
-            return HTML5_Data::utf8chr($codepoint) . substr($chars, strlen($id));
+            return HTML5_Data::utf8chr($codepoint) . substr($chars ?? '', strlen($id ?? ''));
         }
     }
 
@@ -2359,7 +2359,7 @@ private function characterReferenceInAttributeValue($allowed = false) {
             ? '&'
             : $entity;
 
-        $last = count($this->token['attr']) - 1;
+        $last = count($this->token['attr'] ?? []) - 1;
         $this->token['attr'][$last]['value'] .= $char;
 
         /* Finally, switch back to the attribute value state that you
@@ -2377,7 +2377,7 @@ protected function emitToken($token, $checkStream = true, $dry = false) {
             }
         }
         if($token['type'] === self::ENDTAG && !empty($token['attr'])) {
-            for ($i = 0; $i < count($token['attr']); $i++) {
+            for ($i = 0; $i < count($token['attr'] ?? []); $i++) {
                 $this->emitToken(array(
                     'type' => self::PARSEERROR,
                     'data' => 'attributes-in-end-tag'
Original file line number	Diff line number	Diff line change
`@@ -19,7 +19,7 @@ function ($no, $str) {`
`19`	`19`
`20`	`20`	`// Use HTML5 parser to parse the HTML fragment`
`21`	`21`	`try {`
`22`		`- $content = str_replace("\r\n", "\n", $content);`
	`22`	`+ $content = str_replace("\r\n", "\n", $content ?? '');`
`23`	`23`	`$parserPath = implode(`
`24`	`24`	`DIRECTORY_SEPARATOR,`
`25`	`25`	`[`
Original file line number	Diff line number	Diff line change
`@@ -6,5 +6,5 @@`
`6`	`6`	`} else {`
`7`	`7`	`$file = $argv[1];`
`8`	`8`	`}`
`9`		`-$result = HTML5_Parser::parse(file_get_contents($file));`
	`9`	`+$result = HTML5_Parser::parse(file_get_contents($file ?? ''));`
`10`	`10`	`// nop`
Original file line number	Diff line number	Diff line change
`@@ -63,7 +63,7 @@ public static function getRealCodepoint($ref) {`
`63`	`63`	`public static function getNamedCharacterReferences() {`
`64`	`64`	`if (!self::$namedCharacterReferences) {`
`65`	`65`	`self::$namedCharacterReferences = unserialize(`
`66`		`- file_get_contents(dirname(__FILE__) . '/named-character-references.ser'));`
	`66`	`+ file_get_contents(dirname(__FILE__) . '/named-character-references.ser') ?? '');`
`67`	`67`	`}`
`68`	`68`	`return self::$namedCharacterReferences;`
`69`	`69`	`}`
`@@ -103,10 +103,10 @@ public static function utf8chr($code) {`
`103`	`103`	`}`
`104`	`104`	`// set up the actual character`
`105`	`105`	`$ret = '';`
`106`		`- if($w) $ret .= chr($w);`
`107`		`- if($z) $ret .= chr($z);`
`108`		`- if($y) $ret .= chr($y);`
`109`		`- $ret .= chr($x);`
	`106`	`+ if($w) $ret .= chr($w ?? 0);`
	`107`	`+ if($z) $ret .= chr($z ?? 0);`
	`108`	`+ if($y) $ret .= chr($y ?? 0);`
	`109`	`+ $ret .= chr($x ?? 0);`
`110`	`110`
`111`	`111`	`return $ret;`
`112`	`112`	`}`