[ Index ]

PHP Cross Reference of DokuWiki

title

Body

[close]

/vendor/simplepie/simplepie/library/SimplePie/Decode/HTML/ -> Entities.php (source)

   1  <?php
   2  /**
   3   * SimplePie
   4   *
   5   * A PHP-Based RSS and Atom Feed Framework.
   6   * Takes the hard work out of managing a complete RSS/Atom solution.
   7   *
   8   * Copyright (c) 2004-2016, Ryan Parman, Geoffrey Sneddon, Ryan McCue, and contributors
   9   * All rights reserved.
  10   *
  11   * Redistribution and use in source and binary forms, with or without modification, are
  12   * permitted provided that the following conditions are met:
  13   *
  14   *     * Redistributions of source code must retain the above copyright notice, this list of
  15   *       conditions and the following disclaimer.
  16   *
  17   *     * Redistributions in binary form must reproduce the above copyright notice, this list
  18   *       of conditions and the following disclaimer in the documentation and/or other materials
  19   *       provided with the distribution.
  20   *
  21   *     * Neither the name of the SimplePie Team nor the names of its contributors may be used
  22   *       to endorse or promote products derived from this software without specific prior
  23   *       written permission.
  24   *
  25   * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND ANY EXPRESS
  26   * OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY
  27   * AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDERS
  28   * AND CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
  29   * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
  30   * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
  31   * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR
  32   * OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
  33   * POSSIBILITY OF SUCH DAMAGE.
  34   *
  35   * @package SimplePie
  36   * @copyright 2004-2016 Ryan Parman, Geoffrey Sneddon, Ryan McCue
  37   * @author Ryan Parman
  38   * @author Geoffrey Sneddon
  39   * @author Ryan McCue
  40   * @link http://simplepie.org/ SimplePie
  41   * @license http://www.opensource.org/licenses/bsd-license.php BSD License
  42   */
  43  
  44  
  45  /**
  46   * Decode HTML Entities
  47   *
  48   * This implements HTML5 as of revision 967 (2007-06-28)
  49   *
  50   * @deprecated Use DOMDocument instead!
  51   * @package SimplePie
  52   */
  53  class SimplePie_Decode_HTML_Entities
  54  {
  55      /**
  56       * Data to be parsed
  57       *
  58       * @access private
  59       * @var string
  60       */
  61      var $data = '';
  62  
  63      /**
  64       * Currently consumed bytes
  65       *
  66       * @access private
  67       * @var string
  68       */
  69      var $consumed = '';
  70  
  71      /**
  72       * Position of the current byte being parsed
  73       *
  74       * @access private
  75       * @var int
  76       */
  77      var $position = 0;
  78  
  79      /**
  80       * Create an instance of the class with the input data
  81       *
  82       * @access public
  83       * @param string $data Input data
  84       */
  85  	public function __construct($data)
  86      {
  87          $this->data = $data;
  88      }
  89  
  90      /**
  91       * Parse the input data
  92       *
  93       * @access public
  94       * @return string Output data
  95       */
  96  	public function parse()
  97      {
  98          while (($this->position = strpos($this->data, '&', $this->position)) !== false)
  99          {
 100              $this->consume();
 101              $this->entity();
 102              $this->consumed = '';
 103          }
 104          return $this->data;
 105      }
 106  
 107      /**
 108       * Consume the next byte
 109       *
 110       * @access private
 111       * @return mixed The next byte, or false, if there is no more data
 112       */
 113  	public function consume()
 114      {
 115          if (isset($this->data[$this->position]))
 116          {
 117              $this->consumed .= $this->data[$this->position];
 118              return $this->data[$this->position++];
 119          }
 120  
 121          return false;
 122      }
 123  
 124      /**
 125       * Consume a range of characters
 126       *
 127       * @access private
 128       * @param string $chars Characters to consume
 129       * @return mixed A series of characters that match the range, or false
 130       */
 131  	public function consume_range($chars)
 132      {
 133          if ($len = strspn($this->data, $chars, $this->position))
 134          {
 135              $data = substr($this->data, $this->position, $len);
 136              $this->consumed .= $data;
 137              $this->position += $len;
 138              return $data;
 139          }
 140  
 141          return false;
 142      }
 143  
 144      /**
 145       * Unconsume one byte
 146       *
 147       * @access private
 148       */
 149  	public function unconsume()
 150      {
 151          $this->consumed = substr($this->consumed, 0, -1);
 152          $this->position--;
 153      }
 154  
 155      /**
 156       * Decode an entity
 157       *
 158       * @access private
 159       */
 160  	public function entity()
 161      {
 162          switch ($this->consume())
 163          {
 164              case "\x09":
 165              case "\x0A":
 166              case "\x0B":
 167              case "\x0C":
 168              case "\x20":
 169              case "\x3C":
 170              case "\x26":
 171              case false:
 172                  break;
 173  
 174              case "\x23":
 175                  switch ($this->consume())
 176                  {
 177                      case "\x78":
 178                      case "\x58":
 179                          $range = '0123456789ABCDEFabcdef';
 180                          $hex = true;
 181                          break;
 182  
 183                      default:
 184                          $range = '0123456789';
 185                          $hex = false;
 186                          $this->unconsume();
 187                          break;
 188                  }
 189  
 190                  if ($codepoint = $this->consume_range($range))
 191                  {
 192                      static $windows_1252_specials = array(0x0D => "\x0A", 0x80 => "\xE2\x82\xAC", 0x81 => "\xEF\xBF\xBD", 0x82 => "\xE2\x80\x9A", 0x83 => "\xC6\x92", 0x84 => "\xE2\x80\x9E", 0x85 => "\xE2\x80\xA6", 0x86 => "\xE2\x80\xA0", 0x87 => "\xE2\x80\xA1", 0x88 => "\xCB\x86", 0x89 => "\xE2\x80\xB0", 0x8A => "\xC5\xA0", 0x8B => "\xE2\x80\xB9", 0x8C => "\xC5\x92", 0x8D => "\xEF\xBF\xBD", 0x8E => "\xC5\xBD", 0x8F => "\xEF\xBF\xBD", 0x90 => "\xEF\xBF\xBD", 0x91 => "\xE2\x80\x98", 0x92 => "\xE2\x80\x99", 0x93 => "\xE2\x80\x9C", 0x94 => "\xE2\x80\x9D", 0x95 => "\xE2\x80\xA2", 0x96 => "\xE2\x80\x93", 0x97 => "\xE2\x80\x94", 0x98 => "\xCB\x9C", 0x99 => "\xE2\x84\xA2", 0x9A => "\xC5\xA1", 0x9B => "\xE2\x80\xBA", 0x9C => "\xC5\x93", 0x9D => "\xEF\xBF\xBD", 0x9E => "\xC5\xBE", 0x9F => "\xC5\xB8");
 193  
 194                      if ($hex)
 195                      {
 196                          $codepoint = hexdec($codepoint);
 197                      }
 198                      else
 199                      {
 200                          $codepoint = intval($codepoint);
 201                      }
 202  
 203                      if (isset($windows_1252_specials[$codepoint]))
 204                      {
 205                          $replacement = $windows_1252_specials[$codepoint];
 206                      }
 207                      else
 208                      {
 209                          $replacement = SimplePie_Misc::codepoint_to_utf8($codepoint);
 210                      }
 211  
 212                      if (!in_array($this->consume(), array(';', false), true))
 213                      {
 214                          $this->unconsume();
 215                      }
 216  
 217                      $consumed_length = strlen($this->consumed);
 218                      $this->data = substr_replace($this->data, $replacement, $this->position - $consumed_length, $consumed_length);
 219                      $this->position += strlen($replacement) - $consumed_length;
 220                  }
 221                  break;
 222  
 223              default:
 224                  static $entities = array(
 225                      'Aacute' => "\xC3\x81",
 226                      'aacute' => "\xC3\xA1",
 227                      'Aacute;' => "\xC3\x81",
 228                      'aacute;' => "\xC3\xA1",
 229                      'Acirc' => "\xC3\x82",
 230                      'acirc' => "\xC3\xA2",
 231                      'Acirc;' => "\xC3\x82",
 232                      'acirc;' => "\xC3\xA2",
 233                      'acute' => "\xC2\xB4",
 234                      'acute;' => "\xC2\xB4",
 235                      'AElig' => "\xC3\x86",
 236                      'aelig' => "\xC3\xA6",
 237                      'AElig;' => "\xC3\x86",
 238                      'aelig;' => "\xC3\xA6",
 239                      'Agrave' => "\xC3\x80",
 240                      'agrave' => "\xC3\xA0",
 241                      'Agrave;' => "\xC3\x80",
 242                      'agrave;' => "\xC3\xA0",
 243                      'alefsym;' => "\xE2\x84\xB5",
 244                      'Alpha;' => "\xCE\x91",
 245                      'alpha;' => "\xCE\xB1",
 246                      'AMP' => "\x26",
 247                      'amp' => "\x26",
 248                      'AMP;' => "\x26",
 249                      'amp;' => "\x26",
 250                      'and;' => "\xE2\x88\xA7",
 251                      'ang;' => "\xE2\x88\xA0",
 252                      'apos;' => "\x27",
 253                      'Aring' => "\xC3\x85",
 254                      'aring' => "\xC3\xA5",
 255                      'Aring;' => "\xC3\x85",
 256                      'aring;' => "\xC3\xA5",
 257                      'asymp;' => "\xE2\x89\x88",
 258                      'Atilde' => "\xC3\x83",
 259                      'atilde' => "\xC3\xA3",
 260                      'Atilde;' => "\xC3\x83",
 261                      'atilde;' => "\xC3\xA3",
 262                      'Auml' => "\xC3\x84",
 263                      'auml' => "\xC3\xA4",
 264                      'Auml;' => "\xC3\x84",
 265                      'auml;' => "\xC3\xA4",
 266                      'bdquo;' => "\xE2\x80\x9E",
 267                      'Beta;' => "\xCE\x92",
 268                      'beta;' => "\xCE\xB2",
 269                      'brvbar' => "\xC2\xA6",
 270                      'brvbar;' => "\xC2\xA6",
 271                      'bull;' => "\xE2\x80\xA2",
 272                      'cap;' => "\xE2\x88\xA9",
 273                      'Ccedil' => "\xC3\x87",
 274                      'ccedil' => "\xC3\xA7",
 275                      'Ccedil;' => "\xC3\x87",
 276                      'ccedil;' => "\xC3\xA7",
 277                      'cedil' => "\xC2\xB8",
 278                      'cedil;' => "\xC2\xB8",
 279                      'cent' => "\xC2\xA2",
 280                      'cent;' => "\xC2\xA2",
 281                      'Chi;' => "\xCE\xA7",
 282                      'chi;' => "\xCF\x87",
 283                      'circ;' => "\xCB\x86",
 284                      'clubs;' => "\xE2\x99\xA3",
 285                      'cong;' => "\xE2\x89\x85",
 286                      'COPY' => "\xC2\xA9",
 287                      'copy' => "\xC2\xA9",
 288                      'COPY;' => "\xC2\xA9",
 289                      'copy;' => "\xC2\xA9",
 290                      'crarr;' => "\xE2\x86\xB5",
 291                      'cup;' => "\xE2\x88\xAA",
 292                      'curren' => "\xC2\xA4",
 293                      'curren;' => "\xC2\xA4",
 294                      'Dagger;' => "\xE2\x80\xA1",
 295                      'dagger;' => "\xE2\x80\xA0",
 296                      'dArr;' => "\xE2\x87\x93",
 297                      'darr;' => "\xE2\x86\x93",
 298                      'deg' => "\xC2\xB0",
 299                      'deg;' => "\xC2\xB0",
 300                      'Delta;' => "\xCE\x94",
 301                      'delta;' => "\xCE\xB4",
 302                      'diams;' => "\xE2\x99\xA6",
 303                      'divide' => "\xC3\xB7",
 304                      'divide;' => "\xC3\xB7",
 305                      'Eacute' => "\xC3\x89",
 306                      'eacute' => "\xC3\xA9",
 307                      'Eacute;' => "\xC3\x89",
 308                      'eacute;' => "\xC3\xA9",
 309                      'Ecirc' => "\xC3\x8A",
 310                      'ecirc' => "\xC3\xAA",
 311                      'Ecirc;' => "\xC3\x8A",
 312                      'ecirc;' => "\xC3\xAA",
 313                      'Egrave' => "\xC3\x88",
 314                      'egrave' => "\xC3\xA8",
 315                      'Egrave;' => "\xC3\x88",
 316                      'egrave;' => "\xC3\xA8",
 317                      'empty;' => "\xE2\x88\x85",
 318                      'emsp;' => "\xE2\x80\x83",
 319                      'ensp;' => "\xE2\x80\x82",
 320                      'Epsilon;' => "\xCE\x95",
 321                      'epsilon;' => "\xCE\xB5",
 322                      'equiv;' => "\xE2\x89\xA1",
 323                      'Eta;' => "\xCE\x97",
 324                      'eta;' => "\xCE\xB7",
 325                      'ETH' => "\xC3\x90",
 326                      'eth' => "\xC3\xB0",
 327                      'ETH;' => "\xC3\x90",
 328                      'eth;' => "\xC3\xB0",
 329                      'Euml' => "\xC3\x8B",
 330                      'euml' => "\xC3\xAB",
 331                      'Euml;' => "\xC3\x8B",
 332                      'euml;' => "\xC3\xAB",
 333                      'euro;' => "\xE2\x82\xAC",
 334                      'exist;' => "\xE2\x88\x83",
 335                      'fnof;' => "\xC6\x92",
 336                      'forall;' => "\xE2\x88\x80",
 337                      'frac12' => "\xC2\xBD",
 338                      'frac12;' => "\xC2\xBD",
 339                      'frac14' => "\xC2\xBC",
 340                      'frac14;' => "\xC2\xBC",
 341                      'frac34' => "\xC2\xBE",
 342                      'frac34;' => "\xC2\xBE",
 343                      'frasl;' => "\xE2\x81\x84",
 344                      'Gamma;' => "\xCE\x93",
 345                      'gamma;' => "\xCE\xB3",
 346                      'ge;' => "\xE2\x89\xA5",
 347                      'GT' => "\x3E",
 348                      'gt' => "\x3E",
 349                      'GT;' => "\x3E",
 350                      'gt;' => "\x3E",
 351                      'hArr;' => "\xE2\x87\x94",
 352                      'harr;' => "\xE2\x86\x94",
 353                      'hearts;' => "\xE2\x99\xA5",
 354                      'hellip;' => "\xE2\x80\xA6",
 355                      'Iacute' => "\xC3\x8D",
 356                      'iacute' => "\xC3\xAD",
 357                      'Iacute;' => "\xC3\x8D",
 358                      'iacute;' => "\xC3\xAD",
 359                      'Icirc' => "\xC3\x8E",
 360                      'icirc' => "\xC3\xAE",
 361                      'Icirc;' => "\xC3\x8E",
 362                      'icirc;' => "\xC3\xAE",
 363                      'iexcl' => "\xC2\xA1",
 364                      'iexcl;' => "\xC2\xA1",
 365                      'Igrave' => "\xC3\x8C",
 366                      'igrave' => "\xC3\xAC",
 367                      'Igrave;' => "\xC3\x8C",
 368                      'igrave;' => "\xC3\xAC",
 369                      'image;' => "\xE2\x84\x91",
 370                      'infin;' => "\xE2\x88\x9E",
 371                      'int;' => "\xE2\x88\xAB",
 372                      'Iota;' => "\xCE\x99",
 373                      'iota;' => "\xCE\xB9",
 374                      'iquest' => "\xC2\xBF",
 375                      'iquest;' => "\xC2\xBF",
 376                      'isin;' => "\xE2\x88\x88",
 377                      'Iuml' => "\xC3\x8F",
 378                      'iuml' => "\xC3\xAF",
 379                      'Iuml;' => "\xC3\x8F",
 380                      'iuml;' => "\xC3\xAF",
 381                      'Kappa;' => "\xCE\x9A",
 382                      'kappa;' => "\xCE\xBA",
 383                      'Lambda;' => "\xCE\x9B",
 384                      'lambda;' => "\xCE\xBB",
 385                      'lang;' => "\xE3\x80\x88",
 386                      'laquo' => "\xC2\xAB",
 387                      'laquo;' => "\xC2\xAB",
 388                      'lArr;' => "\xE2\x87\x90",
 389                      'larr;' => "\xE2\x86\x90",
 390                      'lceil;' => "\xE2\x8C\x88",
 391                      'ldquo;' => "\xE2\x80\x9C",
 392                      'le;' => "\xE2\x89\xA4",
 393                      'lfloor;' => "\xE2\x8C\x8A",
 394                      'lowast;' => "\xE2\x88\x97",
 395                      'loz;' => "\xE2\x97\x8A",
 396                      'lrm;' => "\xE2\x80\x8E",
 397                      'lsaquo;' => "\xE2\x80\xB9",
 398                      'lsquo;' => "\xE2\x80\x98",
 399                      'LT' => "\x3C",
 400                      'lt' => "\x3C",
 401                      'LT;' => "\x3C",
 402                      'lt;' => "\x3C",
 403                      'macr' => "\xC2\xAF",
 404                      'macr;' => "\xC2\xAF",
 405                      'mdash;' => "\xE2\x80\x94",
 406                      'micro' => "\xC2\xB5",
 407                      'micro;' => "\xC2\xB5",
 408                      'middot' => "\xC2\xB7",
 409                      'middot;' => "\xC2\xB7",
 410                      'minus;' => "\xE2\x88\x92",
 411                      'Mu;' => "\xCE\x9C",
 412                      'mu;' => "\xCE\xBC",
 413                      'nabla;' => "\xE2\x88\x87",
 414                      'nbsp' => "\xC2\xA0",
 415                      'nbsp;' => "\xC2\xA0",
 416                      'ndash;' => "\xE2\x80\x93",
 417                      'ne;' => "\xE2\x89\xA0",
 418                      'ni;' => "\xE2\x88\x8B",
 419                      'not' => "\xC2\xAC",
 420                      'not;' => "\xC2\xAC",
 421                      'notin;' => "\xE2\x88\x89",
 422                      'nsub;' => "\xE2\x8A\x84",
 423                      'Ntilde' => "\xC3\x91",
 424                      'ntilde' => "\xC3\xB1",
 425                      'Ntilde;' => "\xC3\x91",
 426                      'ntilde;' => "\xC3\xB1",
 427                      'Nu;' => "\xCE\x9D",
 428                      'nu;' => "\xCE\xBD",
 429                      'Oacute' => "\xC3\x93",
 430                      'oacute' => "\xC3\xB3",
 431                      'Oacute;' => "\xC3\x93",
 432                      'oacute;' => "\xC3\xB3",
 433                      'Ocirc' => "\xC3\x94",
 434                      'ocirc' => "\xC3\xB4",
 435                      'Ocirc;' => "\xC3\x94",
 436                      'ocirc;' => "\xC3\xB4",
 437                      'OElig;' => "\xC5\x92",
 438                      'oelig;' => "\xC5\x93",
 439                      'Ograve' => "\xC3\x92",
 440                      'ograve' => "\xC3\xB2",
 441                      'Ograve;' => "\xC3\x92",
 442                      'ograve;' => "\xC3\xB2",
 443                      'oline;' => "\xE2\x80\xBE",
 444                      'Omega;' => "\xCE\xA9",
 445                      'omega;' => "\xCF\x89",
 446                      'Omicron;' => "\xCE\x9F",
 447                      'omicron;' => "\xCE\xBF",
 448                      'oplus;' => "\xE2\x8A\x95",
 449                      'or;' => "\xE2\x88\xA8",
 450                      'ordf' => "\xC2\xAA",
 451                      'ordf;' => "\xC2\xAA",
 452                      'ordm' => "\xC2\xBA",
 453                      'ordm;' => "\xC2\xBA",
 454                      'Oslash' => "\xC3\x98",
 455                      'oslash' => "\xC3\xB8",
 456                      'Oslash;' => "\xC3\x98",
 457                      'oslash;' => "\xC3\xB8",
 458                      'Otilde' => "\xC3\x95",
 459                      'otilde' => "\xC3\xB5",
 460                      'Otilde;' => "\xC3\x95",
 461                      'otilde;' => "\xC3\xB5",
 462                      'otimes;' => "\xE2\x8A\x97",
 463                      'Ouml' => "\xC3\x96",
 464                      'ouml' => "\xC3\xB6",
 465                      'Ouml;' => "\xC3\x96",
 466                      'ouml;' => "\xC3\xB6",
 467                      'para' => "\xC2\xB6",
 468                      'para;' => "\xC2\xB6",
 469                      'part;' => "\xE2\x88\x82",
 470                      'permil;' => "\xE2\x80\xB0",
 471                      'perp;' => "\xE2\x8A\xA5",
 472                      'Phi;' => "\xCE\xA6",
 473                      'phi;' => "\xCF\x86",
 474                      'Pi;' => "\xCE\xA0",
 475                      'pi;' => "\xCF\x80",
 476                      'piv;' => "\xCF\x96",
 477                      'plusmn' => "\xC2\xB1",
 478                      'plusmn;' => "\xC2\xB1",
 479                      'pound' => "\xC2\xA3",
 480                      'pound;' => "\xC2\xA3",
 481                      'Prime;' => "\xE2\x80\xB3",
 482                      'prime;' => "\xE2\x80\xB2",
 483                      'prod;' => "\xE2\x88\x8F",
 484                      'prop;' => "\xE2\x88\x9D",
 485                      'Psi;' => "\xCE\xA8",
 486                      'psi;' => "\xCF\x88",
 487                      'QUOT' => "\x22",
 488                      'quot' => "\x22",
 489                      'QUOT;' => "\x22",
 490                      'quot;' => "\x22",
 491                      'radic;' => "\xE2\x88\x9A",
 492                      'rang;' => "\xE3\x80\x89",
 493                      'raquo' => "\xC2\xBB",
 494                      'raquo;' => "\xC2\xBB",
 495                      'rArr;' => "\xE2\x87\x92",
 496                      'rarr;' => "\xE2\x86\x92",
 497                      'rceil;' => "\xE2\x8C\x89",
 498                      'rdquo;' => "\xE2\x80\x9D",
 499                      'real;' => "\xE2\x84\x9C",
 500                      'REG' => "\xC2\xAE",
 501                      'reg' => "\xC2\xAE",
 502                      'REG;' => "\xC2\xAE",
 503                      'reg;' => "\xC2\xAE",
 504                      'rfloor;' => "\xE2\x8C\x8B",
 505                      'Rho;' => "\xCE\xA1",
 506                      'rho;' => "\xCF\x81",
 507                      'rlm;' => "\xE2\x80\x8F",
 508                      'rsaquo;' => "\xE2\x80\xBA",
 509                      'rsquo;' => "\xE2\x80\x99",
 510                      'sbquo;' => "\xE2\x80\x9A",
 511                      'Scaron;' => "\xC5\xA0",
 512                      'scaron;' => "\xC5\xA1",
 513                      'sdot;' => "\xE2\x8B\x85",
 514                      'sect' => "\xC2\xA7",
 515                      'sect;' => "\xC2\xA7",
 516                      'shy' => "\xC2\xAD",
 517                      'shy;' => "\xC2\xAD",
 518                      'Sigma;' => "\xCE\xA3",
 519                      'sigma;' => "\xCF\x83",
 520                      'sigmaf;' => "\xCF\x82",
 521                      'sim;' => "\xE2\x88\xBC",
 522                      'spades;' => "\xE2\x99\xA0",
 523                      'sub;' => "\xE2\x8A\x82",
 524                      'sube;' => "\xE2\x8A\x86",
 525                      'sum;' => "\xE2\x88\x91",
 526                      'sup;' => "\xE2\x8A\x83",
 527                      'sup1' => "\xC2\xB9",
 528                      'sup1;' => "\xC2\xB9",
 529                      'sup2' => "\xC2\xB2",
 530                      'sup2;' => "\xC2\xB2",
 531                      'sup3' => "\xC2\xB3",
 532                      'sup3;' => "\xC2\xB3",
 533                      'supe;' => "\xE2\x8A\x87",
 534                      'szlig' => "\xC3\x9F",
 535                      'szlig;' => "\xC3\x9F",
 536                      'Tau;' => "\xCE\xA4",
 537                      'tau;' => "\xCF\x84",
 538                      'there4;' => "\xE2\x88\xB4",
 539                      'Theta;' => "\xCE\x98",
 540                      'theta;' => "\xCE\xB8",
 541                      'thetasym;' => "\xCF\x91",
 542                      'thinsp;' => "\xE2\x80\x89",
 543                      'THORN' => "\xC3\x9E",
 544                      'thorn' => "\xC3\xBE",
 545                      'THORN;' => "\xC3\x9E",
 546                      'thorn;' => "\xC3\xBE",
 547                      'tilde;' => "\xCB\x9C",
 548                      'times' => "\xC3\x97",
 549                      'times;' => "\xC3\x97",
 550                      'TRADE;' => "\xE2\x84\xA2",
 551                      'trade;' => "\xE2\x84\xA2",
 552                      'Uacute' => "\xC3\x9A",
 553                      'uacute' => "\xC3\xBA",
 554                      'Uacute;' => "\xC3\x9A",
 555                      'uacute;' => "\xC3\xBA",
 556                      'uArr;' => "\xE2\x87\x91",
 557                      'uarr;' => "\xE2\x86\x91",
 558                      'Ucirc' => "\xC3\x9B",
 559                      'ucirc' => "\xC3\xBB",
 560                      'Ucirc;' => "\xC3\x9B",
 561                      'ucirc;' => "\xC3\xBB",
 562                      'Ugrave' => "\xC3\x99",
 563                      'ugrave' => "\xC3\xB9",
 564                      'Ugrave;' => "\xC3\x99",
 565                      'ugrave;' => "\xC3\xB9",
 566                      'uml' => "\xC2\xA8",
 567                      'uml;' => "\xC2\xA8",
 568                      'upsih;' => "\xCF\x92",
 569                      'Upsilon;' => "\xCE\xA5",
 570                      'upsilon;' => "\xCF\x85",
 571                      'Uuml' => "\xC3\x9C",
 572                      'uuml' => "\xC3\xBC",
 573                      'Uuml;' => "\xC3\x9C",
 574                      'uuml;' => "\xC3\xBC",
 575                      'weierp;' => "\xE2\x84\x98",
 576                      'Xi;' => "\xCE\x9E",
 577                      'xi;' => "\xCE\xBE",
 578                      'Yacute' => "\xC3\x9D",
 579                      'yacute' => "\xC3\xBD",
 580                      'Yacute;' => "\xC3\x9D",
 581                      'yacute;' => "\xC3\xBD",
 582                      'yen' => "\xC2\xA5",
 583                      'yen;' => "\xC2\xA5",
 584                      'yuml' => "\xC3\xBF",
 585                      'Yuml;' => "\xC5\xB8",
 586                      'yuml;' => "\xC3\xBF",
 587                      'Zeta;' => "\xCE\x96",
 588                      'zeta;' => "\xCE\xB6",
 589                      'zwj;' => "\xE2\x80\x8D",
 590                      'zwnj;' => "\xE2\x80\x8C"
 591                  );
 592  
 593                  for ($i = 0, $match = null; $i < 9 && $this->consume() !== false; $i++)
 594                  {
 595                      $consumed = substr($this->consumed, 1);
 596                      if (isset($entities[$consumed]))
 597                      {
 598                          $match = $consumed;
 599                      }
 600                  }
 601  
 602                  if ($match !== null)
 603                  {
 604                       $this->data = substr_replace($this->data, $entities[$match], $this->position - strlen($consumed) - 1, strlen($match) + 1);
 605                      $this->position += strlen($entities[$match]) - strlen($consumed) - 1;
 606                  }
 607                  break;
 608          }
 609      }
 610  }