web/wp-includes/SimplePie/Decode/HTML/Entities.php
changeset 204 09a1c134465b
equal deleted inserted replaced
203:f507feede89a 204:09a1c134465b
       
     1 <?php
       
     2 /**
       
     3  * SimplePie
       
     4  *
       
     5  * A PHP-Based RSS and Atom Feed Framework.
       
     6  * Takes the hard work out of managing a complete RSS/Atom solution.
       
     7  *
       
     8  * Copyright (c) 2004-2012, Ryan Parman, Geoffrey Sneddon, Ryan McCue, and contributors
       
     9  * All rights reserved.
       
    10  *
       
    11  * Redistribution and use in source and binary forms, with or without modification, are
       
    12  * permitted provided that the following conditions are met:
       
    13  *
       
    14  * 	* Redistributions of source code must retain the above copyright notice, this list of
       
    15  * 	  conditions and the following disclaimer.
       
    16  *
       
    17  * 	* Redistributions in binary form must reproduce the above copyright notice, this list
       
    18  * 	  of conditions and the following disclaimer in the documentation and/or other materials
       
    19  * 	  provided with the distribution.
       
    20  *
       
    21  * 	* Neither the name of the SimplePie Team nor the names of its contributors may be used
       
    22  * 	  to endorse or promote products derived from this software without specific prior
       
    23  * 	  written permission.
       
    24  *
       
    25  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND ANY EXPRESS
       
    26  * OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY
       
    27  * AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDERS
       
    28  * AND CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
       
    29  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
       
    30  * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
       
    31  * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR
       
    32  * OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
       
    33  * POSSIBILITY OF SUCH DAMAGE.
       
    34  *
       
    35  * @package SimplePie
       
    36  * @version 1.3.1
       
    37  * @copyright 2004-2012 Ryan Parman, Geoffrey Sneddon, Ryan McCue
       
    38  * @author Ryan Parman
       
    39  * @author Geoffrey Sneddon
       
    40  * @author Ryan McCue
       
    41  * @link http://simplepie.org/ SimplePie
       
    42  * @license http://www.opensource.org/licenses/bsd-license.php BSD License
       
    43  */
       
    44 
       
    45 
       
    46 /**
       
    47  * Decode HTML Entities
       
    48  *
       
    49  * This implements HTML5 as of revision 967 (2007-06-28)
       
    50  *
       
    51  * @deprecated Use DOMDocument instead!
       
    52  * @package SimplePie
       
    53  */
       
    54 class SimplePie_Decode_HTML_Entities
       
    55 {
       
    56 	/**
       
    57 	 * Data to be parsed
       
    58 	 *
       
    59 	 * @access private
       
    60 	 * @var string
       
    61 	 */
       
    62 	var $data = '';
       
    63 
       
    64 	/**
       
    65 	 * Currently consumed bytes
       
    66 	 *
       
    67 	 * @access private
       
    68 	 * @var string
       
    69 	 */
       
    70 	var $consumed = '';
       
    71 
       
    72 	/**
       
    73 	 * Position of the current byte being parsed
       
    74 	 *
       
    75 	 * @access private
       
    76 	 * @var int
       
    77 	 */
       
    78 	var $position = 0;
       
    79 
       
    80 	/**
       
    81 	 * Create an instance of the class with the input data
       
    82 	 *
       
    83 	 * @access public
       
    84 	 * @param string $data Input data
       
    85 	 */
       
    86 	public function __construct($data)
       
    87 	{
       
    88 		$this->data = $data;
       
    89 	}
       
    90 
       
    91 	/**
       
    92 	 * Parse the input data
       
    93 	 *
       
    94 	 * @access public
       
    95 	 * @return string Output data
       
    96 	 */
       
    97 	public function parse()
       
    98 	{
       
    99 		while (($this->position = strpos($this->data, '&', $this->position)) !== false)
       
   100 		{
       
   101 			$this->consume();
       
   102 			$this->entity();
       
   103 			$this->consumed = '';
       
   104 		}
       
   105 		return $this->data;
       
   106 	}
       
   107 
       
   108 	/**
       
   109 	 * Consume the next byte
       
   110 	 *
       
   111 	 * @access private
       
   112 	 * @return mixed The next byte, or false, if there is no more data
       
   113 	 */
       
   114 	public function consume()
       
   115 	{
       
   116 		if (isset($this->data[$this->position]))
       
   117 		{
       
   118 			$this->consumed .= $this->data[$this->position];
       
   119 			return $this->data[$this->position++];
       
   120 		}
       
   121 		else
       
   122 		{
       
   123 			return false;
       
   124 		}
       
   125 	}
       
   126 
       
   127 	/**
       
   128 	 * Consume a range of characters
       
   129 	 *
       
   130 	 * @access private
       
   131 	 * @param string $chars Characters to consume
       
   132 	 * @return mixed A series of characters that match the range, or false
       
   133 	 */
       
   134 	public function consume_range($chars)
       
   135 	{
       
   136 		if ($len = strspn($this->data, $chars, $this->position))
       
   137 		{
       
   138 			$data = substr($this->data, $this->position, $len);
       
   139 			$this->consumed .= $data;
       
   140 			$this->position += $len;
       
   141 			return $data;
       
   142 		}
       
   143 		else
       
   144 		{
       
   145 			return false;
       
   146 		}
       
   147 	}
       
   148 
       
   149 	/**
       
   150 	 * Unconsume one byte
       
   151 	 *
       
   152 	 * @access private
       
   153 	 */
       
   154 	public function unconsume()
       
   155 	{
       
   156 		$this->consumed = substr($this->consumed, 0, -1);
       
   157 		$this->position--;
       
   158 	}
       
   159 
       
   160 	/**
       
   161 	 * Decode an entity
       
   162 	 *
       
   163 	 * @access private
       
   164 	 */
       
   165 	public function entity()
       
   166 	{
       
   167 		switch ($this->consume())
       
   168 		{
       
   169 			case "\x09":
       
   170 			case "\x0A":
       
   171 			case "\x0B":
       
   172 			case "\x0B":
       
   173 			case "\x0C":
       
   174 			case "\x20":
       
   175 			case "\x3C":
       
   176 			case "\x26":
       
   177 			case false:
       
   178 				break;
       
   179 
       
   180 			case "\x23":
       
   181 				switch ($this->consume())
       
   182 				{
       
   183 					case "\x78":
       
   184 					case "\x58":
       
   185 						$range = '0123456789ABCDEFabcdef';
       
   186 						$hex = true;
       
   187 						break;
       
   188 
       
   189 					default:
       
   190 						$range = '0123456789';
       
   191 						$hex = false;
       
   192 						$this->unconsume();
       
   193 						break;
       
   194 				}
       
   195 
       
   196 				if ($codepoint = $this->consume_range($range))
       
   197 				{
       
   198 					static $windows_1252_specials = array(0x0D => "\x0A", 0x80 => "\xE2\x82\xAC", 0x81 => "\xEF\xBF\xBD", 0x82 => "\xE2\x80\x9A", 0x83 => "\xC6\x92", 0x84 => "\xE2\x80\x9E", 0x85 => "\xE2\x80\xA6", 0x86 => "\xE2\x80\xA0", 0x87 => "\xE2\x80\xA1", 0x88 => "\xCB\x86", 0x89 => "\xE2\x80\xB0", 0x8A => "\xC5\xA0", 0x8B => "\xE2\x80\xB9", 0x8C => "\xC5\x92", 0x8D => "\xEF\xBF\xBD", 0x8E => "\xC5\xBD", 0x8F => "\xEF\xBF\xBD", 0x90 => "\xEF\xBF\xBD", 0x91 => "\xE2\x80\x98", 0x92 => "\xE2\x80\x99", 0x93 => "\xE2\x80\x9C", 0x94 => "\xE2\x80\x9D", 0x95 => "\xE2\x80\xA2", 0x96 => "\xE2\x80\x93", 0x97 => "\xE2\x80\x94", 0x98 => "\xCB\x9C", 0x99 => "\xE2\x84\xA2", 0x9A => "\xC5\xA1", 0x9B => "\xE2\x80\xBA", 0x9C => "\xC5\x93", 0x9D => "\xEF\xBF\xBD", 0x9E => "\xC5\xBE", 0x9F => "\xC5\xB8");
       
   199 
       
   200 					if ($hex)
       
   201 					{
       
   202 						$codepoint = hexdec($codepoint);
       
   203 					}
       
   204 					else
       
   205 					{
       
   206 						$codepoint = intval($codepoint);
       
   207 					}
       
   208 
       
   209 					if (isset($windows_1252_specials[$codepoint]))
       
   210 					{
       
   211 						$replacement = $windows_1252_specials[$codepoint];
       
   212 					}
       
   213 					else
       
   214 					{
       
   215 						$replacement = SimplePie_Misc::codepoint_to_utf8($codepoint);
       
   216 					}
       
   217 
       
   218 					if (!in_array($this->consume(), array(';', false), true))
       
   219 					{
       
   220 						$this->unconsume();
       
   221 					}
       
   222 
       
   223 					$consumed_length = strlen($this->consumed);
       
   224 					$this->data = substr_replace($this->data, $replacement, $this->position - $consumed_length, $consumed_length);
       
   225 					$this->position += strlen($replacement) - $consumed_length;
       
   226 				}
       
   227 				break;
       
   228 
       
   229 			default:
       
   230 				static $entities = array(
       
   231 					'Aacute' => "\xC3\x81",
       
   232 					'aacute' => "\xC3\xA1",
       
   233 					'Aacute;' => "\xC3\x81",
       
   234 					'aacute;' => "\xC3\xA1",
       
   235 					'Acirc' => "\xC3\x82",
       
   236 					'acirc' => "\xC3\xA2",
       
   237 					'Acirc;' => "\xC3\x82",
       
   238 					'acirc;' => "\xC3\xA2",
       
   239 					'acute' => "\xC2\xB4",
       
   240 					'acute;' => "\xC2\xB4",
       
   241 					'AElig' => "\xC3\x86",
       
   242 					'aelig' => "\xC3\xA6",
       
   243 					'AElig;' => "\xC3\x86",
       
   244 					'aelig;' => "\xC3\xA6",
       
   245 					'Agrave' => "\xC3\x80",
       
   246 					'agrave' => "\xC3\xA0",
       
   247 					'Agrave;' => "\xC3\x80",
       
   248 					'agrave;' => "\xC3\xA0",
       
   249 					'alefsym;' => "\xE2\x84\xB5",
       
   250 					'Alpha;' => "\xCE\x91",
       
   251 					'alpha;' => "\xCE\xB1",
       
   252 					'AMP' => "\x26",
       
   253 					'amp' => "\x26",
       
   254 					'AMP;' => "\x26",
       
   255 					'amp;' => "\x26",
       
   256 					'and;' => "\xE2\x88\xA7",
       
   257 					'ang;' => "\xE2\x88\xA0",
       
   258 					'apos;' => "\x27",
       
   259 					'Aring' => "\xC3\x85",
       
   260 					'aring' => "\xC3\xA5",
       
   261 					'Aring;' => "\xC3\x85",
       
   262 					'aring;' => "\xC3\xA5",
       
   263 					'asymp;' => "\xE2\x89\x88",
       
   264 					'Atilde' => "\xC3\x83",
       
   265 					'atilde' => "\xC3\xA3",
       
   266 					'Atilde;' => "\xC3\x83",
       
   267 					'atilde;' => "\xC3\xA3",
       
   268 					'Auml' => "\xC3\x84",
       
   269 					'auml' => "\xC3\xA4",
       
   270 					'Auml;' => "\xC3\x84",
       
   271 					'auml;' => "\xC3\xA4",
       
   272 					'bdquo;' => "\xE2\x80\x9E",
       
   273 					'Beta;' => "\xCE\x92",
       
   274 					'beta;' => "\xCE\xB2",
       
   275 					'brvbar' => "\xC2\xA6",
       
   276 					'brvbar;' => "\xC2\xA6",
       
   277 					'bull;' => "\xE2\x80\xA2",
       
   278 					'cap;' => "\xE2\x88\xA9",
       
   279 					'Ccedil' => "\xC3\x87",
       
   280 					'ccedil' => "\xC3\xA7",
       
   281 					'Ccedil;' => "\xC3\x87",
       
   282 					'ccedil;' => "\xC3\xA7",
       
   283 					'cedil' => "\xC2\xB8",
       
   284 					'cedil;' => "\xC2\xB8",
       
   285 					'cent' => "\xC2\xA2",
       
   286 					'cent;' => "\xC2\xA2",
       
   287 					'Chi;' => "\xCE\xA7",
       
   288 					'chi;' => "\xCF\x87",
       
   289 					'circ;' => "\xCB\x86",
       
   290 					'clubs;' => "\xE2\x99\xA3",
       
   291 					'cong;' => "\xE2\x89\x85",
       
   292 					'COPY' => "\xC2\xA9",
       
   293 					'copy' => "\xC2\xA9",
       
   294 					'COPY;' => "\xC2\xA9",
       
   295 					'copy;' => "\xC2\xA9",
       
   296 					'crarr;' => "\xE2\x86\xB5",
       
   297 					'cup;' => "\xE2\x88\xAA",
       
   298 					'curren' => "\xC2\xA4",
       
   299 					'curren;' => "\xC2\xA4",
       
   300 					'Dagger;' => "\xE2\x80\xA1",
       
   301 					'dagger;' => "\xE2\x80\xA0",
       
   302 					'dArr;' => "\xE2\x87\x93",
       
   303 					'darr;' => "\xE2\x86\x93",
       
   304 					'deg' => "\xC2\xB0",
       
   305 					'deg;' => "\xC2\xB0",
       
   306 					'Delta;' => "\xCE\x94",
       
   307 					'delta;' => "\xCE\xB4",
       
   308 					'diams;' => "\xE2\x99\xA6",
       
   309 					'divide' => "\xC3\xB7",
       
   310 					'divide;' => "\xC3\xB7",
       
   311 					'Eacute' => "\xC3\x89",
       
   312 					'eacute' => "\xC3\xA9",
       
   313 					'Eacute;' => "\xC3\x89",
       
   314 					'eacute;' => "\xC3\xA9",
       
   315 					'Ecirc' => "\xC3\x8A",
       
   316 					'ecirc' => "\xC3\xAA",
       
   317 					'Ecirc;' => "\xC3\x8A",
       
   318 					'ecirc;' => "\xC3\xAA",
       
   319 					'Egrave' => "\xC3\x88",
       
   320 					'egrave' => "\xC3\xA8",
       
   321 					'Egrave;' => "\xC3\x88",
       
   322 					'egrave;' => "\xC3\xA8",
       
   323 					'empty;' => "\xE2\x88\x85",
       
   324 					'emsp;' => "\xE2\x80\x83",
       
   325 					'ensp;' => "\xE2\x80\x82",
       
   326 					'Epsilon;' => "\xCE\x95",
       
   327 					'epsilon;' => "\xCE\xB5",
       
   328 					'equiv;' => "\xE2\x89\xA1",
       
   329 					'Eta;' => "\xCE\x97",
       
   330 					'eta;' => "\xCE\xB7",
       
   331 					'ETH' => "\xC3\x90",
       
   332 					'eth' => "\xC3\xB0",
       
   333 					'ETH;' => "\xC3\x90",
       
   334 					'eth;' => "\xC3\xB0",
       
   335 					'Euml' => "\xC3\x8B",
       
   336 					'euml' => "\xC3\xAB",
       
   337 					'Euml;' => "\xC3\x8B",
       
   338 					'euml;' => "\xC3\xAB",
       
   339 					'euro;' => "\xE2\x82\xAC",
       
   340 					'exist;' => "\xE2\x88\x83",
       
   341 					'fnof;' => "\xC6\x92",
       
   342 					'forall;' => "\xE2\x88\x80",
       
   343 					'frac12' => "\xC2\xBD",
       
   344 					'frac12;' => "\xC2\xBD",
       
   345 					'frac14' => "\xC2\xBC",
       
   346 					'frac14;' => "\xC2\xBC",
       
   347 					'frac34' => "\xC2\xBE",
       
   348 					'frac34;' => "\xC2\xBE",
       
   349 					'frasl;' => "\xE2\x81\x84",
       
   350 					'Gamma;' => "\xCE\x93",
       
   351 					'gamma;' => "\xCE\xB3",
       
   352 					'ge;' => "\xE2\x89\xA5",
       
   353 					'GT' => "\x3E",
       
   354 					'gt' => "\x3E",
       
   355 					'GT;' => "\x3E",
       
   356 					'gt;' => "\x3E",
       
   357 					'hArr;' => "\xE2\x87\x94",
       
   358 					'harr;' => "\xE2\x86\x94",
       
   359 					'hearts;' => "\xE2\x99\xA5",
       
   360 					'hellip;' => "\xE2\x80\xA6",
       
   361 					'Iacute' => "\xC3\x8D",
       
   362 					'iacute' => "\xC3\xAD",
       
   363 					'Iacute;' => "\xC3\x8D",
       
   364 					'iacute;' => "\xC3\xAD",
       
   365 					'Icirc' => "\xC3\x8E",
       
   366 					'icirc' => "\xC3\xAE",
       
   367 					'Icirc;' => "\xC3\x8E",
       
   368 					'icirc;' => "\xC3\xAE",
       
   369 					'iexcl' => "\xC2\xA1",
       
   370 					'iexcl;' => "\xC2\xA1",
       
   371 					'Igrave' => "\xC3\x8C",
       
   372 					'igrave' => "\xC3\xAC",
       
   373 					'Igrave;' => "\xC3\x8C",
       
   374 					'igrave;' => "\xC3\xAC",
       
   375 					'image;' => "\xE2\x84\x91",
       
   376 					'infin;' => "\xE2\x88\x9E",
       
   377 					'int;' => "\xE2\x88\xAB",
       
   378 					'Iota;' => "\xCE\x99",
       
   379 					'iota;' => "\xCE\xB9",
       
   380 					'iquest' => "\xC2\xBF",
       
   381 					'iquest;' => "\xC2\xBF",
       
   382 					'isin;' => "\xE2\x88\x88",
       
   383 					'Iuml' => "\xC3\x8F",
       
   384 					'iuml' => "\xC3\xAF",
       
   385 					'Iuml;' => "\xC3\x8F",
       
   386 					'iuml;' => "\xC3\xAF",
       
   387 					'Kappa;' => "\xCE\x9A",
       
   388 					'kappa;' => "\xCE\xBA",
       
   389 					'Lambda;' => "\xCE\x9B",
       
   390 					'lambda;' => "\xCE\xBB",
       
   391 					'lang;' => "\xE3\x80\x88",
       
   392 					'laquo' => "\xC2\xAB",
       
   393 					'laquo;' => "\xC2\xAB",
       
   394 					'lArr;' => "\xE2\x87\x90",
       
   395 					'larr;' => "\xE2\x86\x90",
       
   396 					'lceil;' => "\xE2\x8C\x88",
       
   397 					'ldquo;' => "\xE2\x80\x9C",
       
   398 					'le;' => "\xE2\x89\xA4",
       
   399 					'lfloor;' => "\xE2\x8C\x8A",
       
   400 					'lowast;' => "\xE2\x88\x97",
       
   401 					'loz;' => "\xE2\x97\x8A",
       
   402 					'lrm;' => "\xE2\x80\x8E",
       
   403 					'lsaquo;' => "\xE2\x80\xB9",
       
   404 					'lsquo;' => "\xE2\x80\x98",
       
   405 					'LT' => "\x3C",
       
   406 					'lt' => "\x3C",
       
   407 					'LT;' => "\x3C",
       
   408 					'lt;' => "\x3C",
       
   409 					'macr' => "\xC2\xAF",
       
   410 					'macr;' => "\xC2\xAF",
       
   411 					'mdash;' => "\xE2\x80\x94",
       
   412 					'micro' => "\xC2\xB5",
       
   413 					'micro;' => "\xC2\xB5",
       
   414 					'middot' => "\xC2\xB7",
       
   415 					'middot;' => "\xC2\xB7",
       
   416 					'minus;' => "\xE2\x88\x92",
       
   417 					'Mu;' => "\xCE\x9C",
       
   418 					'mu;' => "\xCE\xBC",
       
   419 					'nabla;' => "\xE2\x88\x87",
       
   420 					'nbsp' => "\xC2\xA0",
       
   421 					'nbsp;' => "\xC2\xA0",
       
   422 					'ndash;' => "\xE2\x80\x93",
       
   423 					'ne;' => "\xE2\x89\xA0",
       
   424 					'ni;' => "\xE2\x88\x8B",
       
   425 					'not' => "\xC2\xAC",
       
   426 					'not;' => "\xC2\xAC",
       
   427 					'notin;' => "\xE2\x88\x89",
       
   428 					'nsub;' => "\xE2\x8A\x84",
       
   429 					'Ntilde' => "\xC3\x91",
       
   430 					'ntilde' => "\xC3\xB1",
       
   431 					'Ntilde;' => "\xC3\x91",
       
   432 					'ntilde;' => "\xC3\xB1",
       
   433 					'Nu;' => "\xCE\x9D",
       
   434 					'nu;' => "\xCE\xBD",
       
   435 					'Oacute' => "\xC3\x93",
       
   436 					'oacute' => "\xC3\xB3",
       
   437 					'Oacute;' => "\xC3\x93",
       
   438 					'oacute;' => "\xC3\xB3",
       
   439 					'Ocirc' => "\xC3\x94",
       
   440 					'ocirc' => "\xC3\xB4",
       
   441 					'Ocirc;' => "\xC3\x94",
       
   442 					'ocirc;' => "\xC3\xB4",
       
   443 					'OElig;' => "\xC5\x92",
       
   444 					'oelig;' => "\xC5\x93",
       
   445 					'Ograve' => "\xC3\x92",
       
   446 					'ograve' => "\xC3\xB2",
       
   447 					'Ograve;' => "\xC3\x92",
       
   448 					'ograve;' => "\xC3\xB2",
       
   449 					'oline;' => "\xE2\x80\xBE",
       
   450 					'Omega;' => "\xCE\xA9",
       
   451 					'omega;' => "\xCF\x89",
       
   452 					'Omicron;' => "\xCE\x9F",
       
   453 					'omicron;' => "\xCE\xBF",
       
   454 					'oplus;' => "\xE2\x8A\x95",
       
   455 					'or;' => "\xE2\x88\xA8",
       
   456 					'ordf' => "\xC2\xAA",
       
   457 					'ordf;' => "\xC2\xAA",
       
   458 					'ordm' => "\xC2\xBA",
       
   459 					'ordm;' => "\xC2\xBA",
       
   460 					'Oslash' => "\xC3\x98",
       
   461 					'oslash' => "\xC3\xB8",
       
   462 					'Oslash;' => "\xC3\x98",
       
   463 					'oslash;' => "\xC3\xB8",
       
   464 					'Otilde' => "\xC3\x95",
       
   465 					'otilde' => "\xC3\xB5",
       
   466 					'Otilde;' => "\xC3\x95",
       
   467 					'otilde;' => "\xC3\xB5",
       
   468 					'otimes;' => "\xE2\x8A\x97",
       
   469 					'Ouml' => "\xC3\x96",
       
   470 					'ouml' => "\xC3\xB6",
       
   471 					'Ouml;' => "\xC3\x96",
       
   472 					'ouml;' => "\xC3\xB6",
       
   473 					'para' => "\xC2\xB6",
       
   474 					'para;' => "\xC2\xB6",
       
   475 					'part;' => "\xE2\x88\x82",
       
   476 					'permil;' => "\xE2\x80\xB0",
       
   477 					'perp;' => "\xE2\x8A\xA5",
       
   478 					'Phi;' => "\xCE\xA6",
       
   479 					'phi;' => "\xCF\x86",
       
   480 					'Pi;' => "\xCE\xA0",
       
   481 					'pi;' => "\xCF\x80",
       
   482 					'piv;' => "\xCF\x96",
       
   483 					'plusmn' => "\xC2\xB1",
       
   484 					'plusmn;' => "\xC2\xB1",
       
   485 					'pound' => "\xC2\xA3",
       
   486 					'pound;' => "\xC2\xA3",
       
   487 					'Prime;' => "\xE2\x80\xB3",
       
   488 					'prime;' => "\xE2\x80\xB2",
       
   489 					'prod;' => "\xE2\x88\x8F",
       
   490 					'prop;' => "\xE2\x88\x9D",
       
   491 					'Psi;' => "\xCE\xA8",
       
   492 					'psi;' => "\xCF\x88",
       
   493 					'QUOT' => "\x22",
       
   494 					'quot' => "\x22",
       
   495 					'QUOT;' => "\x22",
       
   496 					'quot;' => "\x22",
       
   497 					'radic;' => "\xE2\x88\x9A",
       
   498 					'rang;' => "\xE3\x80\x89",
       
   499 					'raquo' => "\xC2\xBB",
       
   500 					'raquo;' => "\xC2\xBB",
       
   501 					'rArr;' => "\xE2\x87\x92",
       
   502 					'rarr;' => "\xE2\x86\x92",
       
   503 					'rceil;' => "\xE2\x8C\x89",
       
   504 					'rdquo;' => "\xE2\x80\x9D",
       
   505 					'real;' => "\xE2\x84\x9C",
       
   506 					'REG' => "\xC2\xAE",
       
   507 					'reg' => "\xC2\xAE",
       
   508 					'REG;' => "\xC2\xAE",
       
   509 					'reg;' => "\xC2\xAE",
       
   510 					'rfloor;' => "\xE2\x8C\x8B",
       
   511 					'Rho;' => "\xCE\xA1",
       
   512 					'rho;' => "\xCF\x81",
       
   513 					'rlm;' => "\xE2\x80\x8F",
       
   514 					'rsaquo;' => "\xE2\x80\xBA",
       
   515 					'rsquo;' => "\xE2\x80\x99",
       
   516 					'sbquo;' => "\xE2\x80\x9A",
       
   517 					'Scaron;' => "\xC5\xA0",
       
   518 					'scaron;' => "\xC5\xA1",
       
   519 					'sdot;' => "\xE2\x8B\x85",
       
   520 					'sect' => "\xC2\xA7",
       
   521 					'sect;' => "\xC2\xA7",
       
   522 					'shy' => "\xC2\xAD",
       
   523 					'shy;' => "\xC2\xAD",
       
   524 					'Sigma;' => "\xCE\xA3",
       
   525 					'sigma;' => "\xCF\x83",
       
   526 					'sigmaf;' => "\xCF\x82",
       
   527 					'sim;' => "\xE2\x88\xBC",
       
   528 					'spades;' => "\xE2\x99\xA0",
       
   529 					'sub;' => "\xE2\x8A\x82",
       
   530 					'sube;' => "\xE2\x8A\x86",
       
   531 					'sum;' => "\xE2\x88\x91",
       
   532 					'sup;' => "\xE2\x8A\x83",
       
   533 					'sup1' => "\xC2\xB9",
       
   534 					'sup1;' => "\xC2\xB9",
       
   535 					'sup2' => "\xC2\xB2",
       
   536 					'sup2;' => "\xC2\xB2",
       
   537 					'sup3' => "\xC2\xB3",
       
   538 					'sup3;' => "\xC2\xB3",
       
   539 					'supe;' => "\xE2\x8A\x87",
       
   540 					'szlig' => "\xC3\x9F",
       
   541 					'szlig;' => "\xC3\x9F",
       
   542 					'Tau;' => "\xCE\xA4",
       
   543 					'tau;' => "\xCF\x84",
       
   544 					'there4;' => "\xE2\x88\xB4",
       
   545 					'Theta;' => "\xCE\x98",
       
   546 					'theta;' => "\xCE\xB8",
       
   547 					'thetasym;' => "\xCF\x91",
       
   548 					'thinsp;' => "\xE2\x80\x89",
       
   549 					'THORN' => "\xC3\x9E",
       
   550 					'thorn' => "\xC3\xBE",
       
   551 					'THORN;' => "\xC3\x9E",
       
   552 					'thorn;' => "\xC3\xBE",
       
   553 					'tilde;' => "\xCB\x9C",
       
   554 					'times' => "\xC3\x97",
       
   555 					'times;' => "\xC3\x97",
       
   556 					'TRADE;' => "\xE2\x84\xA2",
       
   557 					'trade;' => "\xE2\x84\xA2",
       
   558 					'Uacute' => "\xC3\x9A",
       
   559 					'uacute' => "\xC3\xBA",
       
   560 					'Uacute;' => "\xC3\x9A",
       
   561 					'uacute;' => "\xC3\xBA",
       
   562 					'uArr;' => "\xE2\x87\x91",
       
   563 					'uarr;' => "\xE2\x86\x91",
       
   564 					'Ucirc' => "\xC3\x9B",
       
   565 					'ucirc' => "\xC3\xBB",
       
   566 					'Ucirc;' => "\xC3\x9B",
       
   567 					'ucirc;' => "\xC3\xBB",
       
   568 					'Ugrave' => "\xC3\x99",
       
   569 					'ugrave' => "\xC3\xB9",
       
   570 					'Ugrave;' => "\xC3\x99",
       
   571 					'ugrave;' => "\xC3\xB9",
       
   572 					'uml' => "\xC2\xA8",
       
   573 					'uml;' => "\xC2\xA8",
       
   574 					'upsih;' => "\xCF\x92",
       
   575 					'Upsilon;' => "\xCE\xA5",
       
   576 					'upsilon;' => "\xCF\x85",
       
   577 					'Uuml' => "\xC3\x9C",
       
   578 					'uuml' => "\xC3\xBC",
       
   579 					'Uuml;' => "\xC3\x9C",
       
   580 					'uuml;' => "\xC3\xBC",
       
   581 					'weierp;' => "\xE2\x84\x98",
       
   582 					'Xi;' => "\xCE\x9E",
       
   583 					'xi;' => "\xCE\xBE",
       
   584 					'Yacute' => "\xC3\x9D",
       
   585 					'yacute' => "\xC3\xBD",
       
   586 					'Yacute;' => "\xC3\x9D",
       
   587 					'yacute;' => "\xC3\xBD",
       
   588 					'yen' => "\xC2\xA5",
       
   589 					'yen;' => "\xC2\xA5",
       
   590 					'yuml' => "\xC3\xBF",
       
   591 					'Yuml;' => "\xC5\xB8",
       
   592 					'yuml;' => "\xC3\xBF",
       
   593 					'Zeta;' => "\xCE\x96",
       
   594 					'zeta;' => "\xCE\xB6",
       
   595 					'zwj;' => "\xE2\x80\x8D",
       
   596 					'zwnj;' => "\xE2\x80\x8C"
       
   597 				);
       
   598 
       
   599 				for ($i = 0, $match = null; $i < 9 && $this->consume() !== false; $i++)
       
   600 				{
       
   601 					$consumed = substr($this->consumed, 1);
       
   602 					if (isset($entities[$consumed]))
       
   603 					{
       
   604 						$match = $consumed;
       
   605 					}
       
   606 				}
       
   607 
       
   608 				if ($match !== null)
       
   609 				{
       
   610  					$this->data = substr_replace($this->data, $entities[$match], $this->position - strlen($consumed) - 1, strlen($match) + 1);
       
   611 					$this->position += strlen($entities[$match]) - strlen($consumed) - 1;
       
   612 				}
       
   613 				break;
       
   614 		}
       
   615 	}
       
   616 }
       
   617