]>
Commit | Line | Data |
---|---|---|
42c80841 NL |
1 | <?php |
2 | /** | |
3 | * SimplePie | |
4 | * | |
5 | * A PHP-Based RSS and Atom Feed Framework. | |
6 | * Takes the hard work out of managing a complete RSS/Atom solution. | |
7 | * | |
8 | * Copyright (c) 2004-2012, Ryan Parman, Geoffrey Sneddon, Ryan McCue, and contributors | |
9 | * All rights reserved. | |
10 | * | |
11 | * Redistribution and use in source and binary forms, with or without modification, are | |
12 | * permitted provided that the following conditions are met: | |
13 | * | |
14 | * * Redistributions of source code must retain the above copyright notice, this list of | |
15 | * conditions and the following disclaimer. | |
16 | * | |
17 | * * Redistributions in binary form must reproduce the above copyright notice, this list | |
18 | * of conditions and the following disclaimer in the documentation and/or other materials | |
19 | * provided with the distribution. | |
20 | * | |
21 | * * Neither the name of the SimplePie Team nor the names of its contributors may be used | |
22 | * to endorse or promote products derived from this software without specific prior | |
23 | * written permission. | |
24 | * | |
25 | * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND ANY EXPRESS | |
26 | * OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY | |
27 | * AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDERS | |
28 | * AND CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR | |
29 | * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR | |
30 | * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY | |
31 | * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR | |
32 | * OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE | |
33 | * POSSIBILITY OF SUCH DAMAGE. | |
34 | * | |
35 | * @package SimplePie | |
36 | * @version 1.3.1 | |
37 | * @copyright 2004-2012 Ryan Parman, Geoffrey Sneddon, Ryan McCue | |
38 | * @author Ryan Parman | |
39 | * @author Geoffrey Sneddon | |
40 | * @author Ryan McCue | |
41 | * @link http://simplepie.org/ SimplePie | |
42 | * @license http://www.opensource.org/licenses/bsd-license.php BSD License | |
43 | */ | |
44 | ||
45 | ||
46 | /** | |
47 | * Decode HTML Entities | |
48 | * | |
49 | * This implements HTML5 as of revision 967 (2007-06-28) | |
50 | * | |
51 | * @deprecated Use DOMDocument instead! | |
52 | * @package SimplePie | |
53 | */ | |
54 | class SimplePie_Decode_HTML_Entities | |
55 | { | |
56 | /** | |
57 | * Data to be parsed | |
58 | * | |
59 | * @access private | |
60 | * @var string | |
61 | */ | |
62 | var $data = ''; | |
63 | ||
64 | /** | |
65 | * Currently consumed bytes | |
66 | * | |
67 | * @access private | |
68 | * @var string | |
69 | */ | |
70 | var $consumed = ''; | |
71 | ||
72 | /** | |
73 | * Position of the current byte being parsed | |
74 | * | |
75 | * @access private | |
76 | * @var int | |
77 | */ | |
78 | var $position = 0; | |
79 | ||
80 | /** | |
81 | * Create an instance of the class with the input data | |
82 | * | |
83 | * @access public | |
84 | * @param string $data Input data | |
85 | */ | |
86 | public function __construct($data) | |
87 | { | |
88 | $this->data = $data; | |
89 | } | |
90 | ||
91 | /** | |
92 | * Parse the input data | |
93 | * | |
94 | * @access public | |
95 | * @return string Output data | |
96 | */ | |
97 | public function parse() | |
98 | { | |
99 | while (($this->position = strpos($this->data, '&', $this->position)) !== false) | |
100 | { | |
101 | $this->consume(); | |
102 | $this->entity(); | |
103 | $this->consumed = ''; | |
104 | } | |
105 | return $this->data; | |
106 | } | |
107 | ||
108 | /** | |
109 | * Consume the next byte | |
110 | * | |
111 | * @access private | |
112 | * @return mixed The next byte, or false, if there is no more data | |
113 | */ | |
114 | public function consume() | |
115 | { | |
116 | if (isset($this->data[$this->position])) | |
117 | { | |
118 | $this->consumed .= $this->data[$this->position]; | |
119 | return $this->data[$this->position++]; | |
120 | } | |
121 | else | |
122 | { | |
123 | return false; | |
124 | } | |
125 | } | |
126 | ||
127 | /** | |
128 | * Consume a range of characters | |
129 | * | |
130 | * @access private | |
131 | * @param string $chars Characters to consume | |
132 | * @return mixed A series of characters that match the range, or false | |
133 | */ | |
134 | public function consume_range($chars) | |
135 | { | |
136 | if ($len = strspn($this->data, $chars, $this->position)) | |
137 | { | |
138 | $data = substr($this->data, $this->position, $len); | |
139 | $this->consumed .= $data; | |
140 | $this->position += $len; | |
141 | return $data; | |
142 | } | |
143 | else | |
144 | { | |
145 | return false; | |
146 | } | |
147 | } | |
148 | ||
149 | /** | |
150 | * Unconsume one byte | |
151 | * | |
152 | * @access private | |
153 | */ | |
154 | public function unconsume() | |
155 | { | |
156 | $this->consumed = substr($this->consumed, 0, -1); | |
157 | $this->position--; | |
158 | } | |
159 | ||
160 | /** | |
161 | * Decode an entity | |
162 | * | |
163 | * @access private | |
164 | */ | |
165 | public function entity() | |
166 | { | |
167 | switch ($this->consume()) | |
168 | { | |
169 | case "\x09": | |
170 | case "\x0A": | |
171 | case "\x0B": | |
172 | case "\x0B": | |
173 | case "\x0C": | |
174 | case "\x20": | |
175 | case "\x3C": | |
176 | case "\x26": | |
177 | case false: | |
178 | break; | |
179 | ||
180 | case "\x23": | |
181 | switch ($this->consume()) | |
182 | { | |
183 | case "\x78": | |
184 | case "\x58": | |
185 | $range = '0123456789ABCDEFabcdef'; | |
186 | $hex = true; | |
187 | break; | |
188 | ||
189 | default: | |
190 | $range = '0123456789'; | |
191 | $hex = false; | |
192 | $this->unconsume(); | |
193 | break; | |
194 | } | |
195 | ||
196 | if ($codepoint = $this->consume_range($range)) | |
197 | { | |
198 | static $windows_1252_specials = array(0x0D => "\x0A", 0x80 => "\xE2\x82\xAC", 0x81 => "\xEF\xBF\xBD", 0x82 => "\xE2\x80\x9A", 0x83 => "\xC6\x92", 0x84 => "\xE2\x80\x9E", 0x85 => "\xE2\x80\xA6", 0x86 => "\xE2\x80\xA0", 0x87 => "\xE2\x80\xA1", 0x88 => "\xCB\x86", 0x89 => "\xE2\x80\xB0", 0x8A => "\xC5\xA0", 0x8B => "\xE2\x80\xB9", 0x8C => "\xC5\x92", 0x8D => "\xEF\xBF\xBD", 0x8E => "\xC5\xBD", 0x8F => "\xEF\xBF\xBD", 0x90 => "\xEF\xBF\xBD", 0x91 => "\xE2\x80\x98", 0x92 => "\xE2\x80\x99", 0x93 => "\xE2\x80\x9C", 0x94 => "\xE2\x80\x9D", 0x95 => "\xE2\x80\xA2", 0x96 => "\xE2\x80\x93", 0x97 => "\xE2\x80\x94", 0x98 => "\xCB\x9C", 0x99 => "\xE2\x84\xA2", 0x9A => "\xC5\xA1", 0x9B => "\xE2\x80\xBA", 0x9C => "\xC5\x93", 0x9D => "\xEF\xBF\xBD", 0x9E => "\xC5\xBE", 0x9F => "\xC5\xB8"); | |
199 | ||
200 | if ($hex) | |
201 | { | |
202 | $codepoint = hexdec($codepoint); | |
203 | } | |
204 | else | |
205 | { | |
206 | $codepoint = intval($codepoint); | |
207 | } | |
208 | ||
209 | if (isset($windows_1252_specials[$codepoint])) | |
210 | { | |
211 | $replacement = $windows_1252_specials[$codepoint]; | |
212 | } | |
213 | else | |
214 | { | |
215 | $replacement = SimplePie_Misc::codepoint_to_utf8($codepoint); | |
216 | } | |
217 | ||
218 | if (!in_array($this->consume(), array(';', false), true)) | |
219 | { | |
220 | $this->unconsume(); | |
221 | } | |
222 | ||
223 | $consumed_length = strlen($this->consumed); | |
224 | $this->data = substr_replace($this->data, $replacement, $this->position - $consumed_length, $consumed_length); | |
225 | $this->position += strlen($replacement) - $consumed_length; | |
226 | } | |
227 | break; | |
228 | ||
229 | default: | |
230 | static $entities = array( | |
231 | 'Aacute' => "\xC3\x81", | |
232 | 'aacute' => "\xC3\xA1", | |
233 | 'Aacute;' => "\xC3\x81", | |
234 | 'aacute;' => "\xC3\xA1", | |
235 | 'Acirc' => "\xC3\x82", | |
236 | 'acirc' => "\xC3\xA2", | |
237 | 'Acirc;' => "\xC3\x82", | |
238 | 'acirc;' => "\xC3\xA2", | |
239 | 'acute' => "\xC2\xB4", | |
240 | 'acute;' => "\xC2\xB4", | |
241 | 'AElig' => "\xC3\x86", | |
242 | 'aelig' => "\xC3\xA6", | |
243 | 'AElig;' => "\xC3\x86", | |
244 | 'aelig;' => "\xC3\xA6", | |
245 | 'Agrave' => "\xC3\x80", | |
246 | 'agrave' => "\xC3\xA0", | |
247 | 'Agrave;' => "\xC3\x80", | |
248 | 'agrave;' => "\xC3\xA0", | |
249 | 'alefsym;' => "\xE2\x84\xB5", | |
250 | 'Alpha;' => "\xCE\x91", | |
251 | 'alpha;' => "\xCE\xB1", | |
252 | 'AMP' => "\x26", | |
253 | 'amp' => "\x26", | |
254 | 'AMP;' => "\x26", | |
255 | 'amp;' => "\x26", | |
256 | 'and;' => "\xE2\x88\xA7", | |
257 | 'ang;' => "\xE2\x88\xA0", | |
258 | 'apos;' => "\x27", | |
259 | 'Aring' => "\xC3\x85", | |
260 | 'aring' => "\xC3\xA5", | |
261 | 'Aring;' => "\xC3\x85", | |
262 | 'aring;' => "\xC3\xA5", | |
263 | 'asymp;' => "\xE2\x89\x88", | |
264 | 'Atilde' => "\xC3\x83", | |
265 | 'atilde' => "\xC3\xA3", | |
266 | 'Atilde;' => "\xC3\x83", | |
267 | 'atilde;' => "\xC3\xA3", | |
268 | 'Auml' => "\xC3\x84", | |
269 | 'auml' => "\xC3\xA4", | |
270 | 'Auml;' => "\xC3\x84", | |
271 | 'auml;' => "\xC3\xA4", | |
272 | 'bdquo;' => "\xE2\x80\x9E", | |
273 | 'Beta;' => "\xCE\x92", | |
274 | 'beta;' => "\xCE\xB2", | |
275 | 'brvbar' => "\xC2\xA6", | |
276 | 'brvbar;' => "\xC2\xA6", | |
277 | 'bull;' => "\xE2\x80\xA2", | |
278 | 'cap;' => "\xE2\x88\xA9", | |
279 | 'Ccedil' => "\xC3\x87", | |
280 | 'ccedil' => "\xC3\xA7", | |
281 | 'Ccedil;' => "\xC3\x87", | |
282 | 'ccedil;' => "\xC3\xA7", | |
283 | 'cedil' => "\xC2\xB8", | |
284 | 'cedil;' => "\xC2\xB8", | |
285 | 'cent' => "\xC2\xA2", | |
286 | 'cent;' => "\xC2\xA2", | |
287 | 'Chi;' => "\xCE\xA7", | |
288 | 'chi;' => "\xCF\x87", | |
289 | 'circ;' => "\xCB\x86", | |
290 | 'clubs;' => "\xE2\x99\xA3", | |
291 | 'cong;' => "\xE2\x89\x85", | |
292 | 'COPY' => "\xC2\xA9", | |
293 | 'copy' => "\xC2\xA9", | |
294 | 'COPY;' => "\xC2\xA9", | |
295 | 'copy;' => "\xC2\xA9", | |
296 | 'crarr;' => "\xE2\x86\xB5", | |
297 | 'cup;' => "\xE2\x88\xAA", | |
298 | 'curren' => "\xC2\xA4", | |
299 | 'curren;' => "\xC2\xA4", | |
300 | 'Dagger;' => "\xE2\x80\xA1", | |
301 | 'dagger;' => "\xE2\x80\xA0", | |
302 | 'dArr;' => "\xE2\x87\x93", | |
303 | 'darr;' => "\xE2\x86\x93", | |
304 | 'deg' => "\xC2\xB0", | |
305 | 'deg;' => "\xC2\xB0", | |
306 | 'Delta;' => "\xCE\x94", | |
307 | 'delta;' => "\xCE\xB4", | |
308 | 'diams;' => "\xE2\x99\xA6", | |
309 | 'divide' => "\xC3\xB7", | |
310 | 'divide;' => "\xC3\xB7", | |
311 | 'Eacute' => "\xC3\x89", | |
312 | 'eacute' => "\xC3\xA9", | |
313 | 'Eacute;' => "\xC3\x89", | |
314 | 'eacute;' => "\xC3\xA9", | |
315 | 'Ecirc' => "\xC3\x8A", | |
316 | 'ecirc' => "\xC3\xAA", | |
317 | 'Ecirc;' => "\xC3\x8A", | |
318 | 'ecirc;' => "\xC3\xAA", | |
319 | 'Egrave' => "\xC3\x88", | |
320 | 'egrave' => "\xC3\xA8", | |
321 | 'Egrave;' => "\xC3\x88", | |
322 | 'egrave;' => "\xC3\xA8", | |
323 | 'empty;' => "\xE2\x88\x85", | |
324 | 'emsp;' => "\xE2\x80\x83", | |
325 | 'ensp;' => "\xE2\x80\x82", | |
326 | 'Epsilon;' => "\xCE\x95", | |
327 | 'epsilon;' => "\xCE\xB5", | |
328 | 'equiv;' => "\xE2\x89\xA1", | |
329 | 'Eta;' => "\xCE\x97", | |
330 | 'eta;' => "\xCE\xB7", | |
331 | 'ETH' => "\xC3\x90", | |
332 | 'eth' => "\xC3\xB0", | |
333 | 'ETH;' => "\xC3\x90", | |
334 | 'eth;' => "\xC3\xB0", | |
335 | 'Euml' => "\xC3\x8B", | |
336 | 'euml' => "\xC3\xAB", | |
337 | 'Euml;' => "\xC3\x8B", | |
338 | 'euml;' => "\xC3\xAB", | |
339 | 'euro;' => "\xE2\x82\xAC", | |
340 | 'exist;' => "\xE2\x88\x83", | |
341 | 'fnof;' => "\xC6\x92", | |
342 | 'forall;' => "\xE2\x88\x80", | |
343 | 'frac12' => "\xC2\xBD", | |
344 | 'frac12;' => "\xC2\xBD", | |
345 | 'frac14' => "\xC2\xBC", | |
346 | 'frac14;' => "\xC2\xBC", | |
347 | 'frac34' => "\xC2\xBE", | |
348 | 'frac34;' => "\xC2\xBE", | |
349 | 'frasl;' => "\xE2\x81\x84", | |
350 | 'Gamma;' => "\xCE\x93", | |
351 | 'gamma;' => "\xCE\xB3", | |
352 | 'ge;' => "\xE2\x89\xA5", | |
353 | 'GT' => "\x3E", | |
354 | 'gt' => "\x3E", | |
355 | 'GT;' => "\x3E", | |
356 | 'gt;' => "\x3E", | |
357 | 'hArr;' => "\xE2\x87\x94", | |
358 | 'harr;' => "\xE2\x86\x94", | |
359 | 'hearts;' => "\xE2\x99\xA5", | |
360 | 'hellip;' => "\xE2\x80\xA6", | |
361 | 'Iacute' => "\xC3\x8D", | |
362 | 'iacute' => "\xC3\xAD", | |
363 | 'Iacute;' => "\xC3\x8D", | |
364 | 'iacute;' => "\xC3\xAD", | |
365 | 'Icirc' => "\xC3\x8E", | |
366 | 'icirc' => "\xC3\xAE", | |
367 | 'Icirc;' => "\xC3\x8E", | |
368 | 'icirc;' => "\xC3\xAE", | |
369 | 'iexcl' => "\xC2\xA1", | |
370 | 'iexcl;' => "\xC2\xA1", | |
371 | 'Igrave' => "\xC3\x8C", | |
372 | 'igrave' => "\xC3\xAC", | |
373 | 'Igrave;' => "\xC3\x8C", | |
374 | 'igrave;' => "\xC3\xAC", | |
375 | 'image;' => "\xE2\x84\x91", | |
376 | 'infin;' => "\xE2\x88\x9E", | |
377 | 'int;' => "\xE2\x88\xAB", | |
378 | 'Iota;' => "\xCE\x99", | |
379 | 'iota;' => "\xCE\xB9", | |
380 | 'iquest' => "\xC2\xBF", | |
381 | 'iquest;' => "\xC2\xBF", | |
382 | 'isin;' => "\xE2\x88\x88", | |
383 | 'Iuml' => "\xC3\x8F", | |
384 | 'iuml' => "\xC3\xAF", | |
385 | 'Iuml;' => "\xC3\x8F", | |
386 | 'iuml;' => "\xC3\xAF", | |
387 | 'Kappa;' => "\xCE\x9A", | |
388 | 'kappa;' => "\xCE\xBA", | |
389 | 'Lambda;' => "\xCE\x9B", | |
390 | 'lambda;' => "\xCE\xBB", | |
391 | 'lang;' => "\xE3\x80\x88", | |
392 | 'laquo' => "\xC2\xAB", | |
393 | 'laquo;' => "\xC2\xAB", | |
394 | 'lArr;' => "\xE2\x87\x90", | |
395 | 'larr;' => "\xE2\x86\x90", | |
396 | 'lceil;' => "\xE2\x8C\x88", | |
397 | 'ldquo;' => "\xE2\x80\x9C", | |
398 | 'le;' => "\xE2\x89\xA4", | |
399 | 'lfloor;' => "\xE2\x8C\x8A", | |
400 | 'lowast;' => "\xE2\x88\x97", | |
401 | 'loz;' => "\xE2\x97\x8A", | |
402 | 'lrm;' => "\xE2\x80\x8E", | |
403 | 'lsaquo;' => "\xE2\x80\xB9", | |
404 | 'lsquo;' => "\xE2\x80\x98", | |
405 | 'LT' => "\x3C", | |
406 | 'lt' => "\x3C", | |
407 | 'LT;' => "\x3C", | |
408 | 'lt;' => "\x3C", | |
409 | 'macr' => "\xC2\xAF", | |
410 | 'macr;' => "\xC2\xAF", | |
411 | 'mdash;' => "\xE2\x80\x94", | |
412 | 'micro' => "\xC2\xB5", | |
413 | 'micro;' => "\xC2\xB5", | |
414 | 'middot' => "\xC2\xB7", | |
415 | 'middot;' => "\xC2\xB7", | |
416 | 'minus;' => "\xE2\x88\x92", | |
417 | 'Mu;' => "\xCE\x9C", | |
418 | 'mu;' => "\xCE\xBC", | |
419 | 'nabla;' => "\xE2\x88\x87", | |
420 | 'nbsp' => "\xC2\xA0", | |
421 | 'nbsp;' => "\xC2\xA0", | |
422 | 'ndash;' => "\xE2\x80\x93", | |
423 | 'ne;' => "\xE2\x89\xA0", | |
424 | 'ni;' => "\xE2\x88\x8B", | |
425 | 'not' => "\xC2\xAC", | |
426 | 'not;' => "\xC2\xAC", | |
427 | 'notin;' => "\xE2\x88\x89", | |
428 | 'nsub;' => "\xE2\x8A\x84", | |
429 | 'Ntilde' => "\xC3\x91", | |
430 | 'ntilde' => "\xC3\xB1", | |
431 | 'Ntilde;' => "\xC3\x91", | |
432 | 'ntilde;' => "\xC3\xB1", | |
433 | 'Nu;' => "\xCE\x9D", | |
434 | 'nu;' => "\xCE\xBD", | |
435 | 'Oacute' => "\xC3\x93", | |
436 | 'oacute' => "\xC3\xB3", | |
437 | 'Oacute;' => "\xC3\x93", | |
438 | 'oacute;' => "\xC3\xB3", | |
439 | 'Ocirc' => "\xC3\x94", | |
440 | 'ocirc' => "\xC3\xB4", | |
441 | 'Ocirc;' => "\xC3\x94", | |
442 | 'ocirc;' => "\xC3\xB4", | |
443 | 'OElig;' => "\xC5\x92", | |
444 | 'oelig;' => "\xC5\x93", | |
445 | 'Ograve' => "\xC3\x92", | |
446 | 'ograve' => "\xC3\xB2", | |
447 | 'Ograve;' => "\xC3\x92", | |
448 | 'ograve;' => "\xC3\xB2", | |
449 | 'oline;' => "\xE2\x80\xBE", | |
450 | 'Omega;' => "\xCE\xA9", | |
451 | 'omega;' => "\xCF\x89", | |
452 | 'Omicron;' => "\xCE\x9F", | |
453 | 'omicron;' => "\xCE\xBF", | |
454 | 'oplus;' => "\xE2\x8A\x95", | |
455 | 'or;' => "\xE2\x88\xA8", | |
456 | 'ordf' => "\xC2\xAA", | |
457 | 'ordf;' => "\xC2\xAA", | |
458 | 'ordm' => "\xC2\xBA", | |
459 | 'ordm;' => "\xC2\xBA", | |
460 | 'Oslash' => "\xC3\x98", | |
461 | 'oslash' => "\xC3\xB8", | |
462 | 'Oslash;' => "\xC3\x98", | |
463 | 'oslash;' => "\xC3\xB8", | |
464 | 'Otilde' => "\xC3\x95", | |
465 | 'otilde' => "\xC3\xB5", | |
466 | 'Otilde;' => "\xC3\x95", | |
467 | 'otilde;' => "\xC3\xB5", | |
468 | 'otimes;' => "\xE2\x8A\x97", | |
469 | 'Ouml' => "\xC3\x96", | |
470 | 'ouml' => "\xC3\xB6", | |
471 | 'Ouml;' => "\xC3\x96", | |
472 | 'ouml;' => "\xC3\xB6", | |
473 | 'para' => "\xC2\xB6", | |
474 | 'para;' => "\xC2\xB6", | |
475 | 'part;' => "\xE2\x88\x82", | |
476 | 'permil;' => "\xE2\x80\xB0", | |
477 | 'perp;' => "\xE2\x8A\xA5", | |
478 | 'Phi;' => "\xCE\xA6", | |
479 | 'phi;' => "\xCF\x86", | |
480 | 'Pi;' => "\xCE\xA0", | |
481 | 'pi;' => "\xCF\x80", | |
482 | 'piv;' => "\xCF\x96", | |
483 | 'plusmn' => "\xC2\xB1", | |
484 | 'plusmn;' => "\xC2\xB1", | |
485 | 'pound' => "\xC2\xA3", | |
486 | 'pound;' => "\xC2\xA3", | |
487 | 'Prime;' => "\xE2\x80\xB3", | |
488 | 'prime;' => "\xE2\x80\xB2", | |
489 | 'prod;' => "\xE2\x88\x8F", | |
490 | 'prop;' => "\xE2\x88\x9D", | |
491 | 'Psi;' => "\xCE\xA8", | |
492 | 'psi;' => "\xCF\x88", | |
493 | 'QUOT' => "\x22", | |
494 | 'quot' => "\x22", | |
495 | 'QUOT;' => "\x22", | |
496 | 'quot;' => "\x22", | |
497 | 'radic;' => "\xE2\x88\x9A", | |
498 | 'rang;' => "\xE3\x80\x89", | |
499 | 'raquo' => "\xC2\xBB", | |
500 | 'raquo;' => "\xC2\xBB", | |
501 | 'rArr;' => "\xE2\x87\x92", | |
502 | 'rarr;' => "\xE2\x86\x92", | |
503 | 'rceil;' => "\xE2\x8C\x89", | |
504 | 'rdquo;' => "\xE2\x80\x9D", | |
505 | 'real;' => "\xE2\x84\x9C", | |
506 | 'REG' => "\xC2\xAE", | |
507 | 'reg' => "\xC2\xAE", | |
508 | 'REG;' => "\xC2\xAE", | |
509 | 'reg;' => "\xC2\xAE", | |
510 | 'rfloor;' => "\xE2\x8C\x8B", | |
511 | 'Rho;' => "\xCE\xA1", | |
512 | 'rho;' => "\xCF\x81", | |
513 | 'rlm;' => "\xE2\x80\x8F", | |
514 | 'rsaquo;' => "\xE2\x80\xBA", | |
515 | 'rsquo;' => "\xE2\x80\x99", | |
516 | 'sbquo;' => "\xE2\x80\x9A", | |
517 | 'Scaron;' => "\xC5\xA0", | |
518 | 'scaron;' => "\xC5\xA1", | |
519 | 'sdot;' => "\xE2\x8B\x85", | |
520 | 'sect' => "\xC2\xA7", | |
521 | 'sect;' => "\xC2\xA7", | |
522 | 'shy' => "\xC2\xAD", | |
523 | 'shy;' => "\xC2\xAD", | |
524 | 'Sigma;' => "\xCE\xA3", | |
525 | 'sigma;' => "\xCF\x83", | |
526 | 'sigmaf;' => "\xCF\x82", | |
527 | 'sim;' => "\xE2\x88\xBC", | |
528 | 'spades;' => "\xE2\x99\xA0", | |
529 | 'sub;' => "\xE2\x8A\x82", | |
530 | 'sube;' => "\xE2\x8A\x86", | |
531 | 'sum;' => "\xE2\x88\x91", | |
532 | 'sup;' => "\xE2\x8A\x83", | |
533 | 'sup1' => "\xC2\xB9", | |
534 | 'sup1;' => "\xC2\xB9", | |
535 | 'sup2' => "\xC2\xB2", | |
536 | 'sup2;' => "\xC2\xB2", | |
537 | 'sup3' => "\xC2\xB3", | |
538 | 'sup3;' => "\xC2\xB3", | |
539 | 'supe;' => "\xE2\x8A\x87", | |
540 | 'szlig' => "\xC3\x9F", | |
541 | 'szlig;' => "\xC3\x9F", | |
542 | 'Tau;' => "\xCE\xA4", | |
543 | 'tau;' => "\xCF\x84", | |
544 | 'there4;' => "\xE2\x88\xB4", | |
545 | 'Theta;' => "\xCE\x98", | |
546 | 'theta;' => "\xCE\xB8", | |
547 | 'thetasym;' => "\xCF\x91", | |
548 | 'thinsp;' => "\xE2\x80\x89", | |
549 | 'THORN' => "\xC3\x9E", | |
550 | 'thorn' => "\xC3\xBE", | |
551 | 'THORN;' => "\xC3\x9E", | |
552 | 'thorn;' => "\xC3\xBE", | |
553 | 'tilde;' => "\xCB\x9C", | |
554 | 'times' => "\xC3\x97", | |
555 | 'times;' => "\xC3\x97", | |
556 | 'TRADE;' => "\xE2\x84\xA2", | |
557 | 'trade;' => "\xE2\x84\xA2", | |
558 | 'Uacute' => "\xC3\x9A", | |
559 | 'uacute' => "\xC3\xBA", | |
560 | 'Uacute;' => "\xC3\x9A", | |
561 | 'uacute;' => "\xC3\xBA", | |
562 | 'uArr;' => "\xE2\x87\x91", | |
563 | 'uarr;' => "\xE2\x86\x91", | |
564 | 'Ucirc' => "\xC3\x9B", | |
565 | 'ucirc' => "\xC3\xBB", | |
566 | 'Ucirc;' => "\xC3\x9B", | |
567 | 'ucirc;' => "\xC3\xBB", | |
568 | 'Ugrave' => "\xC3\x99", | |
569 | 'ugrave' => "\xC3\xB9", | |
570 | 'Ugrave;' => "\xC3\x99", | |
571 | 'ugrave;' => "\xC3\xB9", | |
572 | 'uml' => "\xC2\xA8", | |
573 | 'uml;' => "\xC2\xA8", | |
574 | 'upsih;' => "\xCF\x92", | |
575 | 'Upsilon;' => "\xCE\xA5", | |
576 | 'upsilon;' => "\xCF\x85", | |
577 | 'Uuml' => "\xC3\x9C", | |
578 | 'uuml' => "\xC3\xBC", | |
579 | 'Uuml;' => "\xC3\x9C", | |
580 | 'uuml;' => "\xC3\xBC", | |
581 | 'weierp;' => "\xE2\x84\x98", | |
582 | 'Xi;' => "\xCE\x9E", | |
583 | 'xi;' => "\xCE\xBE", | |
584 | 'Yacute' => "\xC3\x9D", | |
585 | 'yacute' => "\xC3\xBD", | |
586 | 'Yacute;' => "\xC3\x9D", | |
587 | 'yacute;' => "\xC3\xBD", | |
588 | 'yen' => "\xC2\xA5", | |
589 | 'yen;' => "\xC2\xA5", | |
590 | 'yuml' => "\xC3\xBF", | |
591 | 'Yuml;' => "\xC5\xB8", | |
592 | 'yuml;' => "\xC3\xBF", | |
593 | 'Zeta;' => "\xCE\x96", | |
594 | 'zeta;' => "\xCE\xB6", | |
595 | 'zwj;' => "\xE2\x80\x8D", | |
596 | 'zwnj;' => "\xE2\x80\x8C" | |
597 | ); | |
598 | ||
599 | for ($i = 0, $match = null; $i < 9 && $this->consume() !== false; $i++) | |
600 | { | |
601 | $consumed = substr($this->consumed, 1); | |
602 | if (isset($entities[$consumed])) | |
603 | { | |
604 | $match = $consumed; | |
605 | } | |
606 | } | |
607 | ||
608 | if ($match !== null) | |
609 | { | |
610 | $this->data = substr_replace($this->data, $entities[$match], $this->position - strlen($consumed) - 1, strlen($match) + 1); | |
611 | $this->position += strlen($entities[$match]) - strlen($consumed) - 1; | |
612 | } | |
613 | break; | |
614 | } | |
615 | } | |
616 | } | |
617 |