Chris@0
|
1 <?php
|
Chris@0
|
2
|
Chris@0
|
3 /*
|
Chris@0
|
4 * This file is part of the Symfony package.
|
Chris@0
|
5 *
|
Chris@0
|
6 * (c) Fabien Potencier <fabien@symfony.com>
|
Chris@0
|
7 *
|
Chris@0
|
8 * For the full copyright and license information, please view the LICENSE
|
Chris@0
|
9 * file that was distributed with this source code.
|
Chris@0
|
10 */
|
Chris@0
|
11
|
Chris@0
|
12 namespace Symfony\Component\CssSelector\Parser\Tokenizer;
|
Chris@0
|
13
|
Chris@0
|
14 /**
|
Chris@0
|
15 * CSS selector tokenizer escaping applier.
|
Chris@0
|
16 *
|
Chris@0
|
17 * This component is a port of the Python cssselect library,
|
Chris@0
|
18 * which is copyright Ian Bicking, @see https://github.com/SimonSapin/cssselect.
|
Chris@0
|
19 *
|
Chris@0
|
20 * @author Jean-François Simon <jeanfrancois.simon@sensiolabs.com>
|
Chris@0
|
21 *
|
Chris@0
|
22 * @internal
|
Chris@0
|
23 */
|
Chris@0
|
class TokenizerEscaping
{
    /**
     * Provider of the regular expressions used to locate escape sequences.
     *
     * @var TokenizerPatterns
     */
    private $patterns;

    /**
     * @param TokenizerPatterns $patterns Supplies the unicode, simple and new-line escape patterns
     */
    public function __construct(TokenizerPatterns $patterns)
    {
        $this->patterns = $patterns;
    }

    /**
     * Decodes hexadecimal escape sequences into UTF-8 bytes, then replaces
     * every match of the simple escape pattern with its first capture group.
     *
     * @param string $value
     *
     * @return string
     */
    public function escapeUnicode($value)
    {
        // Hexadecimal escapes must be resolved first; otherwise the simple
        // escape pass would consume their leading character.
        $value = $this->replaceUnicodeSequences($value);

        return preg_replace($this->patterns->getSimpleEscapePattern(), '$1', $value);
    }

    /**
     * Removes every match of the new-line escape pattern, then applies
     * {@see escapeUnicode()} to the remainder.
     *
     * @param string $value
     *
     * @return string
     */
    public function escapeUnicodeAndNewLine($value)
    {
        $value = preg_replace($this->patterns->getNewLineEscapePattern(), '', $value);

        return $this->escapeUnicode($value);
    }

    /**
     * Replaces each match of the unicode escape pattern with the UTF-8
     * encoding of the code point given (in hexadecimal) by capture group 1.
     *
     * Code points up to U+10FFFF are encoded on one to four bytes. A value
     * that is still above U+10FFFF after the 21-bit wrap-around has no UTF-8
     * representation and is replaced by an empty string.
     *
     * @param string $value
     *
     * @return string
     */
    private function replaceUnicodeSequences($value)
    {
        return preg_replace_callback($this->patterns->getUnicodeEscapePattern(), static function ($match) {
            // Keep only the low 21 bits, the widest value the layouts below can carry.
            $c = hexdec($match[1]) % 0x200000;

            if ($c < 0x80) {
                // 1 byte: 0xxxxxxx
                return chr($c);
            }
            if ($c < 0x800) {
                // 2 bytes: 110xxxxx 10xxxxxx
                return chr(0xC0 | $c >> 6).chr(0x80 | $c & 0x3F);
            }
            if ($c < 0x10000) {
                // 3 bytes: 1110xxxx 10xxxxxx 10xxxxxx
                return chr(0xE0 | $c >> 12).chr(0x80 | $c >> 6 & 0x3F).chr(0x80 | $c & 0x3F);
            }
            if ($c < 0x110000) {
                // 4 bytes: 11110xxx 10xxxxxx 10xxxxxx 10xxxxxx (supplementary planes)
                return chr(0xF0 | $c >> 18).chr(0x80 | $c >> 12 & 0x3F).chr(0x80 | $c >> 6 & 0x3F).chr(0x80 | $c & 0x3F);
            }

            // Beyond the Unicode range: drop the sequence explicitly instead of
            // relying on an implicit null return.
            return '';
        }, $value);
    }
}
|