Chris@0
|
1 <?php
|
Chris@0
|
2
|
Chris@0
|
3 /*
|
Chris@0
|
4 * This file is part of the Symfony package.
|
Chris@0
|
5 *
|
Chris@0
|
6 * (c) Fabien Potencier <fabien@symfony.com>
|
Chris@0
|
7 *
|
Chris@0
|
8 * For the full copyright and license information, please view the LICENSE
|
Chris@0
|
9 * file that was distributed with this source code.
|
Chris@0
|
10 */
|
Chris@0
|
11
|
Chris@0
|
12 namespace Symfony\Component\CssSelector\Parser\Tokenizer;
|
Chris@0
|
13
|
Chris@0
|
/**
 * Builds the regular expressions used to tokenize CSS selectors.
 *
 * The constructor assembles a set of regex fragments (escapes, name
 * characters, identifiers, hashes, numbers, quoted strings); the getters
 * expose some of them as complete, delimited PCRE patterns.
 *
 * This component is a port of the Python cssselect library,
 * which is copyright Ian Bicking, @see https://github.com/SimonSapin/cssselect.
 *
 * @author Jean-François Simon <jeanfrancois.simon@sensiolabs.com>
 *
 * @internal
 */
class TokenizerPatterns
{
    private $unicodeEscapePattern;
    private $simpleEscapePattern;
    private $newLineEscapePattern;
    private $escapePattern;
    private $stringEscapePattern;
    private $nonAsciiPattern;
    private $nmCharPattern;
    private $nmStartPattern;
    private $identifierPattern;
    private $hashPattern;
    private $numberPattern;
    private $quotedStringPattern;

    /**
     * Assembles every regex fragment, from the smallest pieces up.
     *
     * Fragments are stored without delimiters or anchors; those are added
     * by the getters.
     */
    public function __construct()
    {
        // Escape sequences: a backslash followed by 1-6 hex digits (with an
        // optional single trailing whitespace), any single character, or a
        // line break.
        $unicodeEscape = '\\\\([0-9a-f]{1,6})(?:\r\n|[ \n\r\t\f])?';
        $simpleEscape = '\\\\(.)';
        $newLineEscape = '\\\\(?:\n|\r\n|\r|\f)';

        // Composite escapes: hex escape, or a backslash followed by anything
        // that is neither a line break nor a hex digit.
        $escape = $unicodeEscape.'|\\\\[^\n\r\f0-9a-f]';
        $stringEscape = $newLineEscape.'|'.$escape;

        // Character alternatives allowed inside / at the start of a name.
        $nonAscii = '[^\x00-\x7F]';
        $nmChar = '[_a-z0-9-]|'.$escape.'|'.$nonAscii;
        $nmStart = '[_a-z]|'.$escape.'|'.$nonAscii;

        $this->unicodeEscapePattern = $unicodeEscape;
        $this->simpleEscapePattern = $simpleEscape;
        $this->newLineEscapePattern = $newLineEscape;
        $this->escapePattern = $escape;
        $this->stringEscapePattern = $stringEscape;
        $this->nonAsciiPattern = $nonAscii;
        $this->nmCharPattern = $nmChar;
        $this->nmStartPattern = $nmStart;

        // Token-level fragments built from the pieces above.
        $this->identifierPattern = '-?(?:'.$nmStart.')(?:'.$nmChar.')*';
        $this->hashPattern = '#((?:'.$nmChar.')+)';
        $this->numberPattern = '[+-]?(?:[0-9]*\.[0-9]+|[0-9]+)';

        // "%s" is a sprintf() placeholder filled in by getQuotedStringPattern().
        $this->quotedStringPattern = '([^\n\r\f%s]|'.$stringEscape.')*';
    }

    /**
     * Pattern for a backslash followed by a line break, anchored at the
     * start of the subject.
     *
     * NOTE(review): because of the "^" anchor only an escape at the very
     * beginning of the subject can match; confirm that callers do not rely
     * on this pattern to replace escapes further into a string.
     *
     * @return string
     */
    public function getNewLineEscapePattern()
    {
        return $this->anchored($this->newLineEscapePattern);
    }

    /**
     * Pattern for a backslash followed by any single character (captured in
     * group 1), anchored at the start of the subject.
     *
     * NOTE(review): same start-anchor caveat as getNewLineEscapePattern();
     * verify against the callers.
     *
     * @return string
     */
    public function getSimpleEscapePattern()
    {
        return $this->anchored($this->simpleEscapePattern);
    }

    /**
     * Case-insensitive pattern for a backslash followed by 1-6 hex digits
     * (captured in group 1) and an optional trailing whitespace, anchored at
     * the start of the subject.
     *
     * NOTE(review): same start-anchor caveat as getNewLineEscapePattern();
     * verify against the callers.
     *
     * @return string
     */
    public function getUnicodeEscapePattern()
    {
        return $this->anchored($this->unicodeEscapePattern, 'i');
    }

    /**
     * Case-insensitive pattern matching an identifier at the start of the
     * subject: an optional "-", one name-start character, then any number
     * of name characters.
     *
     * @return string
     */
    public function getIdentifierPattern()
    {
        return $this->anchored($this->identifierPattern, 'i');
    }

    /**
     * Case-insensitive pattern matching "#" followed by one or more name
     * characters at the start of the subject; the name (without the "#")
     * is the first capture group.
     *
     * @return string
     */
    public function getHashPattern()
    {
        return $this->anchored($this->hashPattern, 'i');
    }

    /**
     * Pattern matching an optionally signed integer or decimal number at
     * the start of the subject.
     *
     * @return string
     */
    public function getNumberPattern()
    {
        return $this->anchored($this->numberPattern);
    }

    /**
     * Case-insensitive pattern matching the content of a quoted string at
     * the start of the subject, stopping before an unescaped line break or
     * the given quote character.
     *
     * @param string $quote Quote character to exclude; it is inserted
     *                      verbatim into a character class (no regex
     *                      escaping is applied here)
     *
     * @return string
     */
    public function getQuotedStringPattern($quote)
    {
        $content = sprintf($this->quotedStringPattern, $quote);

        return $this->anchored($content, 'i');
    }

    /**
     * Wraps a regex fragment in "~" delimiters and anchors it with "^".
     *
     * @param string $fragment  Undelimited regex fragment
     * @param string $modifiers PCRE modifiers appended after the closing delimiter
     *
     * @return string
     */
    private function anchored($fragment, $modifiers = '')
    {
        return '~^'.$fragment.'~'.$modifiers;
    }
}