1 | <?php |
||
7 | class EmailLexer extends AbstractLexer |
||
8 | { |
||
// Token type identifiers.
// Most values equal the ASCII code of the character they represent; the
// exceptions are called out per group below.

// Type reported for an empty token.
const S_EMPTY = null;

// Control characters and whitespace (ASCII 0-32).
const C_NUL  = 0;
const S_HTAB = 9;
const S_LF   = 10;
const S_CR   = 13;
const S_SP   = 32;

// Punctuation, ASCII 33-47.
const EXCLAMATION        = 33;
const S_DQUOTE           = 34;
const NUMBER_SIGN        = 35;
const DOLLAR             = 36;
const PERCENTAGE         = 37;
const AMPERSAND          = 38;
const S_SQUOTE           = 39;
const S_OPENPARENTHESIS  = 40;
const S_CLOSEPARENTHESIS = 41;
const ASTERISK           = 42;
const S_PLUS             = 43;
const S_COMMA            = 44;
const S_HYPHEN           = 45;
const S_DOT              = 46;
const S_SLASH            = 47;

// Punctuation, ASCII 58-64.
const S_COLON       = 58;
const S_SEMICOLON   = 59;
const S_LOWERTHAN   = 60;
const S_EQUAL       = 61;
const S_GREATERTHAN = 62;
const QUESTIONMARK  = 63;
const S_AT          = 64;

// Punctuation, ASCII 91-96.
const S_OPENBRACKET  = 91;
const S_BACKSLASH    = 92;
const S_CLOSEBRACKET = 93;
const CARET          = 94;
const S_UNDERSCORE   = 95;
const S_BACKTICK     = 96;

// Punctuation and DEL, ASCII 123-127.
const S_OPENCURLYBRACES  = 123;
const S_PIPE             = 124;
const S_CLOSECURLYBRACES = 125;
const S_TILDE            = 126;
const C_DEL              = 127;

// Non-ASCII punctuation.
// NOTE(review): 168 and 173 are not the Latin-1/Unicode code points of the
// inverted marks (those are 191 and 161); they match the code page 437
// positions - confirm before relying on the numeric values.
const INVERT_QUESTIONMARK = 168;
const INVERT_EXCLAMATION  = 173;

// Synthetic types that do not correspond to a single character code.
const GENERIC     = 300;
const S_IPV6TAG   = 301;
const INVALID     = 302;
// Looks like the CR (13) and LF (10) codes written side by side.
const CRLF          = 1310;
// Looks like the colon code (58) written twice.
const S_DOUBLECOLON = 5858;

// Presumably the bounds of a character-code range treated as invalid; the
// code that consumes them is not visible here - verify against its usage.
const ASCII_INVALID_FROM = 127;
const ASCII_INVALID_TO   = 199;
||
58 | |||
/**
 * Lookup table from a literal token string to its token-type constant.
 *
 * Besides single punctuation, whitespace and control characters, the table
 * holds the multi-character tokens "::", "\r\n" and "IPv6".
 *
 * The table is not limited to characters that are invalid for atext: several
 * keys (for example '!', '#', '$', '*') are themselves valid atext under
 * RFC 5322 (@link http://tools.ietf.org/html/rfc5322#section-3.2.3).
 *
 * @var array
 *
 * @psalm-var array<string, int|null>
 */
protected $charValue = [
    '{'    => self::S_OPENCURLYBRACES,
    '}'    => self::S_CLOSECURLYBRACES,
    '('    => self::S_OPENPARENTHESIS,
    ')'    => self::S_CLOSEPARENTHESIS,
    '<'    => self::S_LOWERTHAN,
    '>'    => self::S_GREATERTHAN,
    '['    => self::S_OPENBRACKET,
    ']'    => self::S_CLOSEBRACKET,
    ':'    => self::S_COLON,
    ';'    => self::S_SEMICOLON,
    '@'    => self::S_AT,
    '\\'   => self::S_BACKSLASH,
    '/'    => self::S_SLASH,
    ','    => self::S_COMMA,
    '.'    => self::S_DOT,
    "'"    => self::S_SQUOTE,
    "`"    => self::S_BACKTICK,
    '"'    => self::S_DQUOTE,
    '-'    => self::S_HYPHEN,
    '::'   => self::S_DOUBLECOLON,
    ' '    => self::S_SP,
    "\t"   => self::S_HTAB,
    "\r"   => self::S_CR,
    "\n"   => self::S_LF,
    "\r\n" => self::CRLF,
    'IPv6' => self::S_IPV6TAG,
    // PHP casts a null array key to '', so this single entry also covers
    // the null key that used to be listed separately at the end.
    ''     => self::S_EMPTY,
    // Must be double-quoted: inside single quotes PHP leaves \0 alone,
    // which yields the two-character string backslash + "0", not NUL.
    "\0"   => self::C_NUL,
    '*'    => self::ASTERISK,
    '!'    => self::EXCLAMATION,
    '&'    => self::AMPERSAND,
    '^'    => self::CARET,
    '$'    => self::DOLLAR,
    '%'    => self::PERCENTAGE,
    '~'    => self::S_TILDE,
    '|'    => self::S_PIPE,
    '_'    => self::S_UNDERSCORE,
    '='    => self::S_EQUAL,
    '+'    => self::S_PLUS,
    '¿'    => self::INVERT_QUESTIONMARK,
    '?'    => self::QUESTIONMARK,
    '#'    => self::NUMBER_SIGN,
    '¡'    => self::INVERT_EXCLAMATION,
];
||
110 | |||
111 | /** |
||
112 | * @var bool |
||
113 | */ |
||
114 | protected $hasInvalidTokens = false; |
||
115 | |||
116 | /** |
||
117 | * @var array |
||
118 | * |
||
119 | * @psalm-var array{value:string, type:null|int, position:int}|array<empty, empty> |
||
120 | */ |
||
121 | protected $previous = []; |
||
122 | |||
123 | /** |
||
124 | * The last matched/seen token. |
||
125 | * |
||
126 | * @var array |
||
127 | * |
||
128 | * @psalm-var array{value:string, type:null|int, position:int} |
||
129 | */ |
||
130 | public $token; |
||
131 | |||
132 | /** |
||
133 | * The next token in the input. |
||
134 | * |
||
135 | * @var array|null |
||
136 | */ |
||
137 | public $lookahead; |
||
138 | |||
139 | /** |
||
140 | * @psalm-var array{value:'', type:null, position:0} |
||
141 | */ |
||
142 | private static $nullToken = [ |
||
143 | 'value' => '', |
||
144 | 'type' => null, |
||
145 | 'position' => 0, |
||
146 | ]; |
||
147 | |||
148 | /** |
||
149 | * @var string |
||
150 | */ |
||
151 | private $accumulator = ''; |
||
152 | |||
153 | /** |
||
154 | * @var bool |
||
155 | */ |
||
156 | private $hasToRecord = false; |
||
157 | |||
158 | public function __construct() |
||
163 | |||
164 | /** |
||
165 | * @return void |
||
166 | */ |
||
167 | public function reset() |
||
173 | |||
174 | /** |
||
175 | * @return bool |
||
176 | */ |
||
177 | public function hasInvalidTokens() |
||
181 | |||
182 | /** |
||
183 | * @param int $type |
||
184 | * @throws \UnexpectedValueException |
||
185 | * @return boolean |
||
186 | * |
||
187 | * @psalm-suppress InvalidScalarArgument |
||
188 | */ |
||
189 | public function find($type) |
||
199 | |||
200 | /** |
||
201 | * getPrevious |
||
202 | * |
||
203 | * @return array |
||
204 | */ |
||
205 | public function getPrevious() |
||
209 | |||
210 | /** |
||
211 | * moveNext |
||
212 | * |
||
213 | * @return boolean |
||
214 | */ |
||
215 | public function moveNext() |
||
231 | |||
232 | /** |
||
233 | * Lexical catchable patterns. |
||
234 | * |
||
235 | * @return string[] |
||
236 | */ |
||
237 | protected function getCatchablePatterns() |
||
249 | |||
250 | /** |
||
251 | * Lexical non-catchable patterns. |
||
252 | * |
||
253 | * @return string[] |
||
254 | */ |
||
255 | protected function getNonCatchablePatterns() |
||
261 | |||
262 | /** |
||
263 | * Retrieve token type. Also processes the token value if necessary. |
||
264 | * |
||
265 | * @param string $value |
||
266 | * @throws \InvalidArgumentException |
||
267 | * @return integer |
||
268 | */ |
||
269 | protected function getType(&$value) |
||
293 | |||
294 | protected function isInvalidChar(string $value) : bool |
||
301 | |||
302 | protected function isValid(string $value) : bool |
||
310 | |||
311 | /** |
||
312 | * @param string $value |
||
313 | * @return bool |
||
314 | */ |
||
315 | protected function isNullType($value) |
||
323 | |||
324 | protected function isUTF8Invalid(string $value) : bool |
||
332 | |||
333 | /** |
||
334 | * @return string |
||
335 | */ |
||
336 | protected function getModifiers() |
||
340 | |||
341 | public function getAccumulatedValues() : string |
||
345 | |||
346 | public function startRecording() : void |
||
350 | |||
351 | public function stopRecording() : void |
||
355 | |||
356 | public function clearRecorded() : void |
||
360 | } |
||
361 |