1 | <?php |
||
8 | class Tokenizer { |
||
// Private string property of the tokenizer.
// NOTE(review): presumably holds the constructor's $str argument; the constructor body is not visible in this view, so confirm.
9 | private $str; |
||
// Token type identifiers. Each constant's value is a plain string label; in almost
// every case the label is identical to the constant's own name.
// NOTE(review): NAME is the exception to the naming pattern, its value is 'LITERAL'.
10 | const NAME = 'LITERAL'; |
||
11 | const STRING = 'STRING'; |
||
12 | const OPEN_BRACKET = 'OPEN_BRACKET'; |
||
13 | const CLOSE_BRACKET = 'CLOSE_BRACKET'; |
||
// NOTE(review): the value is 'SQUARE_BRACKET' (no 'OPEN_' prefix), unlike OPEN_BRACKET and
// OPEN_BRACE whose values match their names. Left unchanged because code that compares
// against the literal string may exist elsewhere; confirm before normalising.
14 | const OPEN_SQUARE_BRACKET = 'SQUARE_BRACKET'; |
||
15 | const CLOSE_SQUARE_BRACKET = 'CLOSE_SQUARE_BRACKET'; |
||
16 | const CONCAT = 'CONCAT'; |
||
17 | const ARG = 'ARG'; |
||
18 | const WHITESPACE = 'WHITESPACE'; |
||
19 | const NEW_LINE = 'NEW_LINE'; |
||
20 | const DOT = 'DOT'; |
||
21 | const NUMERIC = 'NUMERIC'; |
||
22 | const EQUALS = 'EQUALS'; |
||
23 | const NOT = 'NOT'; |
||
24 | const OPEN_BRACE = 'OPEN_BRACE'; |
||
25 | const CLOSE_BRACE = 'CLOSE_BRACE'; |
||
26 | const BOOL = 'BOOL'; |
||
27 | const COLON = 'COLON'; |
||
28 | const SEMI_COLON = 'SEMI_COLON'; |
||
29 | const NUM_SIGN = 'NUM_SIGN'; |
||
30 | const GREATER_THAN = 'GREATER_THAN'; |
||
31 | const AT_SIGN = 'AT_SIGN'; |
||
32 | const SUBTRACT = 'SUBTRACT'; |
||
33 | const MULTIPLY = 'MULTIPLY'; |
||
34 | const DIVIDE = 'DIVIDE'; |
||
35 | |||
// Lookup table from a single character to the token type constant it maps to.
// NAME, NUMERIC and BOOL have no entry in this table.
// NOTE(review): presumably consulted by identifyChar(); its body is not visible in this view, so confirm.
36 | private $chars = [ |
||
// Both quote characters map to the same STRING type.
37 | '"' => self::STRING, |
||
38 | '\'' => self::STRING, |
||
39 | '(' => self::OPEN_BRACKET, |
||
40 | ')' => self::CLOSE_BRACKET, |
||
41 | '[' => self::OPEN_SQUARE_BRACKET, |
||
42 | ']' => self::CLOSE_SQUARE_BRACKET, |
||
// '+' is classified as CONCAT; there is no separate addition token type.
43 | '+' => self::CONCAT, |
||
// ',' is classified as ARG.
44 | ',' => self::ARG, |
||
45 | '.' => self::DOT, |
||
46 | '!' => self::NOT, |
||
47 | '=' => self::EQUALS, |
||
48 | '{' => self::OPEN_BRACE, |
||
49 | '}' => self::CLOSE_BRACE, |
||
50 | ':' => self::COLON, |
||
51 | ';' => self::SEMI_COLON, |
||
52 | '#' => self::NUM_SIGN, |
||
53 | '>' => self::GREATER_THAN, |
||
54 | '@' => self::AT_SIGN, |
||
55 | '-' => self::SUBTRACT, |
||
56 | '*' => self::MULTIPLY, |
||
57 | '/' => self::DIVIDE, |
||
// Space, carriage return and tab all map to WHITESPACE; only "\n" maps to NEW_LINE.
58 | ' ' => self::WHITESPACE, |
||
59 | "\n" => self::NEW_LINE, |
||
60 | "\r" => self::WHITESPACE, |
||
61 | "\t" => self::WHITESPACE |
||
62 | ]; |
||
63 | |||
64 | public function __construct($str) { |
||
67 | |||
68 | public function getTokens($returnObj = true) { |
||
82 | |||
83 | private function doSimpleTokens(&$tokens, $char) { |
||
90 | |||
91 | private function doLiterals(&$tokens, $char, &$i) { |
||
102 | |||
103 | private function processLiterals(&$tokens, $name) { |
||
109 | |||
110 | private function doBrackets(&$tokens, $char, $i) { |
||
126 | |||
127 | private function doStrings(&$tokens, $char, $i) { |
||
137 | |||
138 | private function extractString($pos) { |
||
145 | |||
146 | private function extractBrackets($open, $startBracket = '(', $closeBracket = ')') { |
||
153 | |||
154 | private function identifyChar($chr) { |
||
158 | |||
159 | private function getChar($num) { |
||
164 | |||
165 | public function serialize($tokens) { |
||
177 | |||
178 | private function serializeValue($token) { |
||
184 | } |
||
185 |