cerbero90 /
json-parser
| 1 | <?php |
||
| 2 | |||
| 3 | namespace Cerbero\JsonParser\Tokens; |
||
| 4 | |||
| 5 | use Cerbero\JsonParser\Exceptions\SyntaxException; |
||
| 6 | use Cerbero\JsonParser\Sources\Source; |
||
| 7 | use Cerbero\JsonParser\Tokens\Token; |
||
| 8 | use Cerbero\JsonParser\Tokens\Tokenizer; |
||
| 9 | use Cerbero\JsonParser\Tokens\Tokens; |
||
| 10 | use Cerbero\JsonParser\ValueObjects\Progress; |
||
| 11 | use IteratorAggregate; |
||
| 12 | use Traversable; |
||
| 13 | |||
| 14 | use function strlen; |
||
| 15 | |||
/**
 * The JSON lexer.
 *
 * Iterating the lexer reads the source chunk by chunk, walks every chunk one
 * byte at a time and yields the tokens built by the tokenizer, while keeping
 * track of how many bytes have been walked so far.
 *
 * @implements IteratorAggregate<int, Token>
 */
final class Lexer implements IteratorAggregate
{
    /**
     * The parsing progress.
     *
     * @var Progress
     */
    private readonly Progress $progress;

    /**
     * The current position, i.e. the number of bytes walked so far.
     *
     * @var int
     */
    private int $position = 0;

    /**
     * Instantiate the class.
     *
     * @param Source $source the source providing the chunks of JSON to lex
     */
    public function __construct(private readonly Source $source)
    {
        $this->progress = new Progress();
    }

    /**
     * Retrieve the JSON fragments
     *
     * Characters are accumulated in a buffer until a boundary character is met
     * outside of a string: at that point the buffer is turned into a token and,
     * if the boundary is also a delimiter, the delimiter becomes a token too.
     *
     * @return \Generator<int, Token>
     * @throws SyntaxException if a token starts with a character that is not a known token type
     */
    public function getIterator(): Traversable
    {
        $buffer = '';
        $inString = $isEscaping = false;
        $tokenizer = Tokenizer::instance();

        foreach ($this->source as $chunk) {
            // the position advances on every iteration, including the ones ended by `continue`
            for ($i = 0, $size = strlen($chunk); $i < $size; $i++, $this->position++) {
                $character = $chunk[$i];
                // a double quote toggles the string state, while any character
                // following an unescaped backslash is always treated as string content
                $inString = ($character === '"') !== $inString || $isEscaping;
                // a backslash escapes the next character unless it is escaped itself
                $isEscaping = $character === '\\' && !$isEscaping;

                if ($inString || !isset(Tokens::BOUNDARIES[$character])) {
                    // the first character of a token must identify a known token type
                    if ($buffer === '' && !isset(Tokens::TYPES[$character])) {
                        throw new SyntaxException($character);
                    }

                    $buffer .= $character;
                    continue;
                }

                // a boundary outside of a string terminates the token being buffered
                if ($buffer !== '') {
                    yield $tokenizer->toToken($buffer);
                    $buffer = '';
                }

                // boundaries that are not delimiters are skipped without yielding a token
                if (isset(Tokens::DELIMITERS[$character])) {
                    yield $tokenizer->toToken($character);
                }
            }
        }

        // NOTE(review): characters still buffered when the source is exhausted are
        // never turned into a token - confirm that valid sources always end with a
        // boundary character (e.g. a closing bracket) before relying on this.
    }

    /**
     * Retrieve the current position
     *
     * @return int the number of bytes walked so far
     */
    public function position(): int
    {
        return $this->position;
    }

    /**
     * Retrieve the parsing progress
     *
     * The progress is refreshed with the current position and the size of the
     * source every time this method is called.
     *
     * @return Progress
     */
    public function progress(): Progress
    {
        return $this->progress->setCurrent($this->position)->setTotal($this->source->size());
    }
}
||
| 102 |