| 1 | <?php |
||
| 9 | class NGramTokenizer extends WordTokenizer |
||
| 10 | { |
||
| 11 | /** |
||
| 12 | * @var int presumably the smallest n-gram length to emit; the constructor's $minGram parameter defaults to 1 (the assignment is not visible here - confirm) |
||
| 13 | */ |
||
| 14 | private $minGram; |
||
| 15 | |||
| 16 | /** |
||
| 17 | * @var int presumably the largest n-gram length to emit; the constructor's $maxGram parameter defaults to 2 (the assignment is not visible here - confirm) |
||
| 18 | */ |
||
| 19 | private $maxGram; |
||
| 20 | |||
| 21 | public function __construct(int $minGram = 1, int $maxGram = 2) |
||
| 30 | |||
| 31 | /** |
||
| 32 | * {@inheritdoc} |
||
| 33 | */ |
||
| 34 | public function tokenize(string $text): array |
||
| 46 | |||
| 47 | private function generateNGrams(string $word, array &$nGrams): void |
||
| 59 | } |
||
| 60 |