1 | <?php |
||
14 | class DocumentTokenizer |
||
15 | { |
||
16 | /** |
||
17 | * @var Document |
||
18 | */ |
||
19 | protected $document; |
||
20 | |||
21 | /** |
||
22 | * @var array |
||
23 | */ |
||
24 | protected $tokenVector = array(); |
||
25 | protected $storage; |
||
26 | |||
27 | /** |
||
28 | * Tokenizer constructor. |
||
29 | * |
||
30 | * @param \library\storage\Document $document |
||
31 | * @param JsonStorage $storage |
||
32 | */ |
||
33 | public function __construct(Document $document, JsonStorage $storage) |
||
39 | |||
40 | /** |
||
41 | * Execute tokenization of all document fields |
||
42 | */ |
||
43 | private function tokenize() |
||
52 | |||
53 | private function tokenizeTitle() |
||
59 | |||
60 | private function tokenizeFields() |
||
69 | |||
70 | private function tokenizeField($field, $fieldName, $fieldType) |
||
81 | |||
82 | private function tokenizeBricks() |
||
89 | |||
90 | private function tokenizeBrick($brick, $brickSlug) |
||
99 | |||
100 | private function tokenizeDynamicBricks() |
||
107 | |||
108 | public function getTokens() |
||
112 | |||
113 | /** |
||
114 | * Add a token to the existing tokenvector |
||
115 | * @param $token |
||
116 | * @param string $field |
||
117 | * @param int $count |
||
118 | */ |
||
119 | private function addTokenToVector($token, $field, $count = 1) |
||
129 | |||
130 | /** |
||
131 | * Add a complete token vector to the existing one. |
||
132 | * @param $tokenVector |
||
133 | * @param $field |
||
134 | */ |
||
135 | private function addTokenVectorToVector($tokenVector, $field) |
||
141 | |||
142 | /** |
||
143 | * Get the type for a field |
||
144 | * @param $fieldName |
||
145 | * @param $documentDefinition |
||
146 | * @return mixed |
||
147 | * @throws \Exception |
||
148 | */ |
||
149 | private function getFieldType($fieldName, $documentDefinition) |
||
159 | } |