|
1
|
|
|
<?php |
|
2
|
|
|
|
|
3
|
|
|
/** |
|
4
|
|
|
* @package s9e\TextFormatter |
|
5
|
|
|
* @copyright Copyright (c) 2010-2018 The s9e Authors |
|
6
|
|
|
* @license http://www.opensource.org/licenses/mit-license.php The MIT License |
|
7
|
|
|
*/ |
|
8
|
|
|
namespace s9e\TextFormatter\Configurator\RendererGenerators\PHP; |
|
9
|
|
|
|
|
10
|
|
|
use LogicException; |
|
11
|
|
|
use RuntimeException; |
|
12
|
|
|
|
|
13
|
|
|
class XPathConvertor |
|
14
|
|
|
{ |
|
15
|
|
|
/**
 * @var string PCRE version; set from PCRE_VERSION by the constructor and compared against
 *             8.13 by generateXPathRegexp() to decide which patterns can be used
 */
public $pcreVersion;

/**
 * @var string Regexp used to match XPath expressions; left unset until
 *             generateXPathRegexp() builds it on first use
 */
protected $regexp;

/**
 * @var bool Whether to use the mbstring functions as a replacement for XPath expressions
 *           (read by strlen() and substr())
 */
public $useMultibyteStringFunctions = false;
|
29
|
|
|
|
|
30
|
|
|
/**
 * Constructor
 *
 * Records the PCRE version of the running PHP build so that the regexp generator can
 * adapt its patterns to it
 */
public function __construct()
{
	$this->pcreVersion = \PCRE_VERSION;
}
|
37
|
|
|
|
|
38
|
|
|
/**
 * Convert an XPath expression (used in a condition) into PHP code
 *
 * This method is similar to convertXPath() but it selectively replaces some simple conditions
 * with the corresponding DOM method for performance reasons
 *
 * @param  string $expr XPath expression
 * @return string       PHP code
 */
public function convertCondition($expr)
{
	$expr = trim($expr);

	// XSL: <xsl:if test="@foo">
	// PHP: if ($node->hasAttribute('foo'))
	if (preg_match('#^@([-\\w]+)$#', $expr, $m))
	{
		return '$node->hasAttribute(' . var_export($m[1], true) . ')';
	}

	// XSL: <xsl:if test="@*">
	// PHP: if ($node->attributes->length)
	if ($expr === '@*')
	{
		return '$node->attributes->length';
	}

	// XSL: <xsl:if test="not(@foo)">
	// PHP: if (!$node->hasAttribute('foo'))
	if (preg_match('#^not\\(@([-\\w]+)\\)$#', $expr, $m))
	{
		return '!$node->hasAttribute(' . var_export($m[1], true) . ')';
	}

	// XSL: <xsl:if test="$foo">
	// PHP: if ($this->params['foo']!=='')
	if (preg_match('#^\\$(\\w+)$#', $expr, $m))
	{
		return '$this->params[' . var_export($m[1], true) . "]!==''";
	}

	// XSL: <xsl:if test="not($foo)">
	// PHP: if ($this->params['foo']==='')
	if (preg_match('#^not\\(\\$(\\w+)\\)$#', $expr, $m))
	{
		return '$this->params[' . var_export($m[1], true) . "]===''";
	}

	// XSL: <xsl:if test="@foo > 1">
	// PHP: if ($node->getAttribute('foo') > 1)
	if (preg_match('#^([$@][-\\w]+)\\s*([<>])\\s*(\\d+)$#', $expr, $m))
	{
		// Remove leading zeros: PHP would read "010" as an octal literal and reject "08"
		$number = ltrim($m[3], '0');
		if ($number === '')
		{
			$number = '0';
		}

		return $this->convertXPath($m[1]) . $m[2] . $number;
	}

	// If the condition does not seem to contain a relational expression, or start with a
	// function call, we wrap it inside of a boolean() call
	if (!preg_match('#[=<>]|\\bor\\b|\\band\\b|^[-\\w]+\\s*\\(#', $expr))
	{
		// XSL: <xsl:if test="parent::foo">
		// PHP: if ($this->xpath->evaluate("boolean(parent::foo)",$node))
		$expr = 'boolean(' . $expr . ')';
	}

	// XSL: <xsl:if test="@foo='bar'">
	// PHP: if ($this->xpath->evaluate("@foo='bar'",$node))
	return $this->convertXPath($expr);
}
|
106
|
|
|
|
|
107
|
|
|
/**
 * Convert an XPath expression (used as value) into PHP code
 *
 * The expression is first matched against the generated regexp. The first named capture
 * that is non-empty and shares its name with a method of this class selects the converter;
 * captures named "<method>0", "<method>1", ... are passed to it as arguments. Expressions
 * that are not recognised are evaluated through $this->xpath at runtime.
 *
 * @param  string $expr XPath expression
 * @return string       PHP code
 */
public function convertXPath($expr)
{
	$expr = trim($expr);
	$this->generateXPathRegexp();

	$captures = [];
	if (preg_match($this->regexp, $expr, $captures))
	{
		foreach ($captures as $groupName => $captured)
		{
			$isConverter = !is_numeric($groupName)
			            && $captured !== ''
			            && $captured !== null
			            && method_exists($this, $groupName);
			if (!$isConverter)
			{
				continue;
			}

			// The whole capture is the default argument, numbered captures replace it
			$arguments = [$captured];
			for ($idx = 0; isset($captures[$groupName . $idx]); ++$idx)
			{
				$arguments[$idx] = $captures[$groupName . $idx];
			}

			return call_user_func_array([$this, $groupName], $arguments);
		}
	}

	// Expressions that contain neither a relational/boolean operator nor a leading function
	// call are wrapped in string() so that they evaluate to a string
	$looksTyped = preg_match('#[=<>]|\\bor\\b|\\band\\b|^[-\\w]+\\s*\\(#', $expr);
	if (!$looksTyped)
	{
		$expr = 'string(' . $expr . ')';
	}

	// Parameters found in the expression are handled by exportXPath()
	return '$this->xpath->evaluate(' . $this->exportXPath($expr) . ',$node)';
}
|
159
|
|
|
|
|
160
|
|
|
/**
 * Generate the PHP source that reads an attribute of the current node
 *
 * @param  string $attrName Attribute's name
 * @return string           PHP code
 */
protected function attr($attrName)
{
	return sprintf('$node->getAttribute(%s)', var_export($attrName, true));
}
|
164
|
|
|
|
|
165
|
|
|
/**
 * Generate the PHP source that replaces the "." expression
 *
 * @return string PHP code
 */
protected function dot()
{
	$php = '$node->textContent';

	return $php;
}
|
169
|
|
|
|
|
170
|
|
|
/**
 * Generate the PHP source that reads a parameter from $this->params
 *
 * @param  string $paramName Parameter's name, without the leading $
 * @return string            PHP code
 */
protected function param($paramName)
{
	return sprintf('$this->params[%s]', var_export($paramName, true));
}
|
174
|
|
|
|
|
175
|
|
|
/**
 * Convert a quoted XPath string literal into a PHP string literal
 *
 * @param  string $string Literal, including its first and last character (the quotes)
 * @return string         PHP code
 */
protected function string($string)
{
	// Drop the first and last character, which are the enclosing quotes
	$unquoted = substr($string, 1, -1);

	return var_export($unquoted, true);
}
|
179
|
|
|
|
|
180
|
|
|
/**
 * Generate the PHP source that replaces a local-name() call
 *
 * @return string PHP code
 */
protected function lname()
{
	$php = '$node->localName';

	return $php;
}
|
184
|
|
|
|
|
185
|
|
|
/**
 * Generate the PHP source that replaces a name() call
 *
 * @return string PHP code
 */
protected function name()
{
	$php = '$node->nodeName';

	return $php;
}
|
189
|
|
|
|
|
190
|
|
|
/**
 * Convert an integer literal into a single-quoted PHP string
 *
 * Leading zeros are removed, and zero never carries a sign.
 *
 * @param  string $sign   Either "-" or an empty string
 * @param  string $number Digits
 * @return string         PHP code
 */
protected function number($sign, $number)
{
	$digits = ltrim($number, '0');
	if ($digits === '')
	{
		// Nothing but zeros: output a plain 0 and ignore the sign
		return "'0'";
	}

	return "'" . $sign . $digits . "'";
}
|
203
|
|
|
|
|
204
|
|
|
/**
 * Generate the PHP source that replaces a string-length() call
 *
 * @param  string $expr Argument of the call; an empty string is treated as "."
 * @return string       PHP code
 */
protected function strlen($expr)
{
	$php = $this->convertXPath(($expr === '') ? '.' : $expr);

	if ($this->useMultibyteStringFunctions)
	{
		return 'mb_strlen(' . $php . ",'utf-8')";
	}

	// Without mbstring, every character is replaced with a single byte before counting
	return "strlen(preg_replace('(.)us','.'," . $php . '))';
}
|
217
|
|
|
|
|
218
|
|
|
/**
 * Generate the PHP source that replaces a contains() call
 *
 * @param  string $haystack XPath expression for the string being searched
 * @param  string $needle   XPath expression for the string being looked for
 * @return string           PHP code
 */
protected function contains($haystack, $needle)
{
	$haystackPhp = $this->convertXPath($haystack);
	$needlePhp   = $this->convertXPath($needle);

	return '(strpos(' . $haystackPhp . ',' . $needlePhp . ')!==false)';
}
|
222
|
|
|
|
|
223
|
|
|
/**
 * Generate the PHP source that replaces a starts-with() call
 *
 * @param  string $string    XPath expression for the string being tested
 * @param  string $substring XPath expression for the expected prefix
 * @return string            PHP code
 */
protected function startswith($string, $substring)
{
	$stringPhp = $this->convertXPath($string);
	$prefixPhp = $this->convertXPath($substring);

	return '(strpos(' . $stringPhp . ',' . $prefixPhp . ')===0)';
}
|
227
|
|
|
|
|
228
|
|
|
/**
 * Generate the PHP source that replaces a not() call
 *
 * @param  string $expr XPath expression being negated, converted as a condition
 * @return string       PHP code
 */
protected function not($expr)
{
	$condition = $this->convertCondition($expr);

	return '!(' . $condition . ')';
}
|
232
|
|
|
|
|
233
|
|
|
/**
 * Generate the PHP source that replaces a not(contains()) call
 *
 * @param  string $haystack XPath expression for the string being searched
 * @param  string $needle   XPath expression for the string being looked for
 * @return string           PHP code
 */
protected function notcontains($haystack, $needle)
{
	$haystackPhp = $this->convertXPath($haystack);
	$needlePhp   = $this->convertXPath($needle);

	return '(strpos(' . $haystackPhp . ',' . $needlePhp . ')===false)';
}
|
237
|
|
|
|
|
238
|
|
|
/**
 * Generate the PHP source that replaces a substring() call
 *
 * Without the mbstring functions, the call is left to XPath and evaluated at runtime.
 * Otherwise it is replaced with a mb_substr() call, with literal positions and lengths
 * computed at generation time.
 *
 * @param  string      $exprString XPath expression for the source string
 * @param  string      $exprPos    XPath expression for the 1-based start position
 * @param  string|null $exprLen    XPath expression for the length, if any
 * @return string                  PHP code
 */
protected function substr($exprString, $exprPos, $exprLen = null)
{
	if (!$this->useMultibyteStringFunctions)
	{
		$expr = 'substring(' . $exprString . ',' . $exprPos;
		if (isset($exprLen))
		{
			$expr .= ',' . $exprLen;
		}
		$expr .= ')';

		return '$this->xpath->evaluate(' . $this->exportXPath($expr) . ',$node)';
	}

	// NOTE: negative values for the second argument do not produce the same result as
	//       specified in XPath if the argument is not a literal number
	$php = 'mb_substr(' . $this->convertXPath($exprString) . ',';

	// Hardcode the value if possible
	if (is_numeric($exprPos))
	{
		$php .= max(0, $exprPos - 1);
	}
	else
	{
		$php .= 'max(0,' . $this->convertXPath($exprPos) . '-1)';
	}

	$php .= ',';

	if (!isset($exprLen))
	{
		$php .= 'null';
	}
	elseif (!is_numeric($exprLen))
	{
		$php .= 'max(0,' . $this->convertXPath($exprLen) . ')';
	}
	elseif (is_numeric($exprPos) && $exprPos < 1)
	{
		// Handles substring(0,2) as per XPath
		$php .= max(0, $exprPos + $exprLen - 1);
	}
	else
	{
		// Adding 0 turns the literal into a PHP number, so that a length written with
		// leading zeros such as "08" is not output verbatim as an octal/invalid literal
		$php .= max(0, $exprLen + 0);
	}

	$php .= ",'utf-8')";

	return $php;
}
|
296
|
|
|
|
|
297
|
|
|
/**
 * Generate the PHP source that replaces a substring-after() call
 *
 * @param  string $expr XPath expression for the source string
 * @param  string $str  Quoted string literal to look for
 * @return string       PHP code
 */
protected function substringafter($expr, $str)
{
	// Number of bytes in the literal, not counting its two quotes
	$skip = strlen($str) - 2;

	$sourcePhp = $this->convertXPath($expr);
	$needlePhp = $this->convertXPath($str);

	return 'substr(strstr(' . $sourcePhp . ',' . $needlePhp . '),' . $skip . ')';
}
|
301
|
|
|
|
|
302
|
|
|
/**
 * Generate the PHP source that replaces a substring-before() call
 *
 * @param  string $expr1 XPath expression for the source string
 * @param  string $expr2 XPath expression for the string to look for
 * @return string        PHP code
 */
protected function substringbefore($expr1, $expr2)
{
	$sourcePhp = $this->convertXPath($expr1);
	$needlePhp = $this->convertXPath($expr2);

	return 'strstr(' . $sourcePhp . ',' . $needlePhp . ',true)';
}
|
306
|
|
|
|
|
307
|
|
|
/**
 * Generate the PHP source that replaces a comparison
 *
 * @param  string $expr1    XPath expression for the left operand
 * @param  string $operator XPath operator: =, !=, >, >=, < or <=
 * @param  string $expr2    XPath expression for the right operand
 * @return string           PHP code
 */
protected function cmp($expr1, $operator, $expr2)
{
	$operands  = [];
	$operators = [
		'='  => '===',
		'!=' => '!==',
		'>'  => '>',
		'>=' => '>=',
		'<'  => '<',
		'<=' => '<='
	];

	// If either operand is a number, represent it as a PHP number and replace the identity
	// operators with their loose counterparts
	foreach ([$expr1, $expr2] as $expr)
	{
		if (is_numeric($expr))
		{
			$operators['=']  = '==';
			$operators['!='] = '!=';

			// Remove every redundant leading zero, not just the first one: "0010" must not
			// end up as the octal literal 010 and "008" must not end up as the invalid 08
			$operands[] = preg_replace('(^(-?)0+(?=\\d))', '$1', $expr);
		}
		else
		{
			$operands[] = $this->convertXPath($expr);
		}
	}

	return implode($operators[$operator], $operands);
}
|
338
|
|
|
|
|
339
|
|
|
/**
 * Generate the PHP source that replaces a boolean operation
 *
 * @param  string $expr1    XPath expression for the left operand, converted as a condition
 * @param  string $operator Either "and" or "or"
 * @param  string $expr2    XPath expression for the right operand, converted as a condition
 * @return string           PHP code
 */
protected function bool($expr1, $operator, $expr2)
{
	$phpOperators = ['and' => '&&', 'or' => '||'];

	$left  = $this->convertCondition($expr1);
	$right = $this->convertCondition($expr2);

	return $left . $phpOperators[$operator] . $right;
}
|
348
|
|
|
|
|
349
|
|
|
/**
 * Generate the PHP source that replaces a parenthesized expression
 *
 * @param  string $expr XPath expression found between the parentheses
 * @return string       PHP code
 */
protected function parens($expr)
{
	$inner = $this->convertXPath($expr);

	return '(' . $inner . ')';
}
|
353
|
|
|
|
|
354
|
|
|
/**
 * Generate the PHP source that replaces a translate() call with a strtr() call
 *
 * @param  string $str  XPath expression for the source string
 * @param  string $from Quoted string literal listing the characters to replace
 * @param  string $to   Quoted string literal listing their replacements
 * @return string       PHP code
 */
protected function translate($str, $from, $to)
{
	// Split a quoted literal into a list of UTF-8 characters, without its quotes
	$splitLiteral = function ($literal)
	{
		preg_match_all('(.)su', substr($literal, 1, -1), $chars);

		return $chars[0];
	};
	// Test whether every element of a list is exactly 1 byte long
	$isSingleByteList = function (array $chars)
	{
		return [1] === array_unique(array_map('strlen', $chars));
	};

	$from = $splitLiteral($from);
	$to   = $splitLiteral($to);

	// Only the first occurrence of each source character counts. Replacements with no
	// matching source character are dropped, and source characters with no replacement
	// are mapped to an empty string
	$from = array_unique($from);
	$to   = array_intersect_key($to, $from);
	$to  += array_fill_keys(array_keys(array_diff_key($from, $to)), '');

	$php = 'strtr(' . $this->convertXPath($str) . ',';

	// The scalar version of strtr() can only be used if both lists are made exclusively of
	// 1-byte elements, which excludes non-ASCII characters and empty replacements. In any
	// other case the array version is used
	if ($isSingleByteList($from) && $isSingleByteList($to))
	{
		$php .= var_export(implode('', $from), true) . ',' . var_export(implode('', $to), true);
	}
	else
	{
		$pairs = [];
		foreach ($from as $idx => $char)
		{
			$pairs[] = var_export($char, true) . '=>' . var_export($to[$idx], true);
		}
		$php .= '[' . implode(',', $pairs) . ']';
	}

	return $php . ')';
}
|
391
|
|
|
|
|
392
|
|
|
/**
 * Generate the PHP source that replaces a math operation
 *
 * @param  string $expr1    XPath expression for the left operand
 * @param  string $operator One of +, -, * or div
 * @param  string $expr2    XPath expression for the right operand
 * @return string           PHP code
 */
protected function math($expr1, $operator, $expr2)
{
	$operands = [];
	foreach ([$expr1, $expr2] as $expr)
	{
		if (is_numeric($expr))
		{
			// Literal numbers are output as-is, minus any leading zeros that would make
			// PHP read them as octal ("010") or reject them ("08")
			$operands[] = preg_replace('(^(-?)0+(?=\\d))', '$1', $expr);
		}
		else
		{
			$operands[] = $this->convertXPath($expr);
		}
	}
	list($left, $right) = $operands;

	if ($operator === 'div')
	{
		$operator = '/';
	}

	// Keep a subtraction apart from a negative right operand, otherwise "1 - -2" would be
	// output as "1--2" and "--" would be parsed as a decrement operator
	if ($operator === '-' && strpos($right, '-') === 0)
	{
		$right = ' ' . $right;
	}

	return $left . $operator . $right;
}
|
411
|
|
|
|
|
412
|
|
|
/**
 * Export an XPath expression as PHP with special consideration for XPath variables
 *
 * The expression is split into tokens, each token is converted by the exportXPath*() method
 * that matches its type, and the results are joined with PHP's concatenation operator
 *
 * @param  string $expr XPath expression
 * @return string       PHP representation of the expression
 */
protected function exportXPath($expr)
{
	$pieces = [];
	foreach ($this->tokenizeXPathForExport($expr) as $token)
	{
		// $token[0] is the token's type, $token[1] is its content
		$exporter = 'exportXPath' . ucfirst($token[0]);
		$pieces[] = $this->$exporter($token[1]);
	}

	return implode('.', $pieces);
}
|
432
|
|
|
|
|
433
|
|
|
/**
 * Convert a "current()" XPath expression to its PHP source representation
 *
 * @return string PHP code that calls getNodePath() on the current node
 */
protected function exportXPathCurrent()
{
	$php = '$node->getNodePath()';

	return $php;
}
|
442
|
|
|
|
|
443
|
|
|
/**
 * Convert a fragment of an XPath expression to its PHP source representation
 *
 * @param  string $fragment Literal piece of an XPath expression
 * @return string           The fragment, exported as a PHP string literal
 */
protected function exportXPathFragment($fragment)
{
	$literal = var_export($fragment, true);

	return $literal;
}
|
453
|
|
|
|
|
454
|
|
|
/**
 * Convert an XSLT parameter to its PHP source representation
 *
 * @param  string $param Parameter, including the leading $
 * @return string        PHP code that calls getParamAsXPath() with the parameter's name
 */
protected function exportXPathParam($param)
{
	return sprintf('$this->getParamAsXPath(%s)', var_export(ltrim($param, '$'), true));
}
|
466
|
|
|
|
|
467
|
|
|
/**
 * Generate a regexp used to parse XPath expressions
 *
 * The regexp is built once and stored in $this->regexp. Each supported construct gets a
 * named capture whose name matches the method that converts it, and its arguments are
 * captured as "<name>0", "<name>1", etc... In the patterns below, a space stands for any
 * amount of whitespace.
 *
 * @return void
 */
protected function generateXPathRegexp()
{
	if (isset($this->regexp))
	{
		return;
	}

	$patterns = [
		'attr'      => ['@', '(?<attr0>[-\\w]+)'],
		'dot'       => '\\.',
		'name'      => 'name\\(\\)',
		'lname'     => 'local-name\\(\\)',
		'param'     => ['\\$', '(?<param0>\\w+)'],
		'string'    => '"[^"]*"|\'[^\']*\'',
		'number'    => ['(?<number0>-?)', '(?<number1>\\d++)'],
		'strlen'    => ['string-length', '\\(', '(?<strlen0>(?&value)?)', '\\)'],
		'contains'  => [
			'contains',
			'\\(',
			'(?<contains0>(?&value))',
			',',
			'(?<contains1>(?&value))',
			'\\)'
		],
		'translate' => [
			'translate',
			'\\(',
			'(?<translate0>(?&value))',
			',',
			'(?<translate1>(?&string))',
			',',
			'(?<translate2>(?&string))',
			'\\)'
		],
		'substr' => [
			'substring',
			'\\(',
			'(?<substr0>(?&value))',
			',',
			'(?<substr1>(?&value))',
			'(?:, (?<substr2>(?&value)))?',
			'\\)'
		],
		'substringafter' => [
			'substring-after',
			'\\(',
			'(?<substringafter0>(?&value))',
			',',
			'(?<substringafter1>(?&string))',
			'\\)'
		],
		'substringbefore' => [
			'substring-before',
			'\\(',
			'(?<substringbefore0>(?&value))',
			',',
			'(?<substringbefore1>(?&value))',
			'\\)'
		],
		'startswith' => [
			'starts-with',
			'\\(',
			'(?<startswith0>(?&value))',
			',',
			'(?<startswith1>(?&value))',
			'\\)'
		],
		'math' => [
			// The reference to the "param" group must be spelled (?&param), any other
			// spelling makes the whole regexp fail to compile
			'(?<math0>(?&attr)|(?&number)|(?&param))',
			'(?<math1>[-+*]|div)',
			'(?<math2>(?&math)|(?&math0))'
		],
		'notcontains' => [
			'not',
			'\\(',
			'contains',
			'\\(',
			'(?<notcontains0>(?&value))',
			',',
			'(?<notcontains1>(?&value))',
			'\\)',
			'\\)'
		]
	];

	// The patterns that reference other groups with (?&name) are only used if the PCRE
	// version is at least 8.13
	$isRecentPcre = version_compare($this->pcreVersion, '8.13', '>=');

	$exprs = [];
	if ($isRecentPcre)
	{
		// Create a regexp that matches a comparison such as "@foo = 1"
		// NOTE: cannot support < or > because of NaN -- (@foo<5) returns false if @foo=''
		$exprs[] = '(?<cmp>(?<cmp0>(?&value)) (?<cmp1>!?=) (?<cmp2>(?&value)))';

		// Create a regexp that matches a parenthesized expression
		// NOTE: could be expanded to support any expression
		$exprs[] = '(?<parens>\\( (?<parens0>(?&bool)|(?&cmp)|(?&math)) \\))';

		// Create a regexp that matches boolean operations
		$exprs[] = '(?<bool>(?<bool0>(?&cmp)|(?&not)|(?&value)|(?&parens)) (?<bool1>and|or) (?<bool2>(?&bool)|(?&cmp)|(?&not)|(?&value)|(?&parens)))';

		// Create a regexp that matches not() expressions
		$exprs[] = '(?<not>not \\( (?<not0>(?&bool)|(?&value)) \\))';

		// Modify the math pattern to accept parenthesized expressions. Only the first
		// operand needs to be modified: the operator's pattern has no alternation to
		// extend and the second operand already accepts anything (?&math0) accepts
		$patterns['math'][0] = str_replace('))', ')|(?&parens))', $patterns['math'][0]);
	}

	// Create a regexp that matches values, such as "@foo" or "42"
	$valueExprs = [];
	foreach ($patterns as $name => $pattern)
	{
		if (is_array($pattern))
		{
			$pattern = implode(' ', $pattern);
		}

		if ($isRecentPcre || strpos($pattern, '?&') === false)
		{
			$valueExprs[] = '(?<' . $name . '>' . $pattern . ')';
		}
	}
	array_unshift($exprs, '(?<value>' . implode('|', $valueExprs) . ')');

	// Assemble the final regexp
	$regexp = '#^(?:' . implode('|', $exprs) . ')$#S';

	// Replace spaces with any amount of whitespace
	$this->regexp = str_replace(' ', '\\s*', $regexp);
}
|
603
|
|
|
|
|
604
|
|
|
/**
 * Match the relevant components of an XPath expression
 *
 * The expression is split into current() calls, parameters and fragments. A fragment is
 * either a quoted string or any single character, and consecutive fragments are merged
 * into one.
 *
 * @param  string $expr XPath expression
 * @return array        List of matches as returned by preg_match_all() in set order
 */
protected function matchXPathForExport($expr)
{
	$regexp = '('
	        . '(?<current>\\bcurrent\\(\\))'
	        . '|'
	        . '(?<param>\\$\\w+)'
	        . '|'
	        . '(?<fragment>"[^"]*"|\'[^\']*\'|.)'
	        . ')s';
	preg_match_all($regexp, $expr, $matches, PREG_SET_ORDER);

	// Walk the list backwards and fold each fragment into the fragment that precedes it
	for ($pos = count($matches) - 1; $pos > 0; --$pos)
	{
		$prev = $pos - 1;
		if (!isset($matches[$pos]['fragment'], $matches[$prev]['fragment']))
		{
			continue;
		}

		$matches[$prev]['fragment'] .= $matches[$pos]['fragment'];
		unset($matches[$pos]);
	}

	return array_values($matches);
}
|
632
|
|
|
|
|
633
|
|
|
/**
 * Tokenize an XPath expression for use in PHP
 *
 * @param  string $expr XPath expression
 * @return array        List of [type, content] pairs where the type is the name of the
 *                      last named capture of each match
 */
protected function tokenizeXPathForExport($expr)
{
	$tokens = [];
	foreach ($this->matchXPathForExport($expr) as $match)
	{
		// Look for the last key that is a capture's name rather than a capture's number
		$keys = array_keys($match);
		for ($pos = count($keys) - 1; $pos >= 0; --$pos)
		{
			$key = $keys[$pos];
			if (is_numeric($key))
			{
				continue;
			}

			$tokens[] = [$key, $match[$key]];
			break;
		}
	}

	return $tokens;
}
|
657
|
|
|
} |