1
|
|
|
<?php |
2
|
|
|
|
3
|
|
|
/** |
4
|
|
|
* @package s9e\TextFormatter |
5
|
|
|
* @copyright Copyright (c) 2010-2017 The s9e Authors |
6
|
|
|
* @license http://www.opensource.org/licenses/mit-license.php The MIT License |
7
|
|
|
*/ |
8
|
|
|
namespace s9e\TextFormatter\Configurator\Helpers; |
9
|
|
|
|
10
|
|
|
use RuntimeException; |
11
|
|
|
use s9e\TextFormatter\Utils\XPath; |
12
|
|
|
|
13
|
|
|
/**
* Static helpers that inspect and rewrite XPath expressions using regular expressions
*/
abstract class XPathHelper
{
    /**
    * Return the list of variables used in a given XPath expression
    *
    * The content of string literals is discarded before scanning, so a dollar sign that
    * only appears between quotes is not reported as a variable.
    *
    * @param  string $expr XPath expression
    * @return array        Alphabetically sorted list of unique variable names
    */
    public static function getVariables($expr)
    {
        // First, remove strings' contents to prevent false-positives
        $expr = preg_replace('/(["\']).*?\\1/s', '$1$1', $expr);

        // Capture every run of word characters that directly follows a dollar sign
        preg_match_all('/\\$(\\w+)/', $expr, $matches);

        // Dedupe the names, then sort them. sort() also reindexes the list from 0
        $varNames = array_unique($matches[1]);
        sort($varNames);

        return $varNames;
    }

    /**
    * Determine whether given XPath expression definitely evaluates to a number
    *
    * Only a chain of operands joined by the operators +, -, * or div is recognized. An
    * operand is a variable, an attribute or a decimal number. At least one operator is
    * required, so a lone operand is not reported as numeric.
    *
    * @param  string $expr XPath expression
    * @return bool         Whether given XPath expression definitely evaluates to a number
    */
    public static function isExpressionNumeric($expr)
    {
        // Remove parentheses that are not part of a function call. PCRE does not support
        // lookbehind assertions of variable length so we have to flip the string. We exclude
        // the XPath operator "div" (flipped into "vid") to avoid false positives
        $flipped = preg_replace('(\\((?!\\s*(?!vid(?!\\w))\\w))', ' ', strrev($expr));
        $expr    = strrev($flipped);

        // Closing parentheses are blanked unconditionally. If one belonged to a function
        // call, the function name left in place prevents the final match
        $expr = str_replace(')', ' ', $expr);

        // Group 1 describes one operand and is reused via (?1) after each operator
        $regexp = '(^\\s*([$@][-\\w]++|-?\\.\\d++|-?\\d++(?:\\.\\d++)?)(?>\\s*(?>[-+*]|div)\\s*(?1))++\\s*$)';

        return (bool) preg_match($regexp, $expr);
    }

    /**
    * Remove extraneous space in a given XPath expression
    *
    * String literals are swapped for placeholders while whitespace is removed, then
    * restored verbatim, so their content is never altered.
    *
    * @param  string $expr Original XPath expression
    * @return string       Minified XPath expression
    *
    * @throws RuntimeException if a quote character remains once literals are removed
    */
    public static function minify($expr)
    {
        $old     = $expr;
        $strings = [];

        // Trim the surrounding whitespace then temporarily remove literal strings
        $expr = preg_replace_callback(
            '/"[^"]*"|\'[^\']*\'/',
            function ($m) use (&$strings, $old)
            {
                // The placeholder is derived from the literal's index, which makes every
                // placeholder distinct, and from the original expression. uniqid() is not
                // guaranteed to return unique values and a duplicate would make one
                // literal silently overwrite another. The shape of the placeholder (40
                // hex digits in parentheses) is relied upon by the replacements below
                $placeholder = '(' . sha1(count($strings) . ':' . $old) . ')';
                $strings[$placeholder] = $m[0];

                return $placeholder;
            },
            trim($expr)
        );

        // Any quote left at this point belongs to an unterminated literal
        if (preg_match('/[\'"]/', $expr))
        {
            throw new RuntimeException("Cannot parse XPath expression '" . $old . "'");
        }

        // Normalize whitespace to a single space
        $expr = preg_replace('/\\s+/', ' ', $expr);

        // Remove the space between a non-word character and a word character. The hyphen
        // counts as a word character here
        $expr = preg_replace('/([-a-z_0-9]) ([^-a-z_0-9])/i', '$1$2', $expr);
        $expr = preg_replace('/([^-a-z_0-9]) ([-a-z_0-9])/i', '$1$2', $expr);

        // Remove the space between two non-word characters as long as they're not two -
        $expr = preg_replace('/(?!- -)([^-a-z_0-9]) ([^-a-z_0-9])/i', '$1$2', $expr);

        // Remove the space between a - and a word character, as long as there's a space before -
        $expr = preg_replace('/ - ([a-z_0-9])/i', ' -$1', $expr);

        // Remove the spaces between a number and the div operator and the next token
        $expr = preg_replace('/((?:^|[ \\(])\\d+) div ?/', '$1div', $expr);

        // Remove the space between the div operator and the next token
        $expr = preg_replace('/([^-a-z_0-9]div) (?=[$0-9@])/', '$1', $expr);

        // Restore the literals
        $expr = strtr($expr, $strings);

        return $expr;
    }
}