1 | <?php |
||
2 | |||
3 | /** |
||
4 | * It's free open-source software released under the MIT License. |
||
5 | * |
||
6 | * @author Anatoly Nekhay <[email protected]> |
||
7 | * @copyright Copyright (c) 2018, Anatoly Nekhay |
||
8 | * @license https://github.com/sunrise-php/http-router/blob/master/LICENSE |
||
9 | * @link https://github.com/sunrise-php/http-router |
||
10 | */ |
||
11 | |||
12 | declare(strict_types=1); |
||
13 | |||
14 | namespace Sunrise\Http\Router\Helper; |
||
15 | |||
16 | use function trim; |
||
17 | |||
/**
 * Stateless helper that splits an HTTP header field value into its
 * comma-separated items and their semicolon-separated parameters.
 *
 * @since 3.0.0
 */
final class HeaderParser
{
    /** Parser state: collecting the item identifier (the text before the first ";"). */
    private const IN_IDENTIFIER = 1;

    /** Parser state: collecting a parameter name (the text between ";" and "="). */
    private const IN_PARAMETER_NAME = 2;

    /** Parser state: collecting a parameter value (the text after "="). */
    private const IN_PARAMETER_VALUE = 4;

    /** Flag combined with IN_PARAMETER_VALUE while inside a double-quoted string. */
    private const IN_QUOTED_STRING = 8;

    /** Flag raised for the single byte that follows a backslash inside a quoted string. */
    private const IN_QUOTED_PAIR = 16;

    /** Upper bound on the number of leading bytes of the header that are examined. */
    private const MAX_FIELD_VALUE_LENGTH = 512;

    /**
     * Lookup table of the bytes accepted in a field value: HTAB, SP,
     * the visible range 0x21-0x7E and the 0x80-0xFF range.
     *
     * @link https://datatracker.ietf.org/doc/html/rfc7230#section-3.2.6
     */
    private const RFC7230_FIELD_VALUE_CHARSET = [
        "\x09" => 1, "\x20" => 1, "\x21" => 1, "\x22" => 1, "\x23" => 1, "\x24" => 1, "\x25" => 1, "\x26" => 1,
        "\x27" => 1, "\x28" => 1, "\x29" => 1, "\x2a" => 1, "\x2b" => 1, "\x2c" => 1, "\x2d" => 1, "\x2e" => 1,
        "\x2f" => 1, "\x30" => 1, "\x31" => 1, "\x32" => 1, "\x33" => 1, "\x34" => 1, "\x35" => 1, "\x36" => 1,
        "\x37" => 1, "\x38" => 1, "\x39" => 1, "\x3a" => 1, "\x3b" => 1, "\x3c" => 1, "\x3d" => 1, "\x3e" => 1,
        "\x3f" => 1, "\x40" => 1, "\x41" => 1, "\x42" => 1, "\x43" => 1, "\x44" => 1, "\x45" => 1, "\x46" => 1,
        "\x47" => 1, "\x48" => 1, "\x49" => 1, "\x4a" => 1, "\x4b" => 1, "\x4c" => 1, "\x4d" => 1, "\x4e" => 1,
        "\x4f" => 1, "\x50" => 1, "\x51" => 1, "\x52" => 1, "\x53" => 1, "\x54" => 1, "\x55" => 1, "\x56" => 1,
        "\x57" => 1, "\x58" => 1, "\x59" => 1, "\x5a" => 1, "\x5b" => 1, "\x5c" => 1, "\x5d" => 1, "\x5e" => 1,
        "\x5f" => 1, "\x60" => 1, "\x61" => 1, "\x62" => 1, "\x63" => 1, "\x64" => 1, "\x65" => 1, "\x66" => 1,
        "\x67" => 1, "\x68" => 1, "\x69" => 1, "\x6a" => 1, "\x6b" => 1, "\x6c" => 1, "\x6d" => 1, "\x6e" => 1,
        "\x6f" => 1, "\x70" => 1, "\x71" => 1, "\x72" => 1, "\x73" => 1, "\x74" => 1, "\x75" => 1, "\x76" => 1,
        "\x77" => 1, "\x78" => 1, "\x79" => 1, "\x7a" => 1, "\x7b" => 1, "\x7c" => 1, "\x7d" => 1, "\x7e" => 1,
        "\x80" => 1, "\x81" => 1, "\x82" => 1, "\x83" => 1, "\x84" => 1, "\x85" => 1, "\x86" => 1, "\x87" => 1,
        "\x88" => 1, "\x89" => 1, "\x8a" => 1, "\x8b" => 1, "\x8c" => 1, "\x8d" => 1, "\x8e" => 1, "\x8f" => 1,
        "\x90" => 1, "\x91" => 1, "\x92" => 1, "\x93" => 1, "\x94" => 1, "\x95" => 1, "\x96" => 1, "\x97" => 1,
        "\x98" => 1, "\x99" => 1, "\x9a" => 1, "\x9b" => 1, "\x9c" => 1, "\x9d" => 1, "\x9e" => 1, "\x9f" => 1,
        "\xa0" => 1, "\xa1" => 1, "\xa2" => 1, "\xa3" => 1, "\xa4" => 1, "\xa5" => 1, "\xa6" => 1, "\xa7" => 1,
        "\xa8" => 1, "\xa9" => 1, "\xaa" => 1, "\xab" => 1, "\xac" => 1, "\xad" => 1, "\xae" => 1, "\xaf" => 1,
        "\xb0" => 1, "\xb1" => 1, "\xb2" => 1, "\xb3" => 1, "\xb4" => 1, "\xb5" => 1, "\xb6" => 1, "\xb7" => 1,
        "\xb8" => 1, "\xb9" => 1, "\xba" => 1, "\xbb" => 1, "\xbc" => 1, "\xbd" => 1, "\xbe" => 1, "\xbf" => 1,
        "\xc0" => 1, "\xc1" => 1, "\xc2" => 1, "\xc3" => 1, "\xc4" => 1, "\xc5" => 1, "\xc6" => 1, "\xc7" => 1,
        "\xc8" => 1, "\xc9" => 1, "\xca" => 1, "\xcb" => 1, "\xcc" => 1, "\xcd" => 1, "\xce" => 1, "\xcf" => 1,
        "\xd0" => 1, "\xd1" => 1, "\xd2" => 1, "\xd3" => 1, "\xd4" => 1, "\xd5" => 1, "\xd6" => 1, "\xd7" => 1,
        "\xd8" => 1, "\xd9" => 1, "\xda" => 1, "\xdb" => 1, "\xdc" => 1, "\xdd" => 1, "\xde" => 1, "\xdf" => 1,
        "\xe0" => 1, "\xe1" => 1, "\xe2" => 1, "\xe3" => 1, "\xe4" => 1, "\xe5" => 1, "\xe6" => 1, "\xe7" => 1,
        "\xe8" => 1, "\xe9" => 1, "\xea" => 1, "\xeb" => 1, "\xec" => 1, "\xed" => 1, "\xee" => 1, "\xef" => 1,
        "\xf0" => 1, "\xf1" => 1, "\xf2" => 1, "\xf3" => 1, "\xf4" => 1, "\xf5" => 1, "\xf6" => 1, "\xf7" => 1,
        "\xf8" => 1, "\xf9" => 1, "\xfa" => 1, "\xfb" => 1, "\xfc" => 1, "\xfd" => 1, "\xfe" => 1, "\xff" => 1,
    ];

    /**
     * Parses a header field value into a list of items with their parameters.
     *
     * Items are separated by "," and parameters by ";", except inside a
     * double-quoted parameter value. Inside quotes a backslash makes the next
     * accepted byte literal. Bytes missing from the charset table are dropped,
     * and scanning stops after MAX_FIELD_VALUE_LENGTH bytes. Identifiers,
     * parameter names and parameter values are trimmed; items with an empty
     * identifier and parameters with an empty name are omitted. Result keys
     * are the comma-separated positions of the items, so they may have gaps.
     *
     * @param string $header The raw header field value.
     *
     * @return array<int<0, max>, array{0: string, 1: array<string, string>}>
     */
    public static function parseHeader(string $header): array
    {
        if ($header === '') {
            return [];
        }

        $state = self::IN_IDENTIFIER;
        $entryIndex = 0;
        $paramIndex = -1;

        /** @var array<int<0, max>, array{0?: string, 1?: array<int<0, max>, array{0?: string, 1?: string}>}> $entries */
        $entries = [];

        for ($offset = 0; $offset < self::MAX_FIELD_VALUE_LENGTH && isset($header[$offset]); ++$offset) {
            $byte = $header[$offset];

            // Bytes outside the permitted charset are silently dropped.
            if (!isset(self::RFC7230_FIELD_VALUE_CHARSET[$byte])) {
                continue;
            }

            $insideQuotes = ($state & self::IN_QUOTED_STRING) !== 0;
            $escaped = ($state & self::IN_QUOTED_PAIR) !== 0;

            if ($byte === ',' && !$insideQuotes) {
                // Unquoted comma: move on to the next item.
                $state = self::IN_IDENTIFIER;
                ++$entryIndex;
                $paramIndex = -1;
            } elseif ($byte === ';' && !$insideQuotes) {
                // Unquoted semicolon: begin a new parameter of the current item.
                $state = self::IN_PARAMETER_NAME;
                ++$paramIndex;
            } elseif ($byte === '=' && ($state & self::IN_PARAMETER_NAME) !== 0) {
                // The first "=" after a parameter name starts its value.
                $state = self::IN_PARAMETER_VALUE;
            } elseif ($byte === '"' && ($state & self::IN_PARAMETER_VALUE) !== 0 && !$escaped) {
                // An unescaped double quote opens or closes a quoted string.
                $state ^= self::IN_QUOTED_STRING;
            } elseif ($byte === '\\' && $insideQuotes && !$escaped) {
                // A backslash inside quotes escapes the following byte.
                $state |= self::IN_QUOTED_PAIR;
            } elseif (($state & self::IN_IDENTIFIER) !== 0) {
                $entries[$entryIndex][0] = ($entries[$entryIndex][0] ?? '') . $byte;
            } elseif (($state & self::IN_PARAMETER_NAME) !== 0) {
                $entries[$entryIndex][1][$paramIndex][0] = ($entries[$entryIndex][1][$paramIndex][0] ?? '') . $byte;
            } elseif (($state & self::IN_PARAMETER_VALUE) !== 0) {
                $entries[$entryIndex][1][$paramIndex][1] = ($entries[$entryIndex][1][$paramIndex][1] ?? '') . $byte;
                // The escaped byte has been consumed, so the escape flag is lowered.
                $state &= ~self::IN_QUOTED_PAIR;
            }
        }

        $result = [];

        foreach ($entries as $position => $entry) {
            $identifier = trim($entry[0] ?? '');
            if ($identifier === '') {
                continue;
            }

            $parameters = [];
            foreach ($entry[1] ?? [] as $pair) {
                $name = trim($pair[0] ?? '');
                if ($name !== '') {
                    // A repeated parameter name overwrites the earlier value.
                    $parameters[$name] = trim($pair[1] ?? '');
                }
            }

            $result[$position] = [$identifier, $parameters];
        }

        return $result;
    }
}
||
153 |