Conditions | 11 |
Paths | 128 |
Total Lines | 128 |
Code Lines | 67 |
Lines | 0 |
Ratio | 0 % |
Changes | 1 | ||
Bugs | 0 | Features | 0 |
Small methods make your code easier to understand, in particular if combined with a good name. Besides, if your method is small, finding a good name is usually much easier.
For example, if you find yourself adding comments to a method's body, this is usually a good sign to extract the commented part to a new method, and use the comment as a starting point when coming up with a good name for this new method.
Commonly applied refactorings include:
If many parameters/temporary variables are present:
1 | <?php |
||
159 | public static function testSqlAndScriptInject($val, $type) |
||
160 | { |
||
161 | // Decode string first because a lot of things are obfuscated by encoding or multiple encoding. |
||
162 | // So <svg onload='console.log("123")' become <svg onload='console.log("123")' |
||
163 | // So ":'" become ":'" (due to ENT_HTML5) |
||
164 | // So "	
" become "" |
||
165 | // So "()" become "()" |
||
166 | |||
167 | // Loop to decode until no more things to decode. |
||
168 | //print "before decoding $val\n"; |
||
169 | do { |
||
170 | $oldval = $val; |
||
171 | $val = html_entity_decode($val, ENT_QUOTES | ENT_HTML5); // Decode ':', ''', '	', '&NewLine', ... |
||
172 | // Sometimes we have entities without the ; at end so html_entity_decode does not work but entities is still interpreted by browser. |
||
173 | $val = preg_replace_callback( |
||
174 | '/&#(x?[0-9][0-9a-f]+;?)/i', |
||
175 | /** |
||
176 | * @param string[] $m |
||
177 | * @return string |
||
178 | */ |
||
179 | static function ($m) { |
||
180 | // Decode 'n', ... |
||
181 | return Filters::realCharForNumericEntities($m); |
||
182 | }, |
||
183 | $val |
||
184 | ); |
||
185 | |||
186 | // We clean html comments because some hacks try to obfuscate evil strings by inserting HTML comments. Example: on<!-- -->error=alert(1) |
||
187 | $val = preg_replace('/<!--[^>]*-->/', '', $val); |
||
188 | $val = preg_replace('/[\r\n\t]/', '', $val); |
||
189 | } while ($oldval != $val); |
||
190 | //print "type = ".$type." after decoding: ".$val."\n"; |
||
191 | |||
192 | $inj = 0; |
||
193 | |||
194 | // We check string because some hacks try to obfuscate evil strings by inserting non printable chars. Example: 'java(ascci09)scr(ascii00)ipt' is processed like 'javascript' (whatever is place of evil ascii char) |
||
195 | // We should use dol_string_nounprintableascii but function is not yet loaded/available |
||
196 | // Example of valid UTF8 chars: |
||
197 | // utf8=utf8mb3: '\x09', '\x0A', '\x0D', '\x7E' |
||
198 | // utf8=utf8mb3: '\xE0\xA0\x80' |
||
199 | // utf8mb4: '\xF0\x9D\x84\x9E' (but this may be refused by the database insert if pagecode is utf8=utf8mb3) |
||
200 | $newval = preg_replace('/[\x00-\x08\x0B-\x0C\x0E-\x1F\x7F]/u', '', $val); // /u operator makes UTF8 valid characters being ignored so are not included into the replace |
||
201 | |||
202 | // Note that $newval may also be completely empty '' when non valid UTF8 are found. |
||
203 | if ($newval != $val) { |
||
204 | // If $val has changed after removing non valid UTF8 chars, it means we have an evil string. |
||
205 | $inj += 1; |
||
206 | } |
||
207 | //print 'inj='.$inj.'-type='.$type.'-val='.$val.'-newval='.$newval."\n"; |
||
208 | |||
209 | // For SQL Injection (only GET are used to scan for such injection strings) |
||
210 | if ($type == 1 || $type == 3) { |
||
211 | // Note the \s+ is replaced into \s* because some spaces may have been modified in previous loop |
||
212 | $inj += preg_match('/delete\s*from/i', $val); |
||
213 | $inj += preg_match('/create\s*table/i', $val); |
||
214 | $inj += preg_match('/insert\s*into/i', $val); |
||
215 | $inj += preg_match('/select\s*from/i', $val); |
||
216 | $inj += preg_match('/into\s*(outfile|dumpfile)/i', $val); |
||
217 | $inj += preg_match('/user\s*\(/i', $val); // avoid to use function user() or mysql_user() that return current database login |
||
218 | $inj += preg_match('/information_schema/i', $val); // avoid to use request that read information_schema database |
||
219 | $inj += preg_match('/<svg/i', $val); // <svg can be allowed in POST |
||
220 | $inj += preg_match('/update[^&=\w].*set.+=/i', $val); // the [^&=\w] test is to avoid error when request is like action=update&...set... or &updatemodule=...set... |
||
221 | $inj += preg_match('/union.+select/i', $val); |
||
222 | } |
||
223 | if ($type == 3) { |
||
224 | // Note the \s+ is replaced into \s* because some spaces may have been modified in previous loop |
||
225 | $inj += preg_match('/select|update|delete|truncate|replace|group\s*by|concat|count|from|union/i', $val); |
||
226 | } |
||
227 | if ($type != 2) { // Not common key strings, so we can check them both on GET and POST |
||
228 | $inj += preg_match('/updatexml\(/i', $val); |
||
229 | $inj += preg_match('/(\.\.%2f)+/i', $val); |
||
230 | $inj += preg_match('/\s@@/', $val); |
||
231 | } |
||
232 | // For XSS Injection done by closing textarea to execute content into a textarea field |
||
233 | $inj += preg_match('/<\/textarea/i', $val); |
||
234 | // For XSS Injection done by adding javascript with script |
||
235 | // This is all cases a browser consider text is javascript: |
||
236 | // When it found '<script', 'javascript:', '<style', 'onload\s=' on body tag, '="&' on a tag size with old browsers |
||
237 | // All examples on page: http://ha.ckers.org/xss.html#XSScalc |
||
238 | // More on https://www.owasp.org/index.php/XSS_Filter_Evasion_Cheat_Sheet |
||
239 | $inj += preg_match('/<audio/i', $val); |
||
240 | $inj += preg_match('/<embed/i', $val); |
||
241 | $inj += preg_match('/<iframe/i', $val); |
||
242 | $inj += preg_match('/<object/i', $val); |
||
243 | $inj += preg_match('/<script/i', $val); |
||
244 | $inj += preg_match('/Set\.constructor/i', $val); // ECMA script 6 |
||
245 | if (!defined('NOSTYLECHECK')) { |
||
246 | $inj += preg_match('/<style/i', $val); |
||
247 | } |
||
248 | $inj += preg_match('/base\s+href/si', $val); |
||
249 | $inj += preg_match('/=data:/si', $val); |
||
250 | // List of dom events is on https://www.w3schools.com/jsref/dom_obj_event.asp and https://developer.mozilla.org/en-US/docs/Web/Events |
||
251 | $inj += preg_match('/on(mouse|drag|key|load|touch|pointer|select|transition)[a-z]*\s*=/i', $val); // onmousexxx can be set on img or any html tag like <img title='...' onmouseover=alert(1)> |
||
252 | $inj += preg_match('/on(abort|after|animation|auxclick|before|blur|cancel|canplay|canplaythrough|change|click|close|contextmenu|cuechange|copy|cut)[a-z]*\s*=/i', $val); |
||
253 | $inj += preg_match('/on(dblclick|drop|durationchange|emptied|end|ended|error|focus|focusin|focusout|formdata|gotpointercapture|hashchange|input|invalid)[a-z]*\s*=/i', $val); |
||
254 | $inj += preg_match('/on(lostpointercapture|offline|online|pagehide|pageshow)[a-z]*\s*=/i', $val); |
||
255 | $inj += preg_match('/on(paste|pause|play|playing|progress|ratechange|reset|resize|scroll|search|seeked|seeking|show|stalled|start|submit|suspend)[a-z]*\s*=/i', $val); |
||
256 | $inj += preg_match('/on(timeupdate|toggle|unload|volumechange|waiting|wheel)[a-z]*\s*=/i', $val); |
||
257 | // More not into the previous list |
||
258 | |||
259 | $inj += preg_match('/on(repeat|begin|finish|beforeinput)[a-z]*\s*=/i', $val); |
||
260 | |||
261 | // We refuse html into html because some hacks try to obfuscate evil strings by inserting HTML into HTML. Example: <img on<a>error=alert(1) to bypass test on onerror |
||
262 | $tmpval = preg_replace('/<[^<]+>/', '', $val); |
||
263 | // List of dom events is on https://www.w3schools.com/jsref/dom_obj_event.asp and https://developer.mozilla.org/en-US/docs/Web/Events |
||
264 | $inj += preg_match('/on(mouse|drag|key|load|touch|pointer|select|transition)[a-z]*\s*=/i', $tmpval); // onmousexxx can be set on img or any html tag like <img title='...' onmouseover=alert(1)> |
||
265 | $inj += preg_match('/on(abort|after|animation|auxclick|before|blur|cancel|canplay|canplaythrough|change|click|close|contextmenu|cuechange|copy|cut)[a-z]*\s*=/i', $tmpval); |
||
266 | $inj += preg_match('/on(dblclick|drop|durationchange|emptied|end|ended|error|focus|focusin|focusout|formdata|gotpointercapture|hashchange|input|invalid)[a-z]*\s*=/i', $tmpval); |
||
267 | $inj += preg_match('/on(lostpointercapture|offline|online|pagehide|pageshow)[a-z]*\s*=/i', $tmpval); |
||
268 | $inj += preg_match('/on(paste|pause|play|playing|progress|ratechange|reset|resize|scroll|search|seeked|seeking|show|stalled|start|submit|suspend)[a-z]*\s*=/i', $tmpval); |
||
269 | $inj += preg_match('/on(timeupdate|toggle|unload|volumechange|waiting|wheel)[a-z]*\s*=/i', $tmpval); |
||
270 | // More not into the previous list |
||
271 | $inj += preg_match('/on(repeat|begin|finish|beforeinput)[a-z]*\s*=/i', $tmpval); |
||
272 | |||
273 | //$inj += preg_match('/on[A-Z][a-z]+\*=/', $val); // To lock event handlers onAbort(), ... |
||
274 | $inj += preg_match('/:|:|:/i', $val); // refused string ':' encoded (no reason to have it encoded) to lock 'javascript:...' |
||
275 | $inj += preg_match('/j\s*a\s*v\s*a\s*s\s*c\s*r\s*i\s*p\s*t\s*:/i', $val); |
||
276 | $inj += preg_match('/vbscript\s*:/i', $val); |
||
277 | // For XSS Injection done by adding javascript closing html tags like with onmousemove, etc... (closing a src or href tag with not cleaned param) |
||
278 | if ($type == 1 || $type == 3) { |
||
279 | $val = str_replace('enclosure="', 'enclosure=X', $val); // We accept enclosure=" for the export/import module |
||
280 | $inj += preg_match('/"/i', $val); // We refused " in GET parameters value. |
||
281 | } |
||
282 | if ($type == 2) { |
||
283 | $inj += preg_match('/[:;"\'<>\?\(\){}\$%]/', $val); // PHP_SELF is a file system (or url path without parameters). It can contains spaces. |
||
284 | } |
||
285 | |||
286 | return $inj; |
||
287 | } |
||
324 |
In general, usage of exit should be done with care and only when running in a scripting context like a CLI script.