@@ 237-246 (lines=10) @@ | ||
234 | $cc2 = ($c1 & "\x3f") | "\x80"; |
|
235 | $buf .= $cc1 . $cc2; |
|
236 | } |
|
237 | } elseif ($c1 >= "\xe0" & $c1 <= "\xef") { //looks like 3 bytes UTF8 |
|
238 | if ($c2 >= "\x80" && $c2 <= "\xbf" && $c3 >= "\x80" && $c3 <= "\xbf") { //yeah, almost sure it's UTF8 already |
|
239 | $buf .= $c1 . $c2 . $c3; |
|
240 | $i = $i + 2; |
|
241 | } else { //not valid UTF8. Convert it. |
|
242 | $cc1 = (chr(ord($c1) / 64) | "\xc0"); |
|
243 | $cc2 = ($c1 & "\x3f") | "\x80"; |
|
244 | $buf .= $cc1 . $cc2; |
|
245 | } |
|
246 | } elseif ($c1 >= "\xf0" & $c1 <= "\xf7") { //looks like 4 bytes UTF8 |
|
247 | if ($c2 >= "\x80" && $c2 <= "\xbf" && $c3 >= "\x80" && $c3 <= "\xbf" && $c4 >= "\x80" && $c4 <= "\xbf") { //yeah, almost sure it's UTF8 already |
|
248 | $buf .= $c1 . $c2 . $c3; |
|
249 | $i = $i + 2; |
|
@@ 247-254 (lines=8) @@ | ||
244 | $buf .= $cc1 . $cc2; |
|
245 | } |
|
246 | } elseif ($c1 >= "\xf0" & $c1 <= "\xf7") { //looks like 4 bytes UTF8 |
|
247 | if ($c2 >= "\x80" && $c2 <= "\xbf" && $c3 >= "\x80" && $c3 <= "\xbf" && $c4 >= "\x80" && $c4 <= "\xbf") { //yeah, almost sure it's UTF8 already |
|
248 | $buf .= $c1 . $c2 . $c3; |
|
249 | $i = $i + 2; |
|
250 | } else { //not valid UTF8. Convert it. |
|
251 | $cc1 = (chr(ord($c1) / 64) | "\xc0"); |
|
252 | $cc2 = ($c1 & "\x3f") | "\x80"; |
|
253 | $buf .= $cc1 . $cc2; |
|
254 | } |
|
255 | } else { //doesn't look like UTF8, but should be converted |
|
256 | $cc1 = (chr(ord($c1) / 64) | "\xc0"); |
|
257 | $cc2 = (($c1 & "\x3f") | "\x80"); |