|
@@ 675-680 (lines=6) @@
|
| 672 |
|
$utf8 .= $chrs{$c}; |
| 673 |
|
break; |
| 674 |
|
|
| 675 |
|
case ($ord_chrs_c & 0xE0) == 0xC0: |
| 676 |
|
// characters U-00000080 - U-000007FF, mask 110XXXXX |
| 677 |
|
// see http://www.cl.cam.ac.uk/~mgk25/unicode.html#utf-8 |
| 678 |
|
$utf8 .= $this->substr8($chrs, $c, 2); |
| 679 |
|
++$c; |
| 680 |
|
break; |
| 681 |
|
|
| 682 |
|
case ($ord_chrs_c & 0xF0) == 0xE0: |
| 683 |
|
// characters U-00000800 - U-0000FFFF, mask 1110XXXX |
|
@@ 682-687 (lines=6) @@
|
| 679 |
|
++$c; |
| 680 |
|
break; |
| 681 |
|
|
| 682 |
|
case ($ord_chrs_c & 0xF0) == 0xE0: |
| 683 |
|
// characters U-00000800 - U-0000FFFF, mask 1110XXXX |
| 684 |
|
// see http://www.cl.cam.ac.uk/~mgk25/unicode.html#utf-8 |
| 685 |
|
$utf8 .= $this->substr8($chrs, $c, 3); |
| 686 |
|
$c += 2; |
| 687 |
|
break; |
| 688 |
|
|
| 689 |
|
case ($ord_chrs_c & 0xF8) == 0xF0: |
| 690 |
|
// characters U-00010000 - U-001FFFFF, mask 11110XXX |
|
@@ 689-694 (lines=6) @@
|
| 686 |
|
$c += 2; |
| 687 |
|
break; |
| 688 |
|
|
| 689 |
|
case ($ord_chrs_c & 0xF8) == 0xF0: |
| 690 |
|
// characters U-00010000 - U-001FFFFF, mask 11110XXX |
| 691 |
|
// see http://www.cl.cam.ac.uk/~mgk25/unicode.html#utf-8 |
| 692 |
|
$utf8 .= $this->substr8($chrs, $c, 4); |
| 693 |
|
$c += 3; |
| 694 |
|
break; |
| 695 |
|
|
| 696 |
|
case ($ord_chrs_c & 0xFC) == 0xF8: |
| 697 |
|
// characters U-00200000 - U-03FFFFFF, mask 111110XX |
|
@@ 696-701 (lines=6) @@
|
| 693 |
|
$c += 3; |
| 694 |
|
break; |
| 695 |
|
|
| 696 |
|
case ($ord_chrs_c & 0xFC) == 0xF8: |
| 697 |
|
// characters U-00200000 - U-03FFFFFF, mask 111110XX |
| 698 |
|
// see http://www.cl.cam.ac.uk/~mgk25/unicode.html#utf-8 |
| 699 |
|
$utf8 .= $this->substr8($chrs, $c, 5); |
| 700 |
|
$c += 4; |
| 701 |
|
break; |
| 702 |
|
|
| 703 |
|
case ($ord_chrs_c & 0xFE) == 0xFC: |
| 704 |
|
// characters U-04000000 - U-7FFFFFFF, mask 1111110X |
|
@@ 703-708 (lines=6) @@
|
| 700 |
|
$c += 4; |
| 701 |
|
break; |
| 702 |
|
|
| 703 |
|
case ($ord_chrs_c & 0xFE) == 0xFC: |
| 704 |
|
// characters U-04000000 - U-7FFFFFFF, mask 1111110X |
| 705 |
|
// see http://www.cl.cam.ac.uk/~mgk25/unicode.html#utf-8 |
| 706 |
|
$utf8 .= $this->substr8($chrs, $c, 6); |
| 707 |
|
$c += 5; |
| 708 |
|
break; |
| 709 |
|
|
| 710 |
|
} |
| 711 |
|
|