1
|
|
|
<?php |
2
|
|
|
|
3
|
|
|
namespace Faytekin\LZW; |
4
|
|
|
|
5
|
|
|
/**
 * LZW codec whose compressed form is a comma-separated list of decimal codes.
 *
 * Codes 0-255 stand for the single characters U+0000-U+00FF (UTF-8 encoded);
 * codes from 256 upwards are assigned, in order of first appearance, to the
 * multi-character sequences discovered while scanning the input.
 */
class LZW
{
    /**
     * Number of single-character entries both dictionaries are seeded with.
     */
    private const BASE_DICT_SIZE = 256;

    /**
     * Compress a UTF-8 string into a comma-separated list of LZW codes.
     *
     * The input is processed character by character (not byte by byte). Only
     * characters in the range U+0000-U+00FF can be represented, because the
     * seed dictionary holds exactly those 256 entries.
     *
     * @param string $uncompress UTF-8 text to compress.
     *
     * @return string Comma-separated codes; an empty string for empty input.
     *
     * @throws \InvalidArgumentException If the input is not valid UTF-8 or
     *                                   contains a character above U+00FF.
     */
    public function compress(string $uncompress): string
    {
        if ($uncompress === '') {
            return '';
        }

        // Split once into characters; the /u modifier also rejects invalid UTF-8.
        $chars = preg_split('//u', $uncompress, -1, PREG_SPLIT_NO_EMPTY);
        if ($chars === false) {
            throw new \InvalidArgumentException('Input is not valid UTF-8.');
        }

        $dictionary = [];
        for ($i = 0; $i < self::BASE_DICT_SIZE; $i++) {
            $dictionary[$this->uniChr($i)] = $i;
        }
        $dictSize = self::BASE_DICT_SIZE;

        $w = '';
        $result = [];

        foreach ($chars as $c) {
            // Entries added later are always at least two characters long, so a
            // single character is known only if it belongs to the seed range.
            if (!isset($dictionary[$c])) {
                throw new \InvalidArgumentException(
                    'Input contains a character outside the supported range U+0000-U+00FF.'
                );
            }

            $wc = $w.$c;

            if (isset($dictionary[$wc])) {
                // Keep extending the current match.
                $w = $wc;
                continue;
            }

            // Emit the longest known prefix and register the new sequence.
            $result[] = $dictionary[$w];
            $dictionary[$wc] = $dictSize++;
            $w = $c;
        }

        if ($w !== '') {
            $result[] = $dictionary[$w];
        }

        return implode(',', $result);
    }

    /**
     * Rebuild the original string from a comma-separated list of LZW codes.
     *
     * @param string $compressed Output of compress().
     *
     * @return string|null The decoded text, an empty string for empty input,
     *                     or null when the code stream is malformed (a token
     *                     is not a canonical decimal integer, the first code
     *                     is not a single-character code, or a code refers to
     *                     an entry that cannot exist yet).
     */
    public function decompress(string $compressed): ?string
    {
        // compress('') yields '', so the empty stream decodes to the empty string.
        if ($compressed === '') {
            return '';
        }

        $codes = [];
        foreach (explode(',', $compressed) as $token) {
            $code = (int) $token;
            // Accept only canonical decimal integers ("12", not "012", " 12" or "1.2e1").
            if ((string) $code !== $token) {
                return null;
            }
            $codes[] = $code;
        }

        $dictionary = [];
        for ($i = 0; $i < self::BASE_DICT_SIZE; $i++) {
            $dictionary[$i] = $this->uniChr($i);
        }
        $dictSize = self::BASE_DICT_SIZE;

        // The first code must be a seed entry: nothing else exists yet.
        $first = array_shift($codes);
        if (!isset($dictionary[$first])) {
            return null;
        }

        $w = $dictionary[$first];
        $result = $w;

        foreach ($codes as $k) {
            if (isset($dictionary[$k])) {
                $entry = $dictionary[$k];
            } elseif ($k === $dictSize) {
                // The code refers to the entry about to be created: it is the
                // previous sequence followed by its own first character.
                $entry = $w.mb_substr($w, 0, 1, 'UTF-8');
            } else {
                return null;
            }

            $result .= $entry;
            $dictionary[$dictSize++] = $w.mb_substr($entry, 0, 1, 'UTF-8');
            $w = $entry;
        }

        return $result;
    }

    /**
     * Return the character at a zero-based character (not byte) position.
     *
     * @param string $string UTF-8 text.
     * @param int    $index  Zero-based character offset.
     *
     * @return string|null The character, or null when the index is negative
     *                     or not smaller than the character length.
     */
    public function charAt(string $string, int $index): ?string
    {
        // Length and extraction must use the same encoding to agree on offsets.
        if ($index < 0 || $index >= mb_strlen($string, 'UTF-8')) {
            return null;
        }

        return mb_substr($string, $index, 1, 'UTF-8');
    }

    /**
     * Return the UTF-8 encoding of a Unicode code point.
     *
     * @param int $u Unicode code point.
     *
     * @return string The UTF-8 encoded character.
     *
     * @throws \InvalidArgumentException If mb_chr() rejects the code point.
     */
    public function uniChr(int $u): string
    {
        $char = mb_chr($u, 'UTF-8');

        if ($char === false) {
            throw new \InvalidArgumentException(
                sprintf('%d is not a valid Unicode code point.', $u)
            );
        }

        return $char;
    }
}
86
|
|
|
|