Completed
Push — master ( 111737...5430e3 )
by Andreas
09:48
created

WordsWithNCharsCounter::__construct()   A

Complexity

Conditions 1
Paths 1

Size

Total Lines 7
Code Lines 5

Duplication

Lines 0
Ratio 0 %

Importance

Changes 0
Metric Value
dl 0
loc 7
rs 9.4285
c 0
b 0
f 0
cc 1
eloc 5
nc 1
nop 1
1
<?php
2
/**
3
 * Copyright (c) Andreas Heigl<[email protected]>
4
 * Permission is hereby granted, free of charge, to any person obtaining a copy
5
 * of this software and associated documentation files (the "Software"), to deal
6
 * in the Software without restriction, including without limitation the rights
7
 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
8
 * copies of the Software, and to permit persons to whom the Software is
9
 * furnished to do so, subject to the following conditions:
10
 * The above copyright notice and this permission notice shall be included in
11
 * all copies or substantial portions of the Software.
12
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
13
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
14
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
15
 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
16
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
17
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
18
 * THE SOFTWARE.
19
 *
20
 * @author    Andreas Heigl<[email protected]>
21
 * @copyright Andreas Heigl
22
 * @license   http://www.opensource.org/licenses/mit-license.php MIT-License
23
 * @since     12.10.2016
24
 * @link      http://github.com/heiglandreas/org.heigl.TextStatistics
25
 */
26
27
namespace Org_Heigl\TextStatistics\Calculator;
28
29
use Org\Heigl\Hyphenator\Tokenizer\PunctuationTokenizer;
30
use Org\Heigl\Hyphenator\Tokenizer\TokenizerRegistry;
31
use Org\Heigl\Hyphenator\Tokenizer\WhitespaceTokenizer;
32
use Org\Heigl\Hyphenator\Tokenizer\WordToken;
33
use Org_Heigl\TextStatistics\Text;
34
35
/**
 * Counts the words of a text that have at least a given number of characters.
 */
class WordsWithNCharsCounter implements CalculatorInterface
{
    /**
     * Registry of tokenizers used to split the plain text into tokens.
     *
     * @var TokenizerRegistry
     */
    protected $tokenizer;

    /**
     * Minimum number of characters a word must have to be counted.
     *
     * Compared against the result of mb_strlen(), so it is expected to be
     * an integer.
     *
     * @var int
     */
    protected $minChars;

    /**
     * Create a counter for words with at least $minChars characters.
     *
     * Sets up a tokenizer registry containing a punctuation tokenizer
     * followed by a whitespace tokenizer.
     *
     * @param int $minChars Words shorter than this are not counted
     */
    public function __construct($minChars)
    {
        $this->minChars = $minChars;
        $this->tokenizer = new TokenizerRegistry();
        $this->tokenizer->add(new PunctuationTokenizer());
        $this->tokenizer->add(new WhitespaceTokenizer());
    }

    /**
     * Count the word tokens of the text that have at least minChars characters.
     *
     * The plain text is tokenized and every token is inspected once. Tokens
     * that are not word tokens, or whose filtered content is shorter than
     * the configured minimum, are skipped. The token collection itself is
     * never modified while it is being iterated.
     *
     * @param Text $text
     *
     * @return int Number of word tokens with at least minChars characters
     */
    public function calculate(Text $text)
    {
        $tokens = $this->tokenizer->tokenize($text->getPlainText());

        $count = 0;
        foreach ($tokens as $token) {
            // Only word tokens are candidates; skipping here also ensures
            // getFilteredContent() is never called on a non-word token.
            if (! $token instanceof WordToken) {
                continue;
            }

            // mb_strlen() counts characters, not bytes, so multibyte words
            // are measured correctly.
            if (mb_strlen($token->getFilteredContent()) < $this->minChars) {
                continue;
            }

            $count++;
        }

        return $count;
    }
}
71