Passed
Push — master ( aeeab5...454cf7 )
by Kacper
02:57
created

Perl::getOpenClose()   A

Complexity

Conditions 1
Paths 1

Size

Total Lines 10
Code Lines 6

Duplication

Lines 0
Ratio 0 %

Importance

Changes 1
Bugs 0 Features 0
Metric Value
c 1
b 0
f 0
dl 0
loc 10
rs 9.4285
cc 1
eloc 6
nc 1
nop 0
1
<?php
2
/**
3
 * Highlighter
4
 *
5
 * Copyright (C) 2016, Some right reserved.
6
 *
7
 * @author Kacper "Kadet" Donat <[email protected]>
8
 *
9
 * Contact with author:
10
 * Xmpp: [email protected]
11
 * E-mail: [email protected]
12
 *
13
 * From Kadet with love.
14
 */
15
16
namespace Kadet\Highlighter\Language;
17
18
19
use Kadet\Highlighter\Matcher\CommentMatcher;
20
use Kadet\Highlighter\Matcher\RegexMatcher;
21
use Kadet\Highlighter\Matcher\SubStringMatcher;
22
use Kadet\Highlighter\Matcher\WordMatcher;
23
use Kadet\Highlighter\Parser\CloseRule;
24
use Kadet\Highlighter\Parser\OpenRule;
25
use Kadet\Highlighter\Parser\Rule;
26
use Kadet\Highlighter\Parser\Token\ContextualToken;
27
use Kadet\Highlighter\Parser\Token\LanguageToken;
28
use Kadet\Highlighter\Parser\Token\Token;
29
use Kadet\Highlighter\Parser\TokenFactory;
30
31
class Perl extends Language
32
{
33
    /**
34
     * Tokenization rules definition
35
     *
36
     * @return Rule[]|Rule[][]
37
     */
38
    public function getRules()
39
    {
40
        $identifier = '\w+';
41
        $number = '[+-]?(?=\d|\.\d)\d*(\.\d*)?([Ee]([+-]?\d+))?';
42
43
        return [
44
            'comment' => new Rule(new CommentMatcher(['#'], [])),
45
46
            'keyword' => new Rule(new WordMatcher([
47
                'case', 'continue', 'do', 'else', 'elsif', 'for', 'foreach',
48
                'if', 'last', 'my', 'next', 'our', 'redo', 'reset', 'then',
49
                'unless', 'until', 'while', 'use', 'print', 'new', 'BEGIN',
50
                'sub', 'CHECK', 'INIT', 'END', 'return', 'exit'
51
            ])),
52
53
            'string.single' => new Rule(new SubStringMatcher('\''), [
54
                'context' => ['!keyword', '!comment', '!string', '!language', '!number'],
55
                'factory' => new TokenFactory(ContextualToken::class),
56
            ]),
57
58
            'string.double' => new Rule(new SubStringMatcher('"'), [
59
                'context' => ['!keyword', '!comment', '!string', '!language', '!number'],
60
                'factory' => new TokenFactory(ContextualToken::class),
61
            ]),
62
63
            'keyword.escape' => new Rule(new RegexMatcher('/(\\\.)/'), [
64
                'context' => ['string']
65
            ]),
66
67
            'string.nowdoc'  => new Rule(
68
                new RegexMatcher('/<<\s*\'(\w+)\';(?P<string>.*?)\n\1/sm', [
69
                    'string' => Token::NAME,
70
                          0  => 'keyword.nowdoc'
71
                ]), ['context' => ['!comment']]
72
            ),
73
74
            'language.shell' => new Rule(new SubStringMatcher('`'), [
75
                'context' => ['!keyword.escape', '!comment', '!string', '!keyword.nowdoc'],
76
                'factory' => new TokenFactory(ContextualToken::class),
77
            ]),
78
79
            'variable.scalar' => new Rule(new RegexMatcher("/(\\\$$identifier)/")),
80
            'variable.array'  => new Rule(new RegexMatcher("/(\\@$identifier)/")),
81
            'variable.hash'   => new Rule(new RegexMatcher("/(\\%$identifier)/")),
82
83
            'variable.property'   => new Rule(new RegexMatcher("/\\\$$identifier{($identifier)}/")),
84
85
            // Stupidly named var? Perl one, for sure.
86
            'variable.special'   => new Rule(new RegexMatcher('/([$@%][^\s\w]+[\w]*)/')),
87
88
            'operator' => [
89
                new Rule(new RegexMatcher('/(-[rwxoRWXOezsfdlpSbctugkTBMAC])/')),
90
                new Rule(new WordMatcher([
91
                    'not', 'and', 'or', 'xor', 'goto', 'last', 'next', 'redo', 'dump',
92
                    'eq', 'ne', 'cmp', 'not', 'and', 'or', 'xor'
93
                ], ['atomic' => true])),
94
            ],
95
96
            'call' => new Rule(new RegexMatcher('/([a-z]\w+)(?:\s*\(|\s+[$%@"\'`{])/i')),
97
98
            'number' => [
99
                new Rule(new RegexMatcher("/(\\b|\"|')$number\\1/", [
100
                    0 => Token::NAME
101
                ]), ['priority' => 5]),
102
            ],
103
104
            'string.regex' => [
105
                new OpenRule(new RegexMatcher('#~\s*(/).*?/#m')),
106
                new Rule(new RegexMatcher('#\/.*(/[gimuy]{0,5})#m'), [
107
                    'priority' => 1,
108
                    'factory'  => new TokenFactory(ContextualToken::class),
109
                    'context'  => ['!keyword.escape', 'string.regex']
110
                ])
111
            ],
112
113
            'symbol.iterator' => [
114
                new Rule(new RegexMatcher('#(<\w+>)#s'))
115
            ]
116
        ];
117
    }
118
119
    /**
120
     * Unique language identifier, for example 'php'
121
     *
122
     * @return string
123
     */
124
    public function getIdentifier()
125
    {
126
        return 'perl';
127
    }
128
129
    public function getOpenClose()
130
    {
131
        return [
132
            parent::getOpenClose(),
133
            new CloseRule(new SubStringMatcher('__END__'), [
134
                'factory'  => new TokenFactory(LanguageToken::class),
135
                'language' => $this
136
            ])
137
        ];
138
    }
139
}