Total Complexity | 2 |
Total Lines | 17 |
Duplicated Lines | 0 % |
Changes | 0 |
1 | """Simplemma analyzer for Annif, based on simplemma lemmatizer.""" |
||
2 | |||
3 | import simplemma |
||
4 | from . import analyzer |
||
5 | |||
6 | |||
class SimplemmaAnalyzer(analyzer.Analyzer):
    """Analyzer that delegates word normalization to simplemma."""

    name = "simplemma"

    def __init__(self, param, **kwargs):
        """Store the analyzer parameter and load the simplemma data for it.

        Args:
            param: Value kept as ``self.lang`` and handed to
                ``simplemma.load_data`` (presumably a language code --
                confirm against the callers that construct analyzers).
            **kwargs: Forwarded unchanged to the base ``Analyzer``
                initializer.
        """
        self.lang = param
        # Load the data once here so that every _normalize_word call can
        # reuse it instead of loading it again.
        language_data = simplemma.load_data(self.lang)
        self.langdata = language_data
        # The base initializer runs last, after both attributes are set.
        super().__init__(**kwargs)

    def _normalize_word(self, word):
        """Return the result of simplemma's lemmatization of ``word``.

        The data loaded in ``__init__`` (``self.langdata``) is passed along
        with the word to ``simplemma.lemmatize``.
        """
        lemma = simplemma.lemmatize(word, self.langdata)
        return lemma
||
17 |