Welcome to mirror list, hosted at ThFree Co, Russian Federation.

__init__.py « stemmer « util « sphinx - github.com/sphinx-doc/sphinx.git - Unnamed repository; edit this file 'description' to name the repository.
summaryrefslogtreecommitdiff
blob: d7576a94e4a8664f4c3b327f63a5ddfbd3fd10ea (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
"""Word stemming utilities for Sphinx.

    :copyright: Copyright 2007-2022 by the Sphinx team, see AUTHORS.
    :license: BSD, see LICENSE for details.
"""

from sphinx.util.stemmer.porter import PorterStemmer

# Optional dependency: record in PYSTEMMER whether the ``Stemmer`` module
# could be imported, so the rest of this module can pick a backend.
try:
    from Stemmer import Stemmer as _PyStemmer
except ImportError:
    PYSTEMMER = False
else:
    PYSTEMMER = True


class BaseStemmer:
    """Common interface for the stemmers defined in this module.

    Subclasses are expected to override :meth:`stem`; the implementation
    here only raises :exc:`NotImplementedError`.
    """

    def stem(self, word: str) -> str:
        """Return the stem of *word*.

        :raises NotImplementedError: always, in this base class.
        """
        raise NotImplementedError


class PyStemmer(BaseStemmer):
    """Stemmer that delegates to the optional ``Stemmer`` module.

    Instantiating this class requires that the ``Stemmer`` import at the
    top of this module succeeded (i.e. ``PYSTEMMER`` is true); otherwise
    ``_PyStemmer`` is not defined.
    """

    def __init__(self) -> None:
        # The backend is selected by algorithm name.
        self.stemmer = _PyStemmer('porter')

    def stem(self, word: str) -> str:
        """Return the stem of *word* as computed by the wrapped backend."""
        backend = self.stemmer
        return backend.stemWord(word)


class StandardStemmer(PorterStemmer, BaseStemmer):
    """Adapter giving :class:`PorterStemmer` the one-argument ``stem``
    interface declared by :class:`BaseStemmer`.
    """

    # The signature deliberately differs from the inherited three-argument
    # ``stem``, hence the type-checker suppression below.
    def stem(self, word: str) -> str:  # type: ignore
        """Return the stem of *word*.

        Calls the inherited ``stem`` with ``0`` and ``len(word) - 1`` as the
        two extra arguments (presumably the inclusive start and end indices
        of the span to stem -- confirm against ``PorterStemmer.stem``).
        """
        first, last = 0, len(word) - 1
        return super().stem(word, first, last)


def get_stemmer() -> BaseStemmer:
    """Create a stemmer using the best backend available.

    :returns: a :class:`PyStemmer` when the optional ``Stemmer`` module was
        imported successfully (``PYSTEMMER`` is true), otherwise a
        :class:`StandardStemmer`.
    """
    if not PYSTEMMER:
        return StandardStemmer()
    return PyStemmer()