Source code for pyconversations.ld.lid

from langid.langid import LanguageIdentifier
from langid.langid import model

from .base import BaseLangDetect


[docs]class LangidLangDetect(BaseLangDetect): """ Language detection using the langid package """ def __init__(self): self._model = LanguageIdentifier.from_modelstring(model, norm_probs=True)
[docs] def get(self, text): """ Uses langid module to detect a language Parameters ---------- text : str The raw text to detect the language of Returns ------- tuple(str, float) The detected language and confidence of detection """ lang, conf = self._model.classify(text) return lang, conf