Source code for pyconversations.tokenizers.base

from abc import abstractmethod


[docs]class BaseTokenizer: """ The abstract Tokenizer class. """ def __init__(self, name): self._name = name def __call__(self, s): return self.tokenize(s)
[docs] @abstractmethod def tokenize(self, s): """ Splits a string into tokens. Parameters ---------- s : str The string to tokenize Returns ------- list(str) A list of tokens Raises ------ NotImplementedError Must be implemented in extensions """ raise NotImplementedError