Source code for pyconversations.tokenizers.default

from .base import BaseTokenizer


[docs]class DefaultTokenizer(BaseTokenizer): """ A tokenizer that just uses Python's basic str.split function. """ def __init__(self): super(DefaultTokenizer, self).__init__('Default')
[docs] def tokenize(self, s): """ Splits a string into tokens. Parameters ---------- s : str The string to tokenize Returns ------- list(str) A list of tokens """ return s.split()