from torchnlp.encoders.text.delimiter_encoder import DelimiterEncoder
[docs]class WhitespaceEncoder(DelimiterEncoder):
""" Encodes a text by splitting on whitespace.
Args:
**args: Arguments passed onto ``DelimiterEncoder.__init__``.
**kwargs: Keyword arguments passed onto ``DelimiterEncoder.__init__``.
Example:
>>> encoder = WhitespaceEncoder(["This ain't funny.", "Don't?"])
>>> encoder.encode("This ain't funny.")
tensor([5, 6, 7])
>>> encoder.vocab
['<pad>', '<unk>', '</s>', '<s>', '<copy>', 'This', "ain't", 'funny.', "Don't?"]
>>> encoder.decode(encoder.encode("This ain't funny."))
"This ain't funny."
"""
def __init__(self, *args, **kwargs):
super().__init__(' ', *args, **kwargs)