Dig deeper into the cut-by-token approach.

This commit is contained in:
kenkeiras 2018-04-15 17:47:04 +02:00
parent d601ae3f83
commit 998a183fd2
4 changed files with 86 additions and 16 deletions

View file

@@ -65,6 +65,8 @@ def main():
with session().log(example['text']):
tokens = list(knowledge.tokenize(example['text']))
print(tokens)
print(example['tokens'])
assert example['tokens'] == tokens
else: