We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent b1c63e1, commit 73519bc. Copy full SHA for 73519bc
bnlp/tokenizer/basic.py
@@ -65,7 +65,6 @@ class BasicTokenizer:
65
def tokenize(self, text):
66
"""Tokenizes a piece of text."""
67
text = convert_to_unicode(text)
68
- # handle (.) in bangla text
69
70
orig_tokens = whitespace_tokenize(text)
71
# print("original tokens: ", orig_tokens)
@@ -75,7 +74,6 @@ def tokenize(self, text):
75
74
76
# print("split tokens: ", split_tokens)
77
output_tokens = whitespace_tokenize(" ".join(split_tokens))
78
- # get (.) back in output tokens
79
return output_tokens
80
81
def _run_strip_accents(self, text):
0 commit comments