We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 69f2319 commit 3921e66Copy full SHA for 3921e66
pythainlp/corpus/words_th.txt
@@ -15594,7 +15594,6 @@
15594
ชิงไหวชิงพริบ
15595
ชิงฮื้อ
15596
ชิชะ
15597
-ชิชิ
15598
ชิณณะ
15599
ชิด
15600
ชิดขวา
tests/test_tokenize.py
@@ -208,6 +208,13 @@ def test_word_tokenize_newmm(self):
208
self.assertIsNotNone(
209
word_tokenize(long_danger_text, engine="newmm-safe")
210
)
211
+ text = "ชิชิชิชิชิชิชิชิชิชิชิชิชิชิชิชิชิชิชิชิชิชิชิชิชิชิชิชิชิชิชิชิชิชิชิชิชิชิชิชิชิชิชิชิชิชิชิชิชิชิชิชิชิชิชิชิชิชิชิชิชิ"
212
+ self.assertIsNotNone(
213
+ word_tokenize(text, engine="newmm")
214
+ )
215
216
+ word_tokenize(text, engine="newmm-safe")
217
218
219
def test_word_tokenize_attacut(self):
220
self.assertEqual(attacut.segment(None), [])
0 commit comments