|
6 | 6 |  |
7 | 7 |
|
8 | 8 | PyThaiNLP is a Python library for Thai natural language processing. |
9 | | -It includes word tokenizers, transliterators, soundex converters, part-of-speech taggers, and spell checkers. |
| 9 | +The library provides functions like word tokenization, part-of-speech tagging, |
| 10 | +transliteration, soundex generation, and spell checking. |
10 | 11 |
|
11 | 12 | ## Install |
12 | 13 |
|
|
16 | 17 | pip install pythainlp |
17 | 18 | ``` |
18 | 19 |
|
19 | | -Some functionalities, like word vector, required extra packages. See https://github.com/PyThaiNLP/pythainlp for installation options. |
| 20 | +Some functionalities, like word vector, require extra packages. |
| 21 | +See https://github.com/PyThaiNLP/pythainlp for installation options. |
20 | 22 |
|
21 | | -**Note for Windows**: `marisa-trie` wheels can be obtained from https://www.lfd.uci.edu/~gohlke/pythonlibs/#marisa-trie |
| 23 | +**Note for Windows**: `marisa-trie` wheels can be obtained from |
| 24 | +https://www.lfd.uci.edu/~gohlke/pythonlibs/#marisa-trie |
22 | 25 | Install it with pip, for example: `pip install marisa_trie-xxx.whl` |
23 | 26 | """ |
24 | 27 |
|
|
32 | 35 | ] |
33 | 36 |
|
34 | 37 | extras = { |
35 | | - "artagger": ["artagger"], |
36 | | - "attacut": ["attacut"], |
37 | | - "benchmarks": ["numpy", "pandas"], |
38 | | - "deepcut": ["deepcut", "keras", "tensorflow"], |
39 | | - "icu": ["pyicu"], |
40 | | - "ipa": ["epitran"], |
41 | | - "ml": ["keras", "numpy", "torch"], |
42 | | - "ner": ["sklearn-crfsuite"], |
43 | | - "ssg": ["ssg"], |
44 | | - "thai2fit": ["emoji", "gensim", "numpy"], |
45 | | - "thai2rom": ["torch", "numpy"], |
| 38 | + "artagger": ["artagger>=0.1.0.3"], |
| 39 | + "attacut": ["attacut>=1.0.2"], |
| 40 | + "benchmarks": ["numpy>=1.17.2", "pandas>=0.25.1"], |
| 41 | + "deepcut": ["deepcut>=0.6.1.0", "keras>=2.3.0", "tensorflow>=1.14.0"], |
| 42 | + "icu": ["pyicu>=2.3.1"], |
| 43 | + "ipa": ["epitran>=1.1"], |
| 44 | + "ml": ["keras>=2.3.0", "numpy>=1.17.2", "torch>=1.2.0"], |
| 45 | + "ner": ["sklearn-crfsuite>=0.3.6"], |
| 46 | + "ssg": ["ssg>=0.0.4"], |
| 47 | + "thai2fit": ["emoji>=0.5.4", "gensim>=3.8.0", "numpy>=1.17.2"], |
| 48 | + "thai2rom": ["torch>=1.2.0", "numpy>=1.17.2"], |
46 | 49 | "full": [ |
47 | | - "artagger", |
48 | | - "attacut", |
49 | | - "deepcut", |
50 | | - "epitran", |
51 | | - "gensim", |
52 | | - "keras", |
53 | | - "numpy", |
54 | | - "pyicu", |
55 | | - "sklearn-crfsuite", |
56 | | - "tensorflow", |
57 | | - "torch", |
58 | | - "ssg", |
59 | | - "emoji", |
60 | | - "pandas", |
| 50 | + "artagger>=0.1.0.3", |
| 51 | + "attacut>=1.0.2", |
| 52 | + "deepcut>=0.6.1.0", |
| 53 | + "epitran>=1.1", |
| 54 | + "gensim>=3.8.0", |
| 55 | + "keras>=2.3.0", |
| 56 | + "numpy>=1.17.2", |
| 57 | + "pyicu>=2.3.1", |
| 58 | + "sklearn-crfsuite>=0.3.6", |
| 59 | + "tensorflow>=1.14.0", |
| 60 | + "torch>=1.2.0", |
| 61 | + "ssg>=0.0.4", |
| 62 | + "emoji>=0.5.4", |
| 63 | + "pandas>=0.25.1", |
61 | 64 | ], |
62 | 65 | } |
63 | 66 |
|
|
0 commit comments