botok

View on PyPIReverse Dependencies (6)

0.8.12 botok-0.8.12-py3-none-any.whl

Wheel Details

Project: botok
Version: 0.8.12
Filename: botok-0.8.12-py3-none-any.whl
Download: [link]
Size: 79740
MD5: 510f9ceb9728eb8a5b15e6f78ac9a3a3
SHA256: ad7f7d8350f8c0a18430ab0a7465ac0f9e4aa566cb5acc2a0fb738dfa45c48f5
Uploaded: 2023-05-17 11:36:35 +0000

dist-info

METADATA

Metadata-Version: 2.1
Name: botok
Version: 0.8.12
Summary: Tibetan Word Tokenizer
Author: Esukhia development team
Author-Email: esukhiadev[at]gmail.com
Home-Page: https://github.com/Esukhia/botok
Project-Url: Source, https://github.com/Esukhia/botok
Project-Url: Tracker, https://github.com/Esukhia/botok/issues
License: Apache2
Keywords: nlp computational_linguistics tibetan tokenizer token
Classifier: Development Status :: 3 - Alpha
Classifier: Topic :: Text Processing :: Linguistic
Classifier: Programming Language :: Python :: 3
Classifier: Operating System :: OS Independent
Classifier: Intended Audience :: Developers
Classifier: Intended Audience :: Science/Research
Classifier: License :: OSI Approved :: Apache Software License
Classifier: Natural Language :: Tibetan
Requires-Python: >=3.6
Requires-Dist: pyyaml
Requires-Dist: requests
Description-Content-Type: text/markdown
License-File: LICENSE
[Description omitted; length: 7056 characters]

WHEEL

Wheel-Version: 1.0
Generator: bdist_wheel (0.40.0)
Root-Is-Purelib: true
Tag: py3-none-any

RECORD

Path Digest Size
botok/__init__.py sha256=o4NnZkRPBwAZhFHthSeTW9k9LejpoIODPTS099ZU77w 1606
botok/config.py sha256=0c3fwNpMeI9bY1NDJAPvuMXw_PGWO_o_g_NY4if3JJA 4398
botok/vars.py sha256=jTRrybW5cjTFk2nNsSgaxHAlXzSu_4uMNBrl0rX8ncI 1537
botok/chunks/__init__.py sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU 0
botok/chunks/chunkframework.py sha256=tV5E8evT2ou-Xj7VEYFFP0Ey31crZhdJSnL18zHqIco 15219
botok/chunks/chunkframeworkbase.py sha256=6Sn2bA-43nS8Zc1gw7oUQGht-oeW4jL-0knlYxZVZTs 8729
botok/chunks/chunks.py sha256=TY6fC4HGyLpGnw5da3-VWkJqZOD-Cmeq8rRMa04wkKI 4504
botok/modifytokens/__init__.py sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU 0
botok/modifytokens/adjusttokens.py sha256=TY-hQ0Id4ipgSQ4CBaWuHajnXc8LiwWFzw3bq8_WQUI 4785
botok/modifytokens/cqlmatcher.py sha256=Fu1Th7MbzzZ69LS5_pwriMSuywDAus1tauiLyaQqL8c 1048
botok/modifytokens/mergedagdra.py sha256=6uvjRs0XosGOf6XmEUToetNzr8Lr-xwVZ3s_fyN91nY 1842
botok/modifytokens/mergingmatcher.py sha256=wBCY1ms5uWJhL9hW9ikWl_I5hECYvaF1uJEKueMYWNg 1470
botok/modifytokens/replacingmatcher.py sha256=IPr22-RGLx6uClqoxtiByKSuXdJEUvm5zmNIzP7_4Xo 882
botok/modifytokens/splitaffixed.py sha256=P06X_LV2oTJrM2oUgOz0732SM9iLcg-Fxy_ie9SI-6M 1400
botok/modifytokens/splittingmatcher.py sha256=qAf9oekAuGT7exYOb_EIZmdnJ0LQ9LDuHOFpf31cX90 1563
botok/modifytokens/tokenmerge.py sha256=Q4sTu3tRvTwxZD6UKeaDCqzGgEQ8CMCYRIeBmUqmZIw 3189
botok/modifytokens/tokensplit.py sha256=Yo32aWuYLUKybhxOI50IilrkXa8Inj-qrVGpbAcoqsA 4414
botok/resources/README.md sha256=zMtV7hEoOvrxjc-Pedd3aT8As8U8iPngidVbltdewjs 1786
botok/resources/SylComponents.json sha256=RBp_TSYEYXqHkSdws1Ufcj3PO4FEGHqI6kPaR_zWPPc 16855
botok/resources/bo_punct_position.csv sha256=BgJTtPJ4EVKstlEFIAR7f7VEVu_hlx3KhbiavpUtUmk 903
botok/resources/bo_uni_table.csv sha256=EU1kwva92BBHVERFMmDxh8BL7437o5kdwkGtBzJh4-E 16138
botok/resources/particles.tsv sha256=1uJixk-8DWnwqbZsnf5lpDCgslQa-jB3vCQMP2PvACc 1597
botok/text/__init__.py sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU 0
botok/text/format.py sha256=JY6eD6uEKb-PAZCxzBRD96K7CEyK1cAGUYVCwH2MnwY 1094
botok/text/modify.py sha256=9RbvAhBfAnKl-wVSQ7h9vLaUPg3pbtaJTNGc4TbeWlM 2503
botok/text/pipelinebase.py sha256=WwlKff-4Q3Y8f5MiGut8WirHhlHn3HL8PzEkKE6-eeA 3477
botok/text/preprocess.py sha256=d87ocgst2_n2epwEVL3XKJWTFKdFYaGz2YTN1ZPYXWU 301
botok/text/text.py sha256=orlcGLQvEziQX_vmERaRZS4Zq7rtnHBRJ422VWpG4UQ 5473
botok/text/tokenize.py sha256=JfSnA8Cd3ASRikCYFUHtPTGYgzfAFZvnuireKlbsTnU 1288
botok/textunits/__init__.py sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU 0
botok/textunits/bostring.py sha256=pTO8ZuBurS4IqHaItlx-lhXmm9K0xE3pgZzrEJO7rCg 4714
botok/textunits/bosyl.py sha256=ieu4W8-pQXsaNRDetjVMEd4C7MIYtxoueKA4tvr6-DQ 1849
botok/textunits/charcategories.py sha256=Y3wf_aU46TngpFBC7p2XO_Vr3csJX6EYtwmymIe4Das 2420
botok/textunits/sylcomponents.py sha256=fLfwGwXpxU6ZvhuF-rpCYvqUy0uS33ItuI0NIFWl4VM 7883
botok/third_party/__init__.py sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU 0
botok/third_party/cqlparser.py sha256=B26dw2O64j5scY9KKo81ey2pfIUrauUN48ObU9lJg3M 2435
botok/third_party/has_skrt_syl.py sha256=46449u-iQJR-bfyaDeqFqQdT1r7Zvd7xSs9Abkg7nP4 1414
botok/third_party/pynpl/__init__.py sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU 0
botok/third_party/pynpl/cql.py sha256=Nht9uHVp2YjAVh5jxqNiGQ2uFMqRvRixzLrKXslsMt0 8956
botok/third_party/pynpl/fsa.py sha256=4cuU0nKkYu9D7KSNs6vRvX9C73OcW8Z_1G6JEdqFQKI 3796
botok/tokenizers/__init__.py sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU 0
botok/tokenizers/chunktokenizer.py sha256=Mudh-YPeD-AWa0l0w-2V9FYmsEMOwKGQW4tQVWxE1U4 255
botok/tokenizers/paragraphtokenizer.py sha256=117com-xW8dq1jZnSojwGSyizX7tUqUqTR5LuYhRq7U 1081
botok/tokenizers/sentencetokenizer.py sha256=eRP_V4LZgYoyzl6taqPSOlJ4gYicInT6hzj5fhNMinE 8955
botok/tokenizers/stacktokenizer.py sha256=myvOxLQxIWI7nsRN8AvhVDcmTgw4sphZEFSoxkOkAUI 895
botok/tokenizers/token.py sha256=cObVJzCZ0Gc6Pf327lfASyCXJMyb_A91V8l1InoFS9c 4890
botok/tokenizers/tokenize.py sha256=yRPYuqvUGLrcVDwNJjsta2n1Lt86KXyuf36Zl41HLkQ 10554
botok/tokenizers/wordtokenizer.py sha256=oHhOO4IzpBpfKycDC2zuArw5INrcBH3xU3Dp6gNdtAc 5191
botok/tries/__init__.py sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU 0
botok/tries/basictrie.py sha256=bTbs4EZBLazEYnsr_OwQGXqjQiNjba3rm03v2NDYPas 4985
botok/tries/trie.py sha256=GHjbsBnWWkcNIAw4MGKxs-eOJ93kbcOBYTZ5e2G5u68 7499
botok/utils/__init__.py sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU 0
botok/utils/expose_data.py sha256=mTiZ_zNFiS3VmsY6tCZJk3l4ysGoVO-v5QyKAGBquZA 1136
botok/utils/helpers.py sha256=08xKC6fTGCCNdagVdYwxvbY4EdedRG3_OMQqakaMwvs 143
botok/utils/lenient_normalization.py sha256=EqYKdnjGDyjvVqU3ecVULTvs8TRMvuW1XSogFLzjmOM 14375
botok/utils/unicode_normalization.py sha256=7AK2zeQMpRreM1V0KzJjXc5jCcyRkMFVOvb2MeC-934 7457
tests/__init__.py sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU 0
tests/conftest.py sha256=Onv2JkM7apJgBtAiL-Xzs2duYqVCHtcEllUuqAstv10 373
tests/test_bugs.py sha256=H8HGil6WHIfdUPi1aBKkIh9Y2AV0cHTDLTZasARaFlU 7168
tests/test_config.py sha256=1DEC4hCbJrR77UHpTlq7ix3zkXq4JrjIXgmjfvC9NR8 1855
botok-0.8.12.dist-info/LICENSE sha256=xazLvYVG6Uw0rtJK_miaYXYn0Y7tWmxIJ35I21fCOFE 11356
botok-0.8.12.dist-info/METADATA sha256=BCF_O3kGSWEexA9wZ0aHCFJfImHxDzZJbGdXfSJYW3o 9477
botok-0.8.12.dist-info/WHEEL sha256=pkctZYzUS4AYVn6dJ-7367OJZivF2e8RA9b_ZBjif18 92
botok-0.8.12.dist-info/top_level.txt sha256=UWUNLF65dVzc2DHJcZUPcoSG_-Wsc3CFTTo02UYyRrQ 12
botok-0.8.12.dist-info/RECORD

top_level.txt

botok
tests