tokenizers

View on PyPI | Reverse Dependencies (356)

0.19.1

tokenizers-0.19.1-cp39-cp39-manylinux_2_17_x86_64.manylinux2014_x86_64.whl
tokenizers-0.19.1-cp39-cp39-manylinux_2_17_armv7l.manylinux2014_armv7l.whl
tokenizers-0.19.1-cp39-cp39-manylinux_2_17_s390x.manylinux2014_s390x.whl
tokenizers-0.19.1-cp39-cp39-manylinux_2_17_ppc64le.manylinux2014_ppc64le.whl
tokenizers-0.19.1-cp39-cp39-manylinux_2_17_aarch64.manylinux2014_aarch64.whl
tokenizers-0.19.1-cp39-cp39-manylinux_2_12_i686.manylinux2010_i686.whl
tokenizers-0.19.1-cp39-none-win_amd64.whl
tokenizers-0.19.1-cp39-none-win32.whl
tokenizers-0.19.1-cp39-cp39-macosx_10_12_x86_64.whl
tokenizers-0.19.1-cp39-cp39-musllinux_1_1_x86_64.whl
tokenizers-0.19.1-cp39-cp39-musllinux_1_1_aarch64.whl
tokenizers-0.19.1-cp39-cp39-macosx_11_0_arm64.whl
tokenizers-0.19.1-cp38-cp38-manylinux_2_17_x86_64.manylinux2014_x86_64.whl
tokenizers-0.19.1-cp38-cp38-manylinux_2_17_armv7l.manylinux2014_armv7l.whl
tokenizers-0.19.1-cp38-cp38-manylinux_2_17_s390x.manylinux2014_s390x.whl
tokenizers-0.19.1-cp38-cp38-manylinux_2_17_ppc64le.manylinux2014_ppc64le.whl
tokenizers-0.19.1-cp38-cp38-manylinux_2_17_aarch64.manylinux2014_aarch64.whl
tokenizers-0.19.1-cp38-cp38-manylinux_2_12_i686.manylinux2010_i686.whl
tokenizers-0.19.1-cp38-none-win_amd64.whl
tokenizers-0.19.1-cp38-none-win32.whl
tokenizers-0.19.1-cp38-cp38-macosx_10_12_x86_64.whl
tokenizers-0.19.1-cp38-cp38-musllinux_1_1_x86_64.whl
tokenizers-0.19.1-cp38-cp38-musllinux_1_1_aarch64.whl
tokenizers-0.19.1-cp38-cp38-macosx_11_0_arm64.whl
tokenizers-0.19.1-cp37-cp37m-manylinux_2_17_x86_64.manylinux2014_x86_64.whl
tokenizers-0.19.1-cp37-cp37m-manylinux_2_17_armv7l.manylinux2014_armv7l.whl
tokenizers-0.19.1-cp37-cp37m-manylinux_2_17_s390x.manylinux2014_s390x.whl
tokenizers-0.19.1-cp37-cp37m-manylinux_2_17_ppc64le.manylinux2014_ppc64le.whl
tokenizers-0.19.1-cp37-cp37m-manylinux_2_17_aarch64.manylinux2014_aarch64.whl
tokenizers-0.19.1-cp37-cp37m-manylinux_2_12_i686.manylinux2010_i686.whl
tokenizers-0.19.1-cp37-none-win_amd64.whl
tokenizers-0.19.1-cp37-none-win32.whl
tokenizers-0.19.1-cp37-cp37m-macosx_10_12_x86_64.whl
tokenizers-0.19.1-cp37-cp37m-musllinux_1_1_x86_64.whl
tokenizers-0.19.1-cp37-cp37m-musllinux_1_1_aarch64.whl
tokenizers-0.19.1-cp37-cp37m-macosx_11_0_arm64.whl
tokenizers-0.19.1-cp312-cp312-manylinux_2_17_x86_64.manylinux2014_x86_64.whl
tokenizers-0.19.1-cp312-cp312-manylinux_2_17_armv7l.manylinux2014_armv7l.whl
tokenizers-0.19.1-cp312-cp312-manylinux_2_17_s390x.manylinux2014_s390x.whl
tokenizers-0.19.1-cp312-cp312-manylinux_2_17_ppc64le.manylinux2014_ppc64le.whl
tokenizers-0.19.1-cp312-cp312-manylinux_2_17_aarch64.manylinux2014_aarch64.whl
tokenizers-0.19.1-cp312-cp312-manylinux_2_12_i686.manylinux2010_i686.whl
tokenizers-0.19.1-cp312-none-win_amd64.whl
tokenizers-0.19.1-cp312-none-win32.whl
tokenizers-0.19.1-cp312-cp312-macosx_10_12_x86_64.whl
tokenizers-0.19.1-cp312-cp312-musllinux_1_1_x86_64.whl
tokenizers-0.19.1-cp312-cp312-musllinux_1_1_aarch64.whl
tokenizers-0.19.1-cp312-cp312-macosx_11_0_arm64.whl
tokenizers-0.19.1-cp311-cp311-manylinux_2_17_x86_64.manylinux2014_x86_64.whl
tokenizers-0.19.1-cp311-cp311-manylinux_2_17_armv7l.manylinux2014_armv7l.whl
tokenizers-0.19.1-cp311-cp311-manylinux_2_17_s390x.manylinux2014_s390x.whl
tokenizers-0.19.1-cp311-cp311-manylinux_2_17_ppc64le.manylinux2014_ppc64le.whl
tokenizers-0.19.1-cp311-cp311-manylinux_2_17_aarch64.manylinux2014_aarch64.whl
tokenizers-0.19.1-cp311-cp311-manylinux_2_12_i686.manylinux2010_i686.whl
tokenizers-0.19.1-cp311-none-win_amd64.whl
tokenizers-0.19.1-cp311-none-win32.whl
tokenizers-0.19.1-cp311-cp311-macosx_10_12_x86_64.whl
tokenizers-0.19.1-cp311-cp311-musllinux_1_1_x86_64.whl
tokenizers-0.19.1-cp311-cp311-musllinux_1_1_aarch64.whl
tokenizers-0.19.1-cp311-cp311-macosx_11_0_arm64.whl
tokenizers-0.19.1-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl
tokenizers-0.19.1-cp310-cp310-manylinux_2_17_armv7l.manylinux2014_armv7l.whl
tokenizers-0.19.1-cp310-cp310-manylinux_2_17_s390x.manylinux2014_s390x.whl
tokenizers-0.19.1-cp310-cp310-manylinux_2_17_ppc64le.manylinux2014_ppc64le.whl
tokenizers-0.19.1-cp310-cp310-manylinux_2_17_aarch64.manylinux2014_aarch64.whl
tokenizers-0.19.1-cp310-cp310-manylinux_2_12_i686.manylinux2010_i686.whl
tokenizers-0.19.1-cp310-none-win_amd64.whl
tokenizers-0.19.1-cp310-none-win32.whl
tokenizers-0.19.1-cp310-cp310-macosx_10_12_x86_64.whl
tokenizers-0.19.1-cp310-cp310-musllinux_1_1_x86_64.whl
tokenizers-0.19.1-cp310-cp310-musllinux_1_1_aarch64.whl
tokenizers-0.19.1-cp310-cp310-macosx_11_0_arm64.whl
tokenizers-0.19.1-pp39-pypy39_pp73-manylinux_2_17_x86_64.manylinux2014_x86_64.whl
tokenizers-0.19.1-pp39-pypy39_pp73-manylinux_2_17_aarch64.manylinux2014_aarch64.whl
tokenizers-0.19.1-pp39-pypy39_pp73-manylinux_2_12_i686.manylinux2010_i686.whl
tokenizers-0.19.1-pp39-pypy39_pp73-macosx_10_12_x86_64.whl
tokenizers-0.19.1-pp39-pypy39_pp73-musllinux_1_1_x86_64.whl
tokenizers-0.19.1-pp39-pypy39_pp73-musllinux_1_1_aarch64.whl
tokenizers-0.19.1-pp39-pypy39_pp73-macosx_11_0_arm64.whl
tokenizers-0.19.1-pp38-pypy38_pp73-manylinux_2_17_x86_64.manylinux2014_x86_64.whl
tokenizers-0.19.1-pp38-pypy38_pp73-manylinux_2_17_aarch64.manylinux2014_aarch64.whl
tokenizers-0.19.1-pp38-pypy38_pp73-manylinux_2_12_i686.manylinux2010_i686.whl
tokenizers-0.19.1-pp38-pypy38_pp73-macosx_10_12_x86_64.whl
tokenizers-0.19.1-pp38-pypy38_pp73-musllinux_1_1_x86_64.whl
tokenizers-0.19.1-pp38-pypy38_pp73-musllinux_1_1_aarch64.whl
tokenizers-0.19.1-pp38-pypy38_pp73-macosx_11_0_arm64.whl
tokenizers-0.19.1-pp37-pypy37_pp73-manylinux_2_17_x86_64.manylinux2014_x86_64.whl
tokenizers-0.19.1-pp37-pypy37_pp73-manylinux_2_17_aarch64.manylinux2014_aarch64.whl
tokenizers-0.19.1-pp37-pypy37_pp73-manylinux_2_12_i686.manylinux2010_i686.whl
tokenizers-0.19.1-pp37-pypy37_pp73-macosx_10_12_x86_64.whl
tokenizers-0.19.1-pp37-pypy37_pp73-musllinux_1_1_x86_64.whl
tokenizers-0.19.1-pp37-pypy37_pp73-musllinux_1_1_aarch64.whl
tokenizers-0.19.1-pp310-pypy310_pp73-manylinux_2_17_x86_64.manylinux2014_x86_64.whl
tokenizers-0.19.1-pp310-pypy310_pp73-manylinux_2_17_aarch64.manylinux2014_aarch64.whl
tokenizers-0.19.1-pp310-pypy310_pp73-manylinux_2_12_i686.manylinux2010_i686.whl
tokenizers-0.19.1-pp310-pypy310_pp73-macosx_10_12_x86_64.whl
tokenizers-0.19.1-pp310-pypy310_pp73-musllinux_1_1_x86_64.whl
tokenizers-0.19.1-pp310-pypy310_pp73-musllinux_1_1_aarch64.whl
tokenizers-0.19.1-pp310-pypy310_pp73-macosx_11_0_arm64.whl

Wheel Details

Project: tokenizers
Version: 0.19.1
Filename: tokenizers-0.19.1-cp39-cp39-manylinux_2_17_x86_64.manylinux2014_x86_64.whl
Download: [link]
Size: 3608229
MD5: c2bc45a39179f702ddae9c0fd06e188e
SHA256: b4c89aa46c269e4e70c4d4f9d6bc644fcc39bb409cb2a81227923404dd6f5227
Uploaded: 2024-04-17 21:39:02 +0000

dist-info

METADATA

Metadata-Version: 2.3
Name: tokenizers
Version: 0.19.1
Author: Anthony MOI <m.anthony.moi@gmail.com>
Author-Email: Nicolas Patry <patry.nicolas[at]protonmail.com>, Anthony Moi <anthony[at]huggingface.co>
Project-Url: Homepage, https://github.com/huggingface/tokenizers
Project-Url: Source, https://github.com/huggingface/tokenizers
Keywords: NLP,tokenizer,BPE,transformer,deep learning
Classifier: Development Status :: 5 - Production/Stable
Classifier: Intended Audience :: Developers
Classifier: Intended Audience :: Education
Classifier: Intended Audience :: Science/Research
Classifier: License :: OSI Approved :: Apache Software License
Classifier: Operating System :: OS Independent
Classifier: Programming Language :: Python :: 3
Classifier: Programming Language :: Python :: 3.7
Classifier: Programming Language :: Python :: 3.8
Classifier: Programming Language :: Python :: 3.9
Classifier: Programming Language :: Python :: 3.10
Classifier: Programming Language :: Python :: 3.11
Classifier: Topic :: Scientific/Engineering :: Artificial Intelligence
Requires-Python: >=3.7
Requires-Dist: huggingface-hub (<1.0,>=0.16.4)
Requires-Dist: pytest; extra == "testing"
Requires-Dist: requests; extra == "testing"
Requires-Dist: numpy; extra == "testing"
Requires-Dist: datasets; extra == "testing"
Requires-Dist: black (==22.3); extra == "testing"
Requires-Dist: ruff; extra == "testing"
Requires-Dist: sphinx; extra == "docs"
Requires-Dist: sphinx-rtd-theme; extra == "docs"
Requires-Dist: setuptools-rust; extra == "docs"
Requires-Dist: tokenizers[testing]; extra == "dev"
Provides-Extra: testing
Provides-Extra: docs
Provides-Extra: dev
Description-Content-Type: text/markdown; charset=UTF-8; variant=GFM
[Description omitted; length: 5006 characters]

WHEEL

Wheel-Version: 1.0
Generator: maturin (1.5.1)
Root-Is-Purelib: false
Tag: cp39-cp39-manylinux_2_17_x86_64.manylinux2014_x86_64

RECORD

Path Digest Size
tokenizers-0.19.1.dist-info/METADATA sha256=rCAgg9DA_ZsETxHzh_dz0hPeRKTvoj9m9kUNZe14vxc 6719
tokenizers-0.19.1.dist-info/WHEEL sha256=ZecsC-02CgJW1eVh0SnzSmfDXdlpfFNFEdQSIIzPs-Q 127
tokenizers/decoders/__init__.py sha256=lGp32h8qerE0F48gyZL8wGmeQVlmjVpeIsRb1SM9kf4 335
tokenizers/decoders/__init__.pyi sha256=xsReo7OFRCiQ4bBZY9ogYb1iLJ5DTgI5elNB-Uggocs 7244
tokenizers/tools/visualizer.py sha256=gi-E2NCP7FuG6ujpQOdalSTXUlaV85V6NI-ZPPTvA_4 14625
tokenizers/tools/__init__.py sha256=xG8caB9OHC8cbB01S5vYV14HZxhO6eWbLehsb70ppio 55
tokenizers/tools/visualizer-styles.css sha256=zAydq1oGWD8QEll4-eyL8Llw0B1sty_hpIE3tYxL02k 4850
tokenizers/pre_tokenizers/__init__.py sha256=wd6KYQA_RsGSQK-HeG9opTRhv4ttSRkyno2dk6az-PM 557
tokenizers/pre_tokenizers/__init__.pyi sha256=IhF7dZt9_9_WM2ESKwEIvN59uW_YzS2PzmWBUScysWU 23258
tokenizers/__init__.py sha256=ZE5ZagUvobBScrHBQdEobhx4wqM0bsq9F9aLYkBNjYQ 2615
tokenizers/__init__.pyi sha256=YBIWZCSN4Rs_-yKdEwhVv77bgHRE36hX9iwFrWGMJ8E 38536
tokenizers/implementations/sentencepiece_bpe.py sha256=LwrofoohnUfME2lK2lQYoyQIhP84RP0CIlHRaj0hyNs 3738
tokenizers/implementations/sentencepiece_unigram.py sha256=SYiVXL8ZtqLXKpuqwnwmrfxgGotu8yAkOu7dLztEXIo 7580
tokenizers/implementations/char_level_bpe.py sha256=Q2ZEAW0xMQHF7YCUtmplwaxbU-J0P2NK4PJGMxUb-_c 5466
tokenizers/implementations/byte_level_bpe.py sha256=OA_jyy3EQmYTa6hnf-EKwLOFuyroqFYOJz25ysM2BUk 4289
tokenizers/implementations/__init__.py sha256=VzAsplaIo7rl4AFO8Miu7ig7MfZjvonwVblZw01zR6M 310
tokenizers/implementations/base_tokenizer.py sha256=2TFZhLupaJiMDYGJuUNmxYJv-cnR8bDHmbMzaYpFROs 14206
tokenizers/implementations/bert_wordpiece.py sha256=sKCum0FKPYdSgJFJN8LDerVBoTDRSqyqSdrcm-lvQqI 5520
tokenizers/normalizers/__init__.py sha256=hKOwnqWM-IlcVv7HDWT9SYhlczevuCNDQJY05ZFxkzk 808
tokenizers/normalizers/__init__.pyi sha256=5SGm-u896MZht6TXMS9sWv1lCATnwNqbC2Udl5aP4dg 19597
tokenizers/models/__init__.py sha256=eJZ4HTAQZpxnKILNylWaTFqxXy-Ba6OKswWN47feeV8 176
tokenizers/models/__init__.pyi sha256=wH4M-ZZprw3UQ98fxWrF3MpivuNVY3s3pv4pGY0A_kE 16932
tokenizers/processors/__init__.py sha256=xM2DEKwKtHIumHsszM8AMkq-AlaqvBZFXWgLU8SNhOY 307
tokenizers/processors/__init__.pyi sha256=hx767ZY8SHhxb_hiXPRxm-f_KcoR4XDx7vfK2c0lR-Q 11357
tokenizers/trainers/__init__.py sha256=UTu22AGcp76IvpW45xLRbJWET04NxPW6NfCb2YYz0EM 248
tokenizers/trainers/__init__.pyi sha256=3TwFKts4me7zQfVRcSTmtXYiP4XwcRjfAYtwqoZVtoQ 5382
tokenizers/tokenizers.cpython-39-x86_64-linux-gnu.so sha256=k1sl24EzellCirjGve8FoHBg4YSl6h_jPJ9CdPYIj2E 11817040
tokenizers-0.19.1.dist-info/RECORD