| [build-system] |
| # PEP 517 build configuration: setuptools is the backend, and both |
| # setuptools and wheel are installed into the isolated build environment. |
| build-backend = "setuptools.build_meta" |
| requires = [ |
| "setuptools>=68.0", |
| "wheel", |
| ] |
|
|
| [project] |
| # Core distribution metadata (PEP 621). |
| name = "xerv-crayon" |
| version = "5.3.6" |
| description = "Omni-Backend Tokenizer - CPU (AVX2/512), CUDA (NVIDIA), ROCm (AMD) with automatic hardware detection" |
| readme = "README.md" |
| # Installers enforce this range. The "Programming Language :: Python :: 3.x" |
| # classifiers below are informational only and must list exactly the minor |
| # versions this range admits (3.8 through 3.12). When the bounds change, |
| # update the classifiers in the same commit. |
| requires-python = ">=3.8,<3.13" |
| license = {file = "LICENSE"} |
| authors = [ |
| {name = "Xerv Research Engineering Division", email = "xerv.org@gmail.com"} |
| ] |
| keywords = [ |
| "tokenizer", |
| "nlp", |
| "simd", |
| "avx2", |
| "avx512", |
| "cuda", |
| "rocm", |
| "hip", |
| "gpu", |
| "high-performance", |
| "zero-copy", |
| "dat", |
| "double-array-trie", |
| "machine-learning", |
| "deep-learning", |
| "transformers", |
| "llm", |
| "nvcuda", |
| "amd", |
| "nvidia", |
| ] |
| classifiers = [ |
| "Development Status :: 5 - Production/Stable", |
| "Intended Audience :: Science/Research", |
| "Intended Audience :: Developers", |
| "Programming Language :: Python :: 3", |
| "Programming Language :: Python :: 3.8", |
| "Programming Language :: Python :: 3.9", |
| "Programming Language :: Python :: 3.10", |
| "Programming Language :: Python :: 3.11", |
| "Programming Language :: Python :: 3.12", |
| "Programming Language :: C", |
| "Programming Language :: C++", |
| "Topic :: Scientific/Engineering :: Artificial Intelligence", |
| "Topic :: Text Processing :: Linguistic", |
| "Operating System :: POSIX :: Linux", |
| "Operating System :: Microsoft :: Windows", |
| "Operating System :: MacOS", |
| "Environment :: GPU :: NVIDIA CUDA", |
| ] |
|
| # No mandatory runtime dependencies are declared. |
| dependencies = [] |
|
|
| |
| [project.optional-dependencies] |
| # Extras are listed alphabetically; requirements inside each extra are sorted. |
| |
| # Third-party tokenizers, model tooling and plotting. |
| benchmark = [ |
| "matplotlib>=3.7.0", |
| "tiktoken>=0.5.0", |
| "transformers>=4.30.0", |
| ] |
| # PyTorch and its companion vision/audio packages. |
| cuda = [ |
| "torch>=2.0.0", |
| "torchaudio>=2.0.0", |
| "torchvision>=0.15.0", |
| ] |
| # Test runner, benchmarking plugin, packaging/upload tools, and PyTorch. |
| dev = [ |
| "build>=1.0.0", |
| "pytest>=7.0.0", |
| "pytest-benchmark>=4.0.0", |
| "torch>=2.0.0", |
| "twine>=4.0.0", |
| ] |
| # HTTP client plus Hugging Face dataset/hub clients. |
| full = [ |
| "datasets>=2.18.0", |
| "huggingface-hub>=0.21.0", |
| "requests>=2.31.0", |
| ] |
|
|
| [project.urls] |
| # Every link points at the same GitHub project. "Bug Tracker" stays quoted |
| # because the label contains a space and cannot be a bare TOML key. |
| Homepage = "https://github.com/Electroiscoding/CRAYON" |
| Documentation = "https://github.com/Electroiscoding/CRAYON#readme" |
| Repository = "https://github.com/Electroiscoding/CRAYON.git" |
| "Bug Tracker" = "https://github.com/Electroiscoding/CRAYON/issues" |
|
|
| [project.scripts] |
| # Console entry point: the `crayon-benchmark` command invokes |
| # `run_benchmark` from the `crayon.cli` module. |
| crayon-benchmark = "crayon.cli:run_benchmark" |
|
|
| [tool.setuptools] |
| # src layout: the root package namespace ("") maps to the src/ directory. |
| package-dir = { "" = "src" } |
|
|
| [tool.setuptools.packages.find] |
| # Package discovery is restricted to the same src/ directory. |
| where = ["src"] |
|
|
| [tool.setuptools.package-data] |
| # Non-Python files bundled with the `crayon` package. Patterns are relative |
| # to the package directory. |
| crayon = [ |
| # Vocabulary files (.dat with a .json of the same name), lite and standard. |
| "resources/dat/vocab_lite.dat", |
| "resources/dat/vocab_lite.json", |
| "resources/dat/vocab_standard.dat", |
| "resources/dat/vocab_standard.json", |
| # Text/CSV resources. |
| "resources/*.txt", |
| "resources/*.csv", |
| # Extension sources: C, C++, CUDA and HIP, plus headers. |
| "c_ext/*.h", |
| "c_ext/*.c", |
| "c_ext/*.cpp", |
| "c_ext/*.cu", |
| "c_ext/*.hip", |
| # Binary extension modules (.pyd / .so) and Python files next to them. |
| "c_ext/*.pyd", |
| "c_ext/*.so", |
| "c_ext/*.py", |
| "c_ext/compiled/*.pyd", |
| "c_ext/compiled/*.so", |
| ] |
|
|
| [tool.pytest.ini_options] |
| # Collect only files matching test_*.py, searching under tests/. |
| python_files = ["test_*.py"] |
| testpaths = ["tests"] |
|
|