# EZ-Tokenizer / pyproject.toml
# Hosting-page residue, kept for provenance only:
#   "Johnnyman1100's picture" / "Upload 38 files" / "4265aea verified"
# Build backend declaration (PEP 517 / PEP 518).
[build-system]
# setuptools 61.0 is the first release that reads project metadata from a
# PEP 621 [project] table, which this file relies on; an older floor lets
# a build frontend pick a backend that ignores that table.
# NOTE(review): setuptools-scm is kept as-is although the version in this
# file is declared statically — confirm whether it is still needed.
requires = ["setuptools>=61.0", "setuptools-scm>=3.4"]
build-backend = "setuptools.build_meta"

# Core distribution metadata (PEP 621).
[project]
name = "ez-tokenizer"
version = "1.0.0"
description = "High-performance tokenizer builder for code and text datasets with adaptive resource management"
readme = "README.md"
requires-python = ">=3.8"
# Free-form license text; paired with the "Other/Proprietary" classifier below.
license = { text = "MIT with Company Restriction" }
# NOTE(review): "[email protected]" looks like an email-obfuscation
# placeholder rather than a real address — replace with the actual contact.
authors = [
    { name = "NexForge", email = "[email protected]" },
]
maintainers = [
    { name = "NexForge", email = "[email protected]" },
]
classifiers = [
    "Development Status :: 4 - Beta",
    "Intended Audience :: Developers",
    "Intended Audience :: Science/Research",
    "License :: Other/Proprietary License",
    "Programming Language :: Python :: 3.8",
    "Programming Language :: Python :: 3.9",
    "Programming Language :: Python :: 3.10",
    "Programming Language :: Python :: 3.11",
    "Programming Language :: Python :: 3.12",
    "Topic :: Software Development :: Libraries :: Python Modules",
    "Topic :: Text Processing :: Linguistic",
]
# Runtime requirements installed with the package.
dependencies = [
    "torch>=1.9.0",
    "tokenizers>=0.12.0",
    "tqdm>=4.62.0",
    "psutil>=5.9.0",
    "python-dateutil>=2.8.2",
]

# Extras: install with `pip install ez-tokenizer[dev]`.
[project.optional-dependencies]
dev = [
    # Testing
    "pytest>=6.0",
    "pytest-cov>=2.12.1",
    "pytest-xdist>=2.4.0",
    # Formatting
    "black>=21.7b0",
    "isort>=5.0.0",
    # Static analysis
    "mypy>=0.910",
    "pylint>=2.11.0",
    # Git hooks
    "pre-commit>=2.15.0",
]

# setuptools-specific packaging options: sources live under src/.
[tool.setuptools]
# The root package namespace ("") maps to the src/ directory.
package-dir = { "" = "src" }
include-package-data = true

# Automatic package discovery, restricted to src/.
[tool.setuptools.packages.find]
namespaces = true
where = ["src"]

# Code formatter settings.
[tool.black]
target-version = ["py38"]
line-length = 88

# Import sorter settings, aligned with the formatter via the "black" profile.
[tool.isort]
profile = "black"
# NOTE(review): the options below presumably restate what the "black"
# profile already sets — confirm against the isort docs before pruning.
ensure_newline_before_comments = true
force_grid_wrap = 0
include_trailing_comma = true
multi_line_output = 3
use_parentheses = true

# Static type checker settings.
[tool.mypy]
# Third-party imports without type information are not reported.
ignore_missing_imports = true

# Strictness of function definitions and bodies.
check_untyped_defs = true
disallow_incomplete_defs = true
disallow_untyped_defs = true
no_implicit_optional = true

# Additional warnings.
warn_redundant_casts = true
warn_return_any = true
warn_unreachable = true
warn_unused_ignores = true

# Output formatting.
show_error_context = true