[build-system]
# The PEP 621 `[project]` table below is only read by setuptools 61.0 and
# newer; older releases ignore it and would build a package with no metadata.
# NOTE(review): `version` is declared statically in `[project]`; confirm that
# setuptools-scm is still needed at build time before keeping or dropping it.
requires = ["setuptools>=61.0", "setuptools-scm>=3.4"]
build-backend = "setuptools.build_meta"

[project]
name = "ez-tokenizer"
version = "1.0.0"
description = "High-performance tokenizer builder for code and text datasets with adaptive resource management"
readme = "README.md"
requires-python = ">=3.8"
license = { text = "MIT with Company Restriction" }
authors = [
    { name = "NexForge", email = "jm.talbot@outlook.com" },
]
maintainers = [
    { name = "NexForge", email = "jm.talbot@outlook.com" },
]
classifiers = [
    "Development Status :: 4 - Beta",
    "Intended Audience :: Developers",
    "Intended Audience :: Science/Research",
    "License :: Other/Proprietary License",
    "Programming Language :: Python :: 3.8",
    "Programming Language :: Python :: 3.9",
    "Programming Language :: Python :: 3.10",
    "Programming Language :: Python :: 3.11",
    "Programming Language :: Python :: 3.12",
    "Topic :: Software Development :: Libraries :: Python Modules",
    "Topic :: Text Processing :: Linguistic",
]
# Runtime requirements (PEP 508 strings), sorted alphabetically.
dependencies = [
    "psutil>=5.9.0",
    "python-dateutil>=2.8.2",
    "tokenizers>=0.12.0",
    "torch>=1.9.0",
    "tqdm>=4.62.0",
]

[project.optional-dependencies]
# Development tooling: formatters, linters, type checker and test runner.
dev = [
    "black>=21.7b0",
    "isort>=5.0.0",
    "mypy>=0.910",
    "pre-commit>=2.15.0",
    "pylint>=2.11.0",
    "pytest>=6.0",
    "pytest-cov>=2.12.1",
    "pytest-xdist>=2.4.0",
]

[tool.setuptools]
include-package-data = true
# Packages live under `src/` (src layout).
package-dir = { "" = "src" }

[tool.setuptools.packages.find]
where = ["src"]
namespaces = true

[tool.black]
line-length = 88
target-version = ["py38"]

[tool.isort]
# The explicit keys below restate values alongside the "black" profile.
profile = "black"
multi_line_output = 3
include_trailing_comma = true
force_grid_wrap = 0
use_parentheses = true
ensure_newline_before_comments = true

[tool.mypy]
ignore_missing_imports = true
disallow_untyped_defs = true
disallow_incomplete_defs = true
check_untyped_defs = true
no_implicit_optional = true
warn_redundant_casts = true
warn_unused_ignores = true
warn_return_any = true
warn_unreachable = true
show_error_context = true