| [project] | |
| name = "grpo-countdown-problem" | |
| version = "0.1.0" | |
| description = "A simple project training an LLM to solve the GRPO countdown problem" | |
| requires-python = ">=3.12" | |
| dependencies = [ | |
| "datasets>=4.1.1", | |
| "hydra-core>=1.3.2", | |
| "metrics>=0.0.2", | |
| "openai>=1.0.0", | |
| "pandas>=2.0.0", | |
| "peft>=0.17.1", | |
| "python-dotenv>=1.1.1", | |
| "scikit-learn>=1.3.0", | |
| "tensorboard>=2.20.0", | |
| "trl>=0.23.0", | |
| ] | |
| [dependency-groups] | |
| dev = [ | |
| "ruff>=0.13.1", | |
| ] | |
| [tool.ruff] | |
| # Exclude a variety of commonly ignored directories. | |
| exclude = [ | |
| ".bzr", | |
| ".direnv", | |
| ".eggs", | |
| ".git", | |
| ".git-rewrite", | |
| ".hg", | |
| ".ipynb_checkpoints", | |
| ".mypy_cache", | |
| ".nox", | |
| ".pants.d", | |
| ".pyenv", | |
| ".pytest_cache", | |
| ".pytype", | |
| ".ruff_cache", | |
| ".svn", | |
| ".tox", | |
| ".venv", | |
| ".vscode", | |
| "__pypackages__", | |
| "_build", | |
| "buck-out", | |
| "build", | |
| "dist", | |
| "node_modules", | |
| "site-packages", | |
| "venv", | |
| ] | |
| # Same as Black. | |
| line-length = 88 | |
| indent-width = 4 | |
| # Assume Python 3.12 | |
| target-version = "py312" | |
| [tool.ruff.lint] | |
| # Enable Pyflakes (`F`) and a subset of the pycodestyle (`E`) codes by default. | |
| select = [ | |
| "E4", # Import errors | |
| "E7", # Statement errors | |
| "E9", # Runtime errors | |
| "F", # Pyflakes | |
| "W", # pycodestyle warnings | |
| "I", # isort | |
| "N", # pep8-naming | |
| "UP", # pyupgrade | |
| "B", # flake8-bugbear | |
| "C4", # flake8-comprehensions | |
| "SIM", # flake8-simplify | |
| "RUF", # Ruff-specific rules | |
| ] | |
| ignore = [ | |
| "E501", # Line too long (handled by formatter) | |
| "E722", # Do not use bare except | |
| ] | |
| # Allow fix for all enabled rules (when `--fix`) is provided. | |
| fixable = ["ALL"] | |
| unfixable = [] | |
| # Allow unused variables when underscore-prefixed. | |
| dummy-variable-rgx = "^(_+|(_+[a-zA-Z0-9_]*[a-zA-Z0-9]+?))$" | |
| [tool.ruff.format] | |
| # Like Black, use double quotes for strings. | |
| quote-style = "double" | |
| # Like Black, indent with spaces, rather than tabs. | |
| indent-style = "space" | |
| # Like Black, respect magic trailing commas. | |
| skip-magic-trailing-comma = false | |
| # Like Black, automatically detect the appropriate line ending. | |
| line-ending = "auto" | |