[metadata] name = trl version = 0.19.0.dev0 description = Train transformer language models with reinforcement learning. long_description = file: README.md long_description_content_type = text/markdown author = Leandro von Werra author_email = leandro.vonwerra@gmail.com url = https://github.com/huggingface/trl keywords = transformers, huggingface, language modeling, post-training, rlhf, sft, dpo, grpo license_file = LICENSE classifiers = Development Status :: 2 - Pre-Alpha Intended Audience :: Developers Intended Audience :: Science/Research Natural Language :: English Operating System :: OS Independent Programming Language :: Python :: 3 Programming Language :: Python :: 3.9 Programming Language :: Python :: 3.10 Programming Language :: Python :: 3.11 Programming Language :: Python :: 3.12 Programming Language :: Python :: 3.13 [options] packages = find: python_requires = >=3.9 include_package_data = True install_requires = accelerate>=1.4.0 datasets>=3.0.0 transformers>=4.51.0 [options.packages.find] exclude = tests* [options.package_data] trl = templates/*.md accelerate_configs/*.yaml [options.extras_require] bco = scikit-learn joblib deepspeed = deepspeed>=0.14.4 diffusers = diffusers>=0.18.0 judges = openai>=1.23.2 llm-blender>=0.0.2 liger = liger-kernel>=0.5.9 peft = peft>=0.8.0 quantization = bitsandbytes scikit = scikit-learn test = parameterized pytest-cov pytest-rerunfailures pytest-xdist pytest vllm = # vLLM package does not yet support Python 3.13. These constraints can be lifted once support is added: # see https://github.com/vllm-project/vllm/pull/13164 vllm>=0.8.3; python_version < "3.13" fastapi; python_version < "3.13" pydantic; python_version < "3.13" requests; python_version < "3.13" uvicorn; python_version < "3.13" vlm = Pillow dev = %(bco)s %(deepspeed)s %(diffusers)s %(judges)s %(liger)s %(peft)s %(quantization)s %(scikit)s %(test)s %(vlm)s [options.entry_points] console_scripts = trl = trl.cli:main [coverage:run] branch = True