BDEPEND=dev-python/torch[python_targets_python3_11(-)?,python_targets_python3_12(-)?,python_targets_python3_13(-)?,python_targets_python3_14(-)?] dev-python/transformers[python_targets_python3_11(-)?,python_targets_python3_12(-)?,python_targets_python3_13(-)?,python_targets_python3_14(-)?] =dev-python/gpep517-15[python_targets_python3_11(-)?,python_targets_python3_12(-)?,python_targets_python3_13(-)?,python_targets_python3_14(-)?] DEFINED_PHASES=compile configure install prepare test unpack DESCRIPTION=Train transformer language models with reinforcement learning. EAPI=8 HOMEPAGE=https://github.com/huggingface/trl INHERIT=python-r1 gs-pypi IUSE=benchmark deepspeed dev diffusers llm-judge peft quantization test python_targets_python3_11 python_targets_python3_12 python_targets_python3_13 python_targets_python3_14 KEYWORDS=~amd64 ~x86 LICENSE=Apache-2.0 RDEPEND=dev-python/torch[python_targets_python3_11(-)?,python_targets_python3_12(-)?,python_targets_python3_13(-)?,python_targets_python3_14(-)?] dev-python/transformers[python_targets_python3_11(-)?,python_targets_python3_12(-)?,python_targets_python3_13(-)?,python_targets_python3_14(-)?]