├── .gitignore ├── README.md ├── main.py ├── pyproject.toml ├── requirements.txt ├── src └── grpo_optuna │ ├── __init__.py │ ├── cli.py │ ├── data.py │ ├── pipeline.py │ ├── rewards.py │ └── text_utils.py ├── tests └── test_objective.py └── uv.lock /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/s-smits/grpo-optuna/HEAD/.gitignore -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/s-smits/grpo-optuna/HEAD/README.md -------------------------------------------------------------------------------- /main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/s-smits/grpo-optuna/HEAD/main.py -------------------------------------------------------------------------------- /pyproject.toml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/s-smits/grpo-optuna/HEAD/pyproject.toml -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/s-smits/grpo-optuna/HEAD/requirements.txt -------------------------------------------------------------------------------- /src/grpo_optuna/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/s-smits/grpo-optuna/HEAD/src/grpo_optuna/__init__.py -------------------------------------------------------------------------------- /src/grpo_optuna/cli.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/s-smits/grpo-optuna/HEAD/src/grpo_optuna/cli.py -------------------------------------------------------------------------------- /src/grpo_optuna/data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/s-smits/grpo-optuna/HEAD/src/grpo_optuna/data.py -------------------------------------------------------------------------------- /src/grpo_optuna/pipeline.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/s-smits/grpo-optuna/HEAD/src/grpo_optuna/pipeline.py -------------------------------------------------------------------------------- /src/grpo_optuna/rewards.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/s-smits/grpo-optuna/HEAD/src/grpo_optuna/rewards.py -------------------------------------------------------------------------------- /src/grpo_optuna/text_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/s-smits/grpo-optuna/HEAD/src/grpo_optuna/text_utils.py -------------------------------------------------------------------------------- /tests/test_objective.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/s-smits/grpo-optuna/HEAD/tests/test_objective.py -------------------------------------------------------------------------------- /uv.lock: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/s-smits/grpo-optuna/HEAD/uv.lock --------------------------------------------------------------------------------