mirror of
https://github.com/open-thought/reasoning-gym.git
synced 2026-04-22 16:49:06 +00:00
Test training with trl (#70)
* First TRL GRPO implementation * Added config YAML file * Added README and dependencies * Updated reward format function
This commit is contained in:
parent
a607db79f7
commit
d61db3772a
5 changed files with 287 additions and 0 deletions
10
examples/trl/requirements.txt
Normal file
10
examples/trl/requirements.txt
Normal file
|
|
@ -0,0 +1,10 @@
|
|||
torch --index-url https://download.pytorch.org/whl/cu124
|
||||
torchvision --index-url https://download.pytorch.org/whl/cu124
|
||||
torchaudio --index-url https://download.pytorch.org/whl/cu124
|
||||
datasets
|
||||
peft
|
||||
transformers
|
||||
trl
|
||||
wandb
|
||||
huggingface_hub
|
||||
flash-attn --no-build-isolation
|
||||
Loading…
Add table
Add a link
Reference in a new issue