mirror of
https://github.com/open-thought/reasoning-gym.git
synced 2026-04-26 17:13:17 +00:00
Fix chain sum veRL example for latest veRL (#371)
* fixes for latest veRL * add balance_batch config * 1 -> 2 GPUs * tweaks * also add raw ids to server script
This commit is contained in:
parent
8a0cacc054
commit
bd13b1b92a
5 changed files with 11 additions and 1 deletions
|
|
@ -118,6 +118,7 @@ class ReasoningGymDataset(Dataset):
|
|||
"entry_id": entry.entry_id,
|
||||
"metadata": entry.metadata,
|
||||
"index": index,
|
||||
"raw_prompt_ids": self.tokenizer.encode(prompt, add_special_tokens=False),
|
||||
}
|
||||
|
||||
# Add raw chat if requested
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue