Fix chain sum veRL example for latest veRL (#371)

* fixes for latest verl

* add balance_batch config

* 1 -> 2 gpu

* tweaks

* also add raw ids to server script
This commit is contained in:
Oliver Stanley 2025-03-14 19:15:54 +00:00 committed by GitHub
parent 8a0cacc054
commit bd13b1b92a
No known key found for this signature in database
GPG key ID: B5690EEEBB952194
5 changed files with 11 additions and 1 deletions

View file

@@ -118,6 +118,7 @@ class ReasoningGymDataset(Dataset):
"entry_id": entry.entry_id,
"metadata": entry.metadata,
"index": index,
"raw_prompt_ids": self.tokenizer.encode(prompt, add_special_tokens=False),
}
# Add raw chat if requested