mirror of
https://github.com/NousResearch/atropos.git
synced 2026-04-24 17:04:55 +00:00
simplified config and reward
This commit is contained in:
parent
7e95c0b67d
commit
c506bb147e
4 changed files with 210 additions and 455 deletions
|
|
@ -4,7 +4,7 @@ from transformers import PreTrainedTokenizer
|
|||
from atroposlib.type_definitions import Message
|
||||
|
||||
# Roles that should NOT be masked in the loss calculation (i.e. used for training)
|
||||
UNMASKED_ROLES = ["assistant"]
|
||||
UNMASKED_ROLES = ["assistant", "agent"]
|
||||
|
||||
|
||||
def tokenize_for_trainer(
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue