We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent d9f9e2b, commit 8b0a3ce
Copy full SHA for 8b0a3ce
trl/trainer/reward_trainer.py
@@ -488,13 +488,15 @@ def tokenize_fn(example, processing_class):
488
chosen_input_ids = processing_class.apply_chat_template(
489
example["chosen"],
490
tools=example.get("tools"),
491
+ return_dict=True,
492
**example.get("chat_template_kwargs", {}),
- )
493
+ )["input_ids"]
494
rejected_input_ids = processing_class.apply_chat_template(
495
example["rejected"],
496
497
498
499
500
output = {"chosen_input_ids": chosen_input_ids, "rejected_input_ids": rejected_input_ids}
501
else:
502
output = {
0 commit comments