Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

ktotrainer: Refuse datasets which contain only one class of labels #1724

Merged
merged 2 commits into from
Jun 11, 2024
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
3 changes: 2 additions & 1 deletion docs/source/kto_trainer.mdx
Original file line number Diff line number Diff line change
Expand Up @@ -49,7 +49,8 @@ kto_dataset_dict = {
```

where the `prompt` contains the context inputs, `completion` contains the corresponding responses and `label` contains the corresponding flag that indicates if the generated completion is desired (`True`) or undesired (`False`).
A prompt can have multiple responses and this is reflected in the entries being repeated in the dictionary's value arrays.
A prompt can have multiple responses, and this is reflected in the entries being repeated in the dictionary's value arrays. The dataset must contain at least one desirable and at least one undesirable completion.


## Expected model format
The KTO trainer expects a model of `AutoModelForCausalLM`, compared to PPO that expects `AutoModelForCausalLMWithValueHead` for the value function.
Expand Down
122 changes: 122 additions & 0 deletions tests/test_kto_trainer.py
Original file line number Diff line number Diff line change
Expand Up @@ -82,6 +82,74 @@ def _init_dummy_dataset(self):
# fmt: on
return Dataset.from_dict(dummy_dataset_dict)

def _init_dummy_dataset_only_desirable(self):
    """Build a dummy KTO dataset in which every completion is labeled desirable (True)."""
    prompts = [
        "Hey, hello",
        "How are you",
        "What is your name?",
        "What is your name?",
        "Which is the best programming language?",
        "Which is the best programming language?",
        "Which is the best programming language?",
    ]
    completions = [
        "hi nice to meet you",
        "leave me alone",
        "I don't have a name",
        "My name is Mary",
        "Python",
        "C++",
        "Java",
    ]
    # Every label is True, so the dataset has no undesirable examples at all.
    return Dataset.from_dict(
        {
            "prompt": prompts,
            "completion": completions,
            "label": [True] * len(prompts),
        }
    )

def _init_dummy_dataset_no_desirable(self):
    """Build a dummy KTO dataset in which every completion is labeled undesirable (False)."""
    prompts = [
        "Hey, hello",
        "How are you",
        "What is your name?",
        "What is your name?",
        "Which is the best programming language?",
        "Which is the best programming language?",
        "Which is the best programming language?",
    ]
    completions = [
        "hi nice to meet you",
        "leave me alone",
        "I don't have a name",
        "My name is Mary",
        "Python",
        "C++",
        "Java",
    ]
    # Every label is False, so the dataset has no desirable examples at all.
    return Dataset.from_dict(
        {
            "prompt": prompts,
            "completion": completions,
            "label": [False] * len(prompts),
        }
    )

@parameterized.expand(
[
["gpt2", "kto", True, True],
Expand Down Expand Up @@ -144,6 +212,60 @@ def test_kto_trainer(self, name, loss_type, pre_compute, eval_dataset):
if param.sum() != 0:
self.assertFalse(torch.equal(param, new_param))

@require_no_wandb
def test_kto_trainer_no_desirable_input(self):
    """KTOTrainer must reject a dataset whose labels are all False (no desirable completions)."""
    with tempfile.TemporaryDirectory() as tmp_dir:
        training_args = KTOConfig(
            output_dir=tmp_dir,
            remove_unused_columns=False,
        )

        dummy_dataset = self._init_dummy_dataset_no_desirable()

        # NOTE: assertRaises(..., msg=...) does NOT check the exception's text —
        # `msg` is only the failure message shown when nothing is raised. Use
        # assertRaisesRegex so the test verifies the *specific* ValueError is
        # raised, not just any ValueError from trainer construction.
        with self.assertRaisesRegex(
            ValueError,
            "The set of desirable completions cannot be empty",
        ):
            _ = KTOTrainer(
                model=self.model,
                ref_model=self.ref_model,
                args=training_args,
                tokenizer=self.tokenizer,
                train_dataset=dummy_dataset,
                eval_dataset=None,
            )

@require_no_wandb
def test_kto_trainer_only_desirable_input(self):
    """KTOTrainer must reject a dataset whose labels are all True (no undesirable completions)."""
    with tempfile.TemporaryDirectory() as tmp_dir:
        training_args = KTOConfig(
            output_dir=tmp_dir,
            remove_unused_columns=False,
        )

        dummy_dataset = self._init_dummy_dataset_only_desirable()

        # NOTE: assertRaises(..., msg=...) does NOT check the exception's text —
        # `msg` is only the failure message shown when nothing is raised. Use
        # assertRaisesRegex so the test verifies the *specific* ValueError is
        # raised, not just any ValueError from trainer construction.
        with self.assertRaisesRegex(
            ValueError,
            "The set of undesirable completions cannot be empty",
        ):
            _ = KTOTrainer(
                model=self.model,
                ref_model=self.ref_model,
                args=training_args,
                tokenizer=self.tokenizer,
                train_dataset=dummy_dataset,
                eval_dataset=None,
            )

def test_tokenize_and_process_tokens(self):
with tempfile.TemporaryDirectory() as tmp_dir:
training_args = KTOConfig(
Expand Down
5 changes: 5 additions & 0 deletions trl/trainer/kto_trainer.py
Original file line number Diff line number Diff line change
Expand Up @@ -646,6 +646,11 @@ def make_inputs_require_grad(module, input, output):
lambda x: not x["label"], num_proc=args.dataset_num_proc, desc="Filtering undesirable examples"
)

if len(desirable) == 0:
raise ValueError("The set of desirable completions cannot be empty.")
elif len(undesirable) == 0:
raise ValueError("The set of undesirable completions cannot be empty.")

if len(desirable) != len(undesirable):
# The lower and upper bounds come from Eq. (8) of https://arxiv.org/abs/2402.01306
des_weight_lower_bound = round((len(undesirable) * self.undesirable_weight / len(desirable)) * 1, 2)
Expand Down
Loading