From 4f4052829c50a631d62b8d4668f6acdcf0e8dd82 Mon Sep 17 00:00:00 2001
From: Younes Belkada <49240599+younesbelkada@users.noreply.github.com>
Date: Mon, 17 Jun 2024 17:08:32 +0200
Subject: [PATCH 1/4] remove old tests

---
 tests/test_kto_trainer.py | 54 ---------------------------------------
 1 file changed, 54 deletions(-)

diff --git a/tests/test_kto_trainer.py b/tests/test_kto_trainer.py
index 08a96a2a930..bc31cdbd32d 100644
--- a/tests/test_kto_trainer.py
+++ b/tests/test_kto_trainer.py
@@ -212,60 +212,6 @@ def test_kto_trainer(self, name, loss_type, pre_compute, eval_dataset):
                 if param.sum() != 0:
                     self.assertFalse(torch.equal(param, new_param))
 
-    @require_no_wandb
-    def test_kto_trainer_no_desirable_input(self):
-        with tempfile.TemporaryDirectory() as tmp_dir:
-            training_args = KTOConfig(
-                output_dir=tmp_dir,
-                remove_unused_columns=False,
-            )
-
-            dummy_dataset = self._init_dummy_dataset_no_desirable()
-
-            model = self.model
-            ref_model = self.ref_model
-            tokenizer = self.tokenizer
-
-            with self.assertRaises(
-                ValueError,
-                msg="The set of desirable completions cannot be empty.",
-            ):
-                _ = KTOTrainer(
-                    model=model,
-                    ref_model=ref_model,
-                    args=training_args,
-                    tokenizer=tokenizer,
-                    train_dataset=dummy_dataset,
-                    eval_dataset=None,
-                )
-
-    @require_no_wandb
-    def test_kto_trainer_only_desirable_input(self):
-        with tempfile.TemporaryDirectory() as tmp_dir:
-            training_args = KTOConfig(
-                output_dir=tmp_dir,
-                remove_unused_columns=False,
-            )
-
-            dummy_dataset = self._init_dummy_dataset_only_desirable()
-
-            model = self.model
-            ref_model = self.ref_model
-            tokenizer = self.tokenizer
-
-            with self.assertRaises(
-                ValueError,
-                msg="The set of undesirable completions cannot be empty.",
-            ):
-                _ = KTOTrainer(
-                    model=model,
-                    ref_model=ref_model,
-                    args=training_args,
-                    tokenizer=tokenizer,
-                    train_dataset=dummy_dataset,
-                    eval_dataset=None,
-                )
-
     def test_tokenize_and_process_tokens(self):
         with tempfile.TemporaryDirectory() as tmp_dir:
             training_args = KTOConfig(

From df7991a9759ff42119e0d12932099e3468ed0888 Mon Sep 17 00:00:00 2001
From: Younes Belkada <49240599+younesbelkada@users.noreply.github.com>
Date: Mon, 17 Jun 2024 17:12:34 +0200
Subject: [PATCH 2/4] remove datasets

---
 tests/test_kto_trainer.py | 68 ---------------------------------------
 1 file changed, 68 deletions(-)

diff --git a/tests/test_kto_trainer.py b/tests/test_kto_trainer.py
index bc31cdbd32d..bc315d7cb51 100644
--- a/tests/test_kto_trainer.py
+++ b/tests/test_kto_trainer.py
@@ -82,74 +82,6 @@ def _init_dummy_dataset(self):
         # fmt: on
         return Dataset.from_dict(dummy_dataset_dict)
 
-    def _init_dummy_dataset_only_desirable(self):
-        # fmt: off
-        dummy_dataset_unbalanced_dict = {
-            "prompt": [
-                "Hey, hello",
-                "How are you",
-                "What is your name?",
-                "What is your name?",
-                "Which is the best programming language?",
-                "Which is the best programming language?",
-                "Which is the best programming language?",
-            ],
-            "completion": [
-                "hi nice to meet you",
-                "leave me alone",
-                "I don't have a name",
-                "My name is Mary",
-                "Python",
-                "C++",
-                "Java",
-            ],
-            "label": [
-                True,
-                True,
-                True,
-                True,
-                True,
-                True,
-                True,
-            ],
-        }
-        # fmt: on
-        return Dataset.from_dict(dummy_dataset_unbalanced_dict)
-
-    def _init_dummy_dataset_no_desirable(self):
-        # fmt: off
-        dummy_dataset_unbalanced_dict = {
-            "prompt": [
-                "Hey, hello",
-                "How are you",
-                "What is your name?",
-                "What is your name?",
-                "Which is the best programming language?",
-                "Which is the best programming language?",
-                "Which is the best programming language?",
-            ],
-            "completion": [
-                "hi nice to meet you",
-                "leave me alone",
-                "I don't have a name",
-                "My name is Mary",
-                "Python",
-                "C++",
-                "Java",
-            ],
-            "label": [
-                False,
-                False,
-                False,
-                False,
-                False,
-                False,
-                False,
-            ],
-        }
-        # fmt: on
-        return Dataset.from_dict(dummy_dataset_unbalanced_dict)
-
     @parameterized.expand(
         [
             ["gpt2", "kto", True, True],

From 4f1c41915ea65aca94bf4eae9a58e411974f8d1f Mon Sep 17 00:00:00 2001
From: Younes Belkada <49240599+younesbelkada@users.noreply.github.com>
Date: Tue, 18 Jun 2024 10:38:54 +0200
Subject: [PATCH 3/4] Update test_dpo_trainer.py

---
 tests/test_dpo_trainer.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/tests/test_dpo_trainer.py b/tests/test_dpo_trainer.py
index e047c17cdb2..8b8630c39a9 100644
--- a/tests/test_dpo_trainer.py
+++ b/tests/test_dpo_trainer.py
@@ -35,7 +35,7 @@ def setUpClass(cls):
         cls.tokenizer.pad_token = cls.tokenizer.eos_token
 
         # get t5 as seq2seq example:
-        model_id = "trl-internal-testing/tiny-T5ForConditionalGeneration-correct-vocab"
+        model_id = "trl-internal-testing/T5ForConditionalGeneration-correct-vocab-calibrated"
         cls.t5_model = AutoModelForSeq2SeqLM.from_pretrained(model_id)
         cls.t5_ref_model = AutoModelForSeq2SeqLM.from_pretrained(model_id)
         cls.t5_tokenizer = AutoTokenizer.from_pretrained(model_id)

From 184b274920d9ab843ea495418674fb816ebcc5e9 Mon Sep 17 00:00:00 2001
From: Younes Belkada <49240599+younesbelkada@users.noreply.github.com>
Date: Tue, 18 Jun 2024 10:59:29 +0200
Subject: [PATCH 4/4] Update test_dpo_trainer.py

---
 tests/test_dpo_trainer.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/tests/test_dpo_trainer.py b/tests/test_dpo_trainer.py
index 8b8630c39a9..80856adeb3c 100644
--- a/tests/test_dpo_trainer.py
+++ b/tests/test_dpo_trainer.py
@@ -125,8 +125,8 @@ def test_dpo_trainer(self, name, loss_type, pre_compute):
                 ref_model = self.t5_ref_model
                 tokenizer = self.t5_tokenizer
 
-            if name == "t5" and loss_type == "nca_pair":
-                self.skipTest("For some reason t5 + nca_pair does not compute gradients properly on tiny models")
+            if name == "t5":
+                self.skipTest("For some reason t5 does not compute gradients properly on tiny models")
 
             trainer = DPOTrainer(
                 model=model,