diff --git a/tests/test_rloo_trainer.py b/tests/test_rloo_trainer.py index 6861b6e83e..2672d37f9c 100644 --- a/tests/test_rloo_trainer.py +++ b/tests/test_rloo_trainer.py @@ -12,8 +12,6 @@ # See the License for the specific language governing permissions and # limitations under the License. -import platform -import subprocess import tempfile import unittest @@ -24,34 +22,6 @@ from trl import RLOOConfig, RLOOTrainer -def test(): - command = """\ -python examples/scripts/rloo/rloo.py \ - --dataset_name trl-internal-testing/descriptiveness-sentiment-trl-style \ - --dataset_train_split descriptiveness \ - --learning_rate 3e-6 \ - --output_dir models/minimal/rloo \ - --per_device_train_batch_size 4 \ - --gradient_accumulation_steps 1 \ - --total_episodes 10 \ - --model_name_or_path trl-internal-testing/tiny-Qwen2ForCausalLM-2.5 \ - --sft_model_path trl-internal-testing/tiny-Qwen2ForCausalLM-2.5 \ - --reward_model_path trl-internal-testing/tiny-Qwen2ForCausalLM-2.5 \ - --missing_eos_penalty 1.0 \ - --save_strategy no \ - --stop_token eos -""" - if platform.system() == "Windows": - # windows CI does not work with subprocesses for some reason - # e.g., https://github.com/huggingface/trl/actions/runs/9600036224/job/26475286210?pr=1743 - return - subprocess.run( - command, - shell=True, - check=True, - ) - - class RLOOTrainerTester(unittest.TestCase): def setUp(self): self.model_id = "trl-internal-testing/tiny-Qwen2ForCausalLM-2.5"