From bb614286e30a80a24000f8e711989b5c664213a1 Mon Sep 17 00:00:00 2001
From: lmeribal
Date: Thu, 28 Nov 2024 13:17:17 +0000
Subject: [PATCH] ld-dpo config

---
 tests/fixtures/configs/train/lddpo/base.json | 1 +
 1 file changed, 1 insertion(+)

diff --git a/tests/fixtures/configs/train/lddpo/base.json b/tests/fixtures/configs/train/lddpo/base.json
index 3140625..43eae2a 100644
--- a/tests/fixtures/configs/train/lddpo/base.json
+++ b/tests/fixtures/configs/train/lddpo/base.json
@@ -112,6 +112,7 @@
 "pad_token": ""
 },
 "trainer_settings": {
+"lc_alpha": 0.5,
 "evaluation_strategy": "steps",
 "per_device_train_batch_size": 2,
 "per_device_eval_batch_size": 2,