From 9f0ee02d4b011c789b4ded28185fbd2a6621cf5b Mon Sep 17 00:00:00 2001
From: Pengcheng He
Date: Tue, 9 Feb 2021 10:47:42 -0500
Subject: [PATCH] Add qqp script

---
 experiments/glue/qqp.sh | 20 ++++++++++----------
 1 file changed, 10 insertions(+), 10 deletions(-)

diff --git a/experiments/glue/qqp.sh b/experiments/glue/qqp.sh
index 96cec4d..6c55cac 100755
--- a/experiments/glue/qqp.sh
+++ b/experiments/glue/qqp.sh
@@ -24,14 +24,14 @@ case ${init,,} in
 	parameters=" --num_train_epochs 8 \
 	--warmup 500 \
 	--learning_rate 2e-5 \
-	--train_batch_size 32 \
+	--train_batch_size 64 \
 	--cls_drop_out 0.15 "
 	;;
 	large)
 	parameters=" --num_train_epochs 8 \
 	--warmup 500 \
 	--learning_rate 1e-5 \
-	--train_batch_size 32 \
+	--train_batch_size 64 \
 	--cls_drop_out 0.15 \
 	--fp16 True "
 	;;
@@ -39,23 +39,23 @@ case ${init,,} in
 	parameters=" --num_train_epochs 8 \
 	--warmup 500 \
 	--learning_rate 7e-6 \
-	--train_batch_size 32 \
+	--train_batch_size 64 \
 	--cls_drop_out 0.2 \
 	--fp16 True "
 	;;
 	xlarge-v2)
-	parameters=" --num_train_epochs 8 \
-	--warmup 500 \
+	parameters=" --num_train_epochs 10 \
+	--warmup 1000 \
 	--learning_rate 4e-6 \
-	--train_batch_size 32 \
+	--train_batch_size 64 \
 	--cls_drop_out 0.2 \
 	--fp16 True "
 	;;
 	xxlarge-v2)
-	parameters=" --num_train_epochs 8 \
-	--warmup 500 \
+	parameters=" --num_train_epochs 10 \
+	--warmup 1000 \
 	--learning_rate 3e-6 \
-	--train_batch_size 32 \
+	--train_batch_size 64 \
 	--cls_drop_out 0.2 \
 	--fp16 True "
 	;;
@@ -74,7 +74,7 @@ esac
 python -m DeBERTa.apps.run --model_config config.json \
 	--tag $tag \
 	--do_train \
-	--max_seq_len 512 \
+	--max_seq_len 320 \
 	--task_name $Task \
 	--data_dir $cache_dir/glue_tasks/$Task \
 	--init_model $init \