-
Notifications
You must be signed in to change notification settings - Fork 7
/
Copy pathrun_sts.sh
50 lines (49 loc) · 1.68 KB
/
run_sts.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
#!/bin/bash
model=${MODEL:-princeton-nlp/sup-simcse-roberta-large} # pre-trained model
encoding=${ENCODER_TYPE:-bi_encoder} # cross_encoder, bi_encoder, tri_encoder
lr=${LR:-1e-5} # learning rate
wd=${WD:-0.1} # weight decay
transform=${TRANSFORM:-False} # whether to use an additional linear layer after the encoder
objective=${OBJECTIVE:-mse} # mse, triplet, triplet_mse
triencoder_head=${TRIENCODER_HEAD:-None} # hadamard, concat (set for tri_encoder)
seed=${SEED:-42}
output_dir=${OUTPUT_DIR:-output}
config=enc_${encoding}__lr_${lr}__wd_${wd}__trans_${transform}__obj_${objective}__tri_${triencoder_head}__s_${seed}
train_file=${TRAIN_FILE:-data/csts_train.csv}
eval_file=${EVAL_FILE:-data/csts_validation.csv}
test_file=${TEST_FILE:-data/csts_test.csv}
python run_sts.py \
--output_dir "${output_dir}/${model//\//__}/${config}" \
--model_name_or_path ${model} \
--objective ${objective} \
--encoding_type ${encoding} \
--pooler_type cls \
--freeze_encoder False \
--transform ${transform} \
--triencoder_head ${triencoder_head} \
--max_seq_length 512 \
--train_file ${train_file} \
--validation_file ${eval_file} \
--test_file ${test_file} \
--condition_only False \
--sentences_only False \
--do_train \
--do_eval \
--do_predict \
--evaluation_strategy epoch \
--per_device_train_batch_size 8 \
--gradient_accumulation_steps 4 \
--learning_rate ${lr} \
--weight_decay ${wd} \
--max_grad_norm 0.0 \
--num_train_epochs 3 \
--lr_scheduler_type linear \
--warmup_ratio 0.1 \
--log_level info \
--disable_tqdm True \
--save_strategy epoch \
--save_total_limit 1 \
--seed ${seed} \
--data_seed ${seed} \
--fp16 True \
--log_time_interval 15