-
Notifications
You must be signed in to change notification settings - Fork 39
/
Copy pathrun_greaselm__medqa_usmle.sh
68 lines (56 loc) · 1.88 KB
/
run_greaselm__medqa_usmle.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
#!/bin/bash
export INHERIT_BERT=1
export CUDA_VISIBLE_DEVICES=0
export TOKENIZERS_PARALLELISM=true
dt=`date '+%Y%m%d_%H%M%S'`
dataset="medqa_usmle"
shift
encoder='cambridgeltl/SapBERT-from-PubMedBERT-fulltext'
args=$@
elr="5e-5"
dlr="1e-3"
bs=128
mbs=2
unfreeze_epoch=0
k=3 #num of gnn layers
gnndim=200
# Existing arguments but changed for GreaseLM
encoder_layer=-1
max_node_num=200
seed=5
lr_schedule=fixed
n_epochs=20
max_epochs_before_stop=10
ie_dim=400
max_seq_len=512
ent_emb=ddb
# Added for GreaseLM
info_exchange=true
ie_layer_num=1
resume_checkpoint=None
resume_id=None
sep_ie_layers=false
random_ent_emb=false
echo "***** hyperparameters *****"
echo "dataset: $dataset"
echo "enc_name: $encoder"
echo "batch_size: $bs mini_batch_size: $mbs"
echo "learning_rate: elr $elr dlr $dlr"
echo "gnn: dim $gnndim layer $k"
echo "ie_dim: ${ie_dim}, info_exchange: ${info_exchange}"
echo "******************************"
save_dir_pref='runs'
mkdir -p $save_dir_pref
run_name=greaselm__ds_${dataset}__enc_sapbert__k${k}__sd${seed}__iedim${ie_dim}__unfrz${unfreeze_epoch}__${dt}
log=logs/train_${dataset}__${run_name}.log.txt
###### Training ######
python3 -u greaselm.py \
--dataset $dataset \
--encoder $encoder -k $k --gnn_dim $gnndim -elr $elr -dlr $dlr -bs $bs --seed $seed -mbs ${mbs} --unfreeze_epoch ${unfreeze_epoch} --encoder_layer=${encoder_layer} -sl ${max_seq_len} --max_node_num ${max_node_num} \
--n_epochs $n_epochs --max_epochs_before_stop ${max_epochs_before_stop} \
--save_dir ${save_dir_pref}/${dataset}/${run_name} \
--run_name ${run_name} \
--ie_dim ${ie_dim} --info_exchange ${info_exchange} --ie_layer_num ${ie_layer_num} --resume_checkpoint ${resume_checkpoint} --resume_id ${resume_id} --sep_ie_layers ${sep_ie_layers} --random_ent_emb ${random_ent_emb} --ent_emb ${ent_emb//,/ } --lr_schedule ${lr_schedule} \
--data_dir data \
> ${log}
# echo log: ${log}