-
Notifications
You must be signed in to change notification settings - Fork 455
/
train_nsp.sh
43 lines (41 loc) · 1.69 KB
/
train_nsp.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
#!/bin/bash
#
# Launches `fairseq-train` with the `sentence_prediction` task and criterion
# (2 classes) on a binarized dataset, starting from an existing checkpoint.
#
# Usage: train_nsp.sh <task> <model.pt>
#   <task>      Task name. Data is read from "<task>_data_bin" and the
#               classification head is named "<task>_head".
#   <model.pt>  Checkpoint handed to --restore-file. The text after the last
#               "_" in its basename (with ".pt" removed) selects the
#               architecture "musicbert_<text>", so the file name must end in
#               the architecture size (presumably e.g. "..._base.pt" -- verify
#               against the architectures registered in the musicbert user dir).
#
# Requires `nvidia-smi` and `fairseq-train` on PATH and a `musicbert`
# directory (passed as --user-dir) relative to the working directory.
set -euo pipefail

# Print a message to stderr and abort with status 1.
die() {
  printf '%s\n' "$*" >&2
  exit 1
}

# Validate arguments before doing any work. Empty values are rejected as well
# as missing ones, since they would yield a broken command line.
if [[ -z "${1:-}" ]]; then die "task not set"; else echo "task = ${1}"; fi
if [[ -z "${2:-}" ]]; then die "model not set"; else echo "model = ${2}"; fi

TOTAL_NUM_UPDATES=250000
WARMUP_UPDATES=50000
PEAK_LR=0.00005
TOKENS_PER_SAMPLE=8192
MAX_POSITIONS=8192
BATCH_SIZE=64     # target number of samples per optimizer update (all GPUs)
MAX_SENTENCES=4   # samples per GPU per forward/backward pass

# Count local GPUs: nvidia-smi prints one line per device.
if ! gpu_names=$(nvidia-smi --query-gpu=name --format=csv,noheader); then
  die "nvidia-smi failed; cannot determine the number of local GPUs"
fi
N_GPU_LOCAL=$(grep -c . <<<"${gpu_names}" || true)
(( N_GPU_LOCAL > 0 )) || die "no GPUs reported by nvidia-smi"

# Gradient-accumulation steps needed to reach BATCH_SIZE. Integer division
# truncates, so with more than BATCH_SIZE / MAX_SENTENCES GPUs the result
# would be 0; clamp to 1 in that case.
UPDATE_FREQ=$(( BATCH_SIZE / MAX_SENTENCES / N_GPU_LOCAL ))
if (( UPDATE_FREQ < 1 )); then
  printf 'warning: %d GPUs x %d samples exceeds BATCH_SIZE=%d; using --update-freq 1\n' \
    "${N_GPU_LOCAL}" "${MAX_SENTENCES}" "${BATCH_SIZE}" >&2
  UPDATE_FREQ=1
fi

HEAD_NAME="${1}_head"
MUSICBERT_PATH="${2}"
CHECKPOINT_SUFFIX="nsp_${1}_$(basename -- "${2%.pt}")"
# Everything after the last underscore of the suffix, i.e. the trailing
# component of the checkpoint's file name.
ARCH="musicbert_${CHECKPOINT_SUFFIX##*_}"

# Build the command as an array so every argument survives as a single word.
train_args=(
  "${1}_data_bin" --user-dir musicbert
  --restore-file "${MUSICBERT_PATH}"
  --max-update "${TOTAL_NUM_UPDATES}"
  --batch-size "${MAX_SENTENCES}" --update-freq "${UPDATE_FREQ}"
  --max-positions "${MAX_POSITIONS}"
  --max-tokens "$(( TOKENS_PER_SAMPLE * MAX_SENTENCES ))"
  --task sentence_prediction
  --reset-optimizer --reset-dataloader --reset-meters
  --required-batch-size-multiple 1
  --num-workers 0
  --init-token 0 --separator-token 2
  --arch "${ARCH}"
  --criterion sentence_prediction
  --classification-head-name "${HEAD_NAME}"
  --num-classes 2
  --dropout 0.1 --attention-dropout 0.1 --weight-decay 0.1
  --optimizer adam --adam-betas "(0.9, 0.98)" --adam-eps 1e-6 --clip-norm 0.0
  --lr-scheduler polynomial_decay --lr "${PEAK_LR}"
  --total-num-update "${TOTAL_NUM_UPDATES}" --warmup-updates "${WARMUP_UPDATES}"
  --log-format simple --log-interval 100
  --best-checkpoint-metric accuracy --maximize-best-checkpoint-metric
  --shorten-method "truncate"
  --checkpoint-suffix "_${CHECKPOINT_SUFFIX}"
  --no-epoch-checkpoints
  --disable-validation
  --find-unused-parameters
)

fairseq-train "${train_args[@]}"