#!/bin/bash
# Append every failing command, with its line number, to error_log.txt.
log_error() {
    echo "$(date) - Error in script at line $1: $2" >> error_log.txt
}
trap 'log_error $LINENO "$BASH_COMMAND"' ERR
# ----------------------------------------------------------------------------------
# It's important to note that:
# - we trained all models for approximately 8 hours on a single A100 GPU (40 GB)
# - checkpoints for each of the models below are already available at https://huggingface.co/Wouter01/mT5Ranking
# - uncommenting all of the commands below will result in a run time of at least a month on a single A100 GPU (on the large dataset)
# - if you decide to increase/decrease the batch size, we recommend scaling the learning rate by the same factor (see the example below)
# ----------------------------------------------------------------------------------
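# Example of the scaling rule above, based on the QA+ configuration at the
# bottom of this file (lr 5e-5 at batch size 8): doubling the batch size to 16
# doubles the learning rate to 1e-4. The command is illustrative and, like the
# rest of this file, commented out:
# python train.py --lr 1e-4 --batch_size 16 --labda 0.0 --dataset large --model QA+ --prompt QA+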
cd code || exit 1  # train.py lives in code/; abort if the directory is missing
# python train.py --batch_size 32 --labda 0.0 --dataset large --model CGc --prompt titles
# python train.py --batch_size 32 --labda 0.4 --dataset large --model CGc --prompt titles
# python train.py --batch_size 32 --labda 0.0 --dataset large --model CGc --prompt subtitles
# python train.py --batch_size 32 --labda 0.4 --dataset large --model CGc --prompt subtitles
# python train.py --batch_size 32 --labda 0.0 --dataset large --model CGc --prompt diversity
# python train.py --batch_size 32 --labda 0.4 --dataset large --model CGc --prompt diversity
# python train.py --batch_size 32 --labda 0.0 --dataset large --model CGc --prompt pubtime
# python train.py --batch_size 32 --labda 0.4 --dataset large --model CGc --prompt pubtime
# python train.py --batch_size 32 --labda 0.0 --dataset large --model CG --prompt titles
# python train.py --batch_size 32 --labda 0.4 --dataset large --model CG --prompt titles
# python train.py --batch_size 32 --labda 0.0 --dataset large --model CG --prompt subtitles
# python train.py --batch_size 32 --labda 0.4 --dataset large --model CG --prompt subtitles
# python train.py --batch_size 32 --labda 0.0 --dataset large --model CG --prompt diversity
# python train.py --batch_size 32 --labda 0.4 --dataset large --model CG --prompt diversity
# python train.py --batch_size 32 --labda 0.0 --dataset large --model CG --prompt pubtime
# python train.py --batch_size 32 --labda 0.4 --dataset large --model CG --prompt pubtime
# python train.py --batch_size 16 --labda 0.0 --dataset large --model QA --prompt titles
# python train.py --batch_size 16 --labda 0.4 --dataset large --model QA --prompt titles
# python train.py --batch_size 16 --labda 0.0 --dataset large --model QA --prompt subtitles
# python train.py --batch_size 16 --labda 0.4 --dataset large --model QA --prompt subtitles
# python train.py --batch_size 16 --labda 0.0 --dataset large --model QA --prompt diversity
# python train.py --batch_size 16 --labda 0.4 --dataset large --model QA --prompt diversity
# python train.py --batch_size 16 --labda 0.0 --dataset large --model QA --prompt pubtime
# python train.py --batch_size 16 --labda 0.4 --dataset large --model QA --prompt pubtime
# python train.py --lr 5e-5 --batch_size 8 --labda 0.0 --dataset large --model QA+ --prompt QA+
# python train.py --lr 5e-5 --batch_size 8 --labda 0.4 --dataset large --model QA+ --prompt QA+
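
# Rather than retraining, the pretrained checkpoints can be fetched from the
# Hugging Face repository linked above. A minimal sketch, assuming the
# huggingface_hub CLI is installed (pip install -U huggingface_hub); the
# checkpoints/ target directory is an arbitrary choice:
# huggingface-cli download Wouter01/mT5Ranking --local-dir checkpoints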