boris committed on
Commit
650ecb1
1 Parent(s): 8ba598c

feat: update script

Browse files
Files changed (2) hide show
  1. seq2seq/do_run.sh +8 -3
  2. seq2seq/sweep.yaml +1 -1
seq2seq/do_run.sh CHANGED
@@ -3,9 +3,14 @@ python run_seq2seq_flax.py \
3
  --train_file /data/CC12M/encoded-small-train.tsv \
4
  --validation_file /data/CC12M/encoded-small-valid.tsv \
5
  --output_dir output \
6
- --per_device_train_batch_size 24 \
7
- --per_device_eval_batch_size 24 \
8
- --preprocessing_num_workers 48 \
9
  --warmup_steps 1000 \
 
10
  --do_train \
11
  --do_eval \
 
 
 
 
 
3
  --train_file /data/CC12M/encoded-small-train.tsv \
4
  --validation_file /data/CC12M/encoded-small-valid.tsv \
5
  --output_dir output \
6
+ --per_device_train_batch_size 56 \
7
+ --per_device_eval_batch_size 56 \
8
+ --preprocessing_num_workers 80 \
9
  --warmup_steps 1000 \
10
+ --gradient_accumulation_steps 8 \
11
  --do_train \
12
  --do_eval \
13
+ --adafactor \
14
+ --num_train_epochs 1 \
15
+ --max_train_samples 200000 \
16
+ --learning_rate
seq2seq/sweep.yaml CHANGED
@@ -25,7 +25,7 @@ command:
25
  - "--num_train_epochs"
26
  - 1
27
  - "--max_train_samples"
28
- - 1000
29
  - "--per_device_train_batch_size"
30
  - 32
31
  - "--per_device_eval_batch_size"
 
25
  - "--num_train_epochs"
26
  - 1
27
  - "--max_train_samples"
28
+ - 200000
29
  - "--per_device_train_batch_size"
30
  - 32
31
  - "--per_device_eval_batch_size"