sakares committed on
Commit
e73a28c
·
1 Parent(s): 275ff1f

change saving and eval steps

Browse files
events.out.tfevents.1625628110.t1v-n-bf8aeee7-w-0.4744.3.v2 DELETED
Binary file (73.5 kB)
 
run.sh CHANGED
@@ -8,11 +8,18 @@ python3 run_mlm_flax.py \
8
  --dataset_name="oscar" \
9
  --dataset_config_name="unshuffled_deduplicated_th" \
10
  --max_seq_length="128" \
 
11
  --preprocessing_num_workers="64" \
12
  --per_device_train_batch_size="64" \
13
  --per_device_eval_batch_size="64" \
14
- --learning_rate="2e-4" \
15
  --warmup_steps="1000" \
16
  --overwrite_output_dir \
17
- --num_train_epochs="8" \
 
 
 
 
 
 
18
  --push_to_hub
 
8
  --dataset_name="oscar" \
9
  --dataset_config_name="unshuffled_deduplicated_th" \
10
  --max_seq_length="128" \
11
+ --weight_decay="0.01" \
12
  --preprocessing_num_workers="64" \
13
  --per_device_train_batch_size="64" \
14
  --per_device_eval_batch_size="64" \
15
+ --learning_rate="3e-4" \
16
  --warmup_steps="1000" \
17
  --overwrite_output_dir \
18
+ --num_train_epochs="10" \
19
+ --adam_beta1="0.9" \
20
+ --adam_beta2="0.98" \
21
+ --logging_steps="500" \
22
+ --save_steps="10000" \
23
+ --eval_steps="10000" \
24
+ --dtype="bfloat16" \
25
  --push_to_hub