James Barry committed on
Commit
8e3ef58
·
1 Parent(s): d52d853

Create run_clm_flax.sh

Browse files
Files changed (1) hide show
  1. run_clm_flax.sh +22 -0
run_clm_flax.sh ADDED
@@ -0,0 +1,22 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
#!/bin/bash
#
# Launches the Flax causal-language-modelling example script
# (run_clm_flax.py) with --do_train and --do_eval for a GPT-2 type model,
# using the "oscar" dataset with the "unshuffled_deduplicated_ga" config.
#
# Usage: run from the directory that contains the `transformers` checkout:
#   ./run_clm_flax.sh
#
# The same directory (./irish-gpt2) is passed as --output_dir,
# --config_name and --tokenizer_name.
# NOTE(review): presumably a model config and tokenizer must already exist
# in that directory before this script is run -- confirm.
#
# The script's exit status is the exit status of the python launcher.

# Fail loudly on a misspelt variable name instead of expanding it to "".
set -u

# Language tag used to build the model directory name.
# Deliberately NOT called LANG: LANG is the POSIX locale variable, and when
# it is already exported by the caller, assigning "irish" to it would hand
# an invalid locale to the python child process (and to bash itself).
readonly MODEL_LANG="irish"

# Single directory shared by the output, config and tokenizer options.
readonly MODEL_DIR="./${MODEL_LANG}-gpt2"

# Options are kept in an array so each group can be commented and no
# backslash line continuations are needed.
train_args=(
  # Model, config and tokenizer locations.
  --output_dir="${MODEL_DIR}"
  --model_type="gpt2"
  --config_name="${MODEL_DIR}"
  --tokenizer_name="${MODEL_DIR}"

  # Dataset selection.
  --dataset_name="oscar"
  --dataset_config_name="unshuffled_deduplicated_ga"

  # Run both the training and the evaluation phases.
  --do_train
  --do_eval

  # Sequence length and per-device batch sizes.
  --block_size="512"
  --per_device_train_batch_size="64"
  --per_device_eval_batch_size="64"

  # Optimizer settings.
  --learning_rate="5e-3"
  --warmup_steps="1000"
  --adam_beta1="0.9"
  --adam_beta2="0.98"
  --weight_decay="0.01"

  # Existing contents of the output directory may be overwritten.
  --overwrite_output_dir
  --num_train_epochs="20"

  # Log, save and evaluate at the same step interval.
  --logging_steps="500"
  --save_steps="500"
  --eval_steps="500"
)

python transformers/examples/flax/language-modeling/run_clm_flax.py \
  "${train_args[@]}"