finetune-indoMMLU-Merak-7B-v1
LoRA: r=8, lora_alpha=16, lora_dropout=0.05
learning_rate = 2e-4, lr_scheduler = "cosine", max_seq_length = 2048
finetune-indoMMLU-Merak-7B-v1
LoRA: r=8, lora_alpha=16, lora_dropout=0.05
learning_rate = 2e-4, lr_scheduler = "cosine", max_seq_length = 2048