train model
Browse files
- scripts/model.yaml +2 -2
scripts/model.yaml
CHANGED
@@ -110,8 +110,8 @@ eval:
|
|
110 |
# Optimizer-related arguments
|
111 |
optimizer:
|
112 |
# class_path: torch.optim.AdamW
|
113 |
-
|
114 |
-
class_path: bitsandbytes.optim.AdamW8bit
|
115 |
# class_path: bitsandbytes.optim.PagedAdamW8bit
|
116 |
|
117 |
init_args:
|
|
|
110 |
# Optimizer-related arguments
|
111 |
optimizer:
|
112 |
# class_path: torch.optim.AdamW
|
113 |
+
class_path: grokadamw.GrokAdamW
|
114 |
+
# class_path: bitsandbytes.optim.AdamW8bit
|
115 |
# class_path: bitsandbytes.optim.PagedAdamW8bit
|
116 |
|
117 |
init_args:
|