Save model at global step 720
Browse files- config.yaml +7 -5
- data.pt +2 -2
- extra_state_world_size_4_rank_0.pt +1 -1
- extra_state_world_size_4_rank_1.pt +1 -1
- extra_state_world_size_4_rank_2.pt +1 -1
- extra_state_world_size_4_rank_3.pt +1 -1
- model_world_size_4_rank_0.pt +1 -1
- model_world_size_4_rank_1.pt +1 -1
- model_world_size_4_rank_2.pt +1 -1
- model_world_size_4_rank_3.pt +1 -1
- optim_world_size_4_rank_0.pt +1 -1
- optim_world_size_4_rank_1.pt +1 -1
- optim_world_size_4_rank_2.pt +1 -1
- optim_world_size_4_rank_3.pt +1 -1
config.yaml
CHANGED
@@ -23,6 +23,8 @@ actor_rollout_ref:
|
|
23 |
save_hf_repo_id: RyanYr/brm-numina-qwen2.5math-7B-base-lr5e-7constant-n4
|
24 |
actor:
|
25 |
loss: brm
|
|
|
|
|
26 |
qlearn:
|
27 |
use_replaybuffer: true
|
28 |
replaybuffer_size: 32
|
@@ -49,7 +51,7 @@ actor_rollout_ref:
|
|
49 |
lr_warmup_steps_ratio: 0
|
50 |
min_lr_ratio: null
|
51 |
warmup_style: constant
|
52 |
-
total_training_steps:
|
53 |
fsdp_config:
|
54 |
wrap_policy:
|
55 |
min_num_params: 0
|
@@ -105,7 +107,7 @@ trainer:
|
|
105 |
total_epochs: 1
|
106 |
total_training_steps: null
|
107 |
project_name: value-LLM
|
108 |
-
experiment_name: brm-numina-qwen2.5math-7B-
|
109 |
logger:
|
110 |
- wandb
|
111 |
val_generations_to_log_to_wandb: 0
|
@@ -122,8 +124,8 @@ trainer:
|
|
122 |
default_local_dir: ./BRM
|
123 |
hf_token: null
|
124 |
resume_from_hf:
|
125 |
-
enable:
|
126 |
-
hf_repo_id:
|
127 |
hf_token: null
|
128 |
-
revision:
|
129 |
val_before_train: true
|
|
|
23 |
save_hf_repo_id: RyanYr/brm-numina-qwen2.5math-7B-base-lr5e-7constant-n4
|
24 |
actor:
|
25 |
loss: brm
|
26 |
+
brm:
|
27 |
+
norm_factor: value
|
28 |
qlearn:
|
29 |
use_replaybuffer: true
|
30 |
replaybuffer_size: 32
|
|
|
51 |
lr_warmup_steps_ratio: 0
|
52 |
min_lr_ratio: null
|
53 |
warmup_style: constant
|
54 |
+
total_training_steps: 12496
|
55 |
fsdp_config:
|
56 |
wrap_policy:
|
57 |
min_num_params: 0
|
|
|
107 |
total_epochs: 1
|
108 |
total_training_steps: null
|
109 |
project_name: value-LLM
|
110 |
+
experiment_name: brm-numina-qwen2.5math-7B-base_lr5e-7constant-n4
|
111 |
logger:
|
112 |
- wandb
|
113 |
val_generations_to_log_to_wandb: 0
|
|
|
124 |
default_local_dir: ./BRM
|
125 |
hf_token: null
|
126 |
resume_from_hf:
|
127 |
+
enable: true
|
128 |
+
hf_repo_id: RyanYr/brm-numina-qwen2.5math-7B-base-lr5e-7constant-n4
|
129 |
hf_token: null
|
130 |
+
revision: 1932c649200c975a4b3ae08f1ed04561da3736ff
|
131 |
val_before_train: true
|
data.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7e06c97ae80d68e431f3b42a0b6a8cae5b3cd4f368b4c2f0104e5976dab2aa1b
|
3 |
+
size 6948621
|
extra_state_world_size_4_rank_0.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14696
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4e0ad982c07bf9ab5074316d3647fef623ced22c69dc94824767829323e69b18
|
3 |
size 14696
|
extra_state_world_size_4_rank_1.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14696
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e6bcb5e830f3de7d7b7d47b9d02fb6ef20ec1e56aee62b8d86920f98d2c62e11
|
3 |
size 14696
|
extra_state_world_size_4_rank_2.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14696
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2313dd0833d09e9e7226ac195cfa9c9eff43af1438d348b4516a5cfa8a594646
|
3 |
size 14696
|
extra_state_world_size_4_rank_3.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14696
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c627889bc59b4e9322f2962c4ca71a3e89ecf8c69e79376f4d7b55a4399020da
|
3 |
size 14696
|
model_world_size_4_rank_0.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 7615806874
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e2f22a44c952586ef9ba2a66f5cdca77e13cfbc5b999a186902b33ea8d6296f5
|
3 |
size 7615806874
|
model_world_size_4_rank_1.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 7615806874
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d1baa1d6621d6b7693d3c4d729dfc55ce81beec80eabebf7dac8525c2b47c0b0
|
3 |
size 7615806874
|
model_world_size_4_rank_2.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 7615806874
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:de5ae1ddcfadb352b291ad14c6ca944a9e013435c25be3ca4bbb03ac665bd4aa
|
3 |
size 7615806874
|
model_world_size_4_rank_3.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 7615806874
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5546c9b445a24ae8403788bedd513e7bbf30b93b37e9fedd8fa39863c6b7c0cd
|
3 |
size 7615806874
|
optim_world_size_4_rank_0.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15231260063
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ad8d87f72c4076e135c1df4afd3ae5b960365820389db7b24780a6dcc5773519
|
3 |
size 15231260063
|
optim_world_size_4_rank_1.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15231260063
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aa35095136ce833375921d9933ae977a522c1186be319ea3943d827715a2de66
|
3 |
size 15231260063
|
optim_world_size_4_rank_2.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15231260063
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:edbacffc89c994571bff28ab7ec76a3a586c30c9bedad7a929e5efba9d4f9c02
|
3 |
size 15231260063
|
optim_world_size_4_rank_3.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15231260063
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:90120a1a35bc21006c8e59bfe7442f692fffd89b3197c508f718b9969f387f17
|
3 |
size 15231260063
|