RyanYr committed on
Commit
0d4d417
·
verified ·
1 Parent(s): 1932c64

Save model at global step 720

Browse files
config.yaml CHANGED
@@ -23,6 +23,8 @@ actor_rollout_ref:
23
  save_hf_repo_id: RyanYr/brm-numina-qwen2.5math-7B-base-lr5e-7constant-n4
24
  actor:
25
  loss: brm
 
 
26
  qlearn:
27
  use_replaybuffer: true
28
  replaybuffer_size: 32
@@ -49,7 +51,7 @@ actor_rollout_ref:
49
  lr_warmup_steps_ratio: 0
50
  min_lr_ratio: null
51
  warmup_style: constant
52
- total_training_steps: 3998
53
  fsdp_config:
54
  wrap_policy:
55
  min_num_params: 0
@@ -105,7 +107,7 @@ trainer:
105
  total_epochs: 1
106
  total_training_steps: null
107
  project_name: value-LLM
108
- experiment_name: brm-numina-qwen2.5math-7B-base_5e-7constant-n4
109
  logger:
110
  - wandb
111
  val_generations_to_log_to_wandb: 0
@@ -122,8 +124,8 @@ trainer:
122
  default_local_dir: ./BRM
123
  hf_token: null
124
  resume_from_hf:
125
- enable: false
126
- hf_repo_id: null
127
  hf_token: null
128
- revision: main
129
  val_before_train: true
 
23
  save_hf_repo_id: RyanYr/brm-numina-qwen2.5math-7B-base-lr5e-7constant-n4
24
  actor:
25
  loss: brm
26
+ brm:
27
+ norm_factor: value
28
  qlearn:
29
  use_replaybuffer: true
30
  replaybuffer_size: 32
 
51
  lr_warmup_steps_ratio: 0
52
  min_lr_ratio: null
53
  warmup_style: constant
54
+ total_training_steps: 12496
55
  fsdp_config:
56
  wrap_policy:
57
  min_num_params: 0
 
107
  total_epochs: 1
108
  total_training_steps: null
109
  project_name: value-LLM
110
+ experiment_name: brm-numina-qwen2.5math-7B-base_lr5e-7constant-n4
111
  logger:
112
  - wandb
113
  val_generations_to_log_to_wandb: 0
 
124
  default_local_dir: ./BRM
125
  hf_token: null
126
  resume_from_hf:
127
+ enable: true
128
+ hf_repo_id: RyanYr/brm-numina-qwen2.5math-7B-base-lr5e-7constant-n4
129
  hf_token: null
130
+ revision: 1932c649200c975a4b3ae08f1ed04561da3736ff
131
  val_before_train: true
data.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6f6e23c1ad350476914ba4285d3733035a70ac54e39cb86079add44aa8cad0ce
3
- size 6948557
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7e06c97ae80d68e431f3b42a0b6a8cae5b3cd4f368b4c2f0104e5976dab2aa1b
3
+ size 6948621
extra_state_world_size_4_rank_0.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7c34819473441050fa7876c02b91dc7652f994402a111346dae6c5690f2cf549
3
  size 14696
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4e0ad982c07bf9ab5074316d3647fef623ced22c69dc94824767829323e69b18
3
  size 14696
extra_state_world_size_4_rank_1.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d67e783ef060901a891e0213cb6fd6aad1c73c2cdffbcb1b37e50d2acef8eff0
3
  size 14696
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e6bcb5e830f3de7d7b7d47b9d02fb6ef20ec1e56aee62b8d86920f98d2c62e11
3
  size 14696
extra_state_world_size_4_rank_2.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:43369f73006b31692008bba580e91790d3c6d9d0f0d7962faab066f167dcb084
3
  size 14696
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2313dd0833d09e9e7226ac195cfa9c9eff43af1438d348b4516a5cfa8a594646
3
  size 14696
extra_state_world_size_4_rank_3.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:631e9be36c7107c8b025efa187602f585a272953dca1d54887a29a56fdc79edb
3
  size 14696
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c627889bc59b4e9322f2962c4ca71a3e89ecf8c69e79376f4d7b55a4399020da
3
  size 14696
model_world_size_4_rank_0.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e7434ee5a727cc905731ceeb14ac3b9b83c618f7a0d1b6b1e3fd29c3a92d880f
3
  size 7615806874
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e2f22a44c952586ef9ba2a66f5cdca77e13cfbc5b999a186902b33ea8d6296f5
3
  size 7615806874
model_world_size_4_rank_1.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:19e39888800dc32d924d5edfa8091963bc5acc20877e14b3a05742d73fc20b3f
3
  size 7615806874
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d1baa1d6621d6b7693d3c4d729dfc55ce81beec80eabebf7dac8525c2b47c0b0
3
  size 7615806874
model_world_size_4_rank_2.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c42fe46da957f068bdd7ef397ddc7010afe53a7694aa698efab5c3ef1278468c
3
  size 7615806874
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:de5ae1ddcfadb352b291ad14c6ca944a9e013435c25be3ca4bbb03ac665bd4aa
3
  size 7615806874
model_world_size_4_rank_3.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a65b14beece8bcf85a8df9805abc898e25c4c45014340bc8155a9aa46f1d9f89
3
  size 7615806874
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5546c9b445a24ae8403788bedd513e7bbf30b93b37e9fedd8fa39863c6b7c0cd
3
  size 7615806874
optim_world_size_4_rank_0.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d1ec4a49a8728456551f4af1db70a254abead40c248fee8c6649a3895a63e9f1
3
  size 15231260063
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ad8d87f72c4076e135c1df4afd3ae5b960365820389db7b24780a6dcc5773519
3
  size 15231260063
optim_world_size_4_rank_1.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d309e8207cc2989fad90f9025e30015a8196e79d8040f5f46808dc42b8da20db
3
  size 15231260063
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aa35095136ce833375921d9933ae977a522c1186be319ea3943d827715a2de66
3
  size 15231260063
optim_world_size_4_rank_2.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a51e6b767f828f1f6be76e06e7cbcb699d0c333addf5aec413a51d3ca02184ad
3
  size 15231260063
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:edbacffc89c994571bff28ab7ec76a3a586c30c9bedad7a929e5efba9d4f9c02
3
  size 15231260063
optim_world_size_4_rank_3.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8296a13d4b4881b4dfffa59c0515d01193d6ff758e9e9a194866d063899fced5
3
  size 15231260063
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:90120a1a35bc21006c8e59bfe7442f692fffd89b3197c508f718b9969f387f17
3
  size 15231260063