Training in progress, step 1984, checkpoint
Browse files
last-checkpoint/adapter_config.json
CHANGED
@@ -20,13 +20,13 @@
|
|
20 |
"rank_pattern": {},
|
21 |
"revision": null,
|
22 |
"target_modules": [
|
23 |
-
"
|
24 |
-
"q_proj",
|
25 |
-
"o_proj",
|
26 |
-
"gate_proj",
|
27 |
-
"v_proj",
|
28 |
"k_proj",
|
29 |
-
"
|
|
|
|
|
|
|
|
|
30 |
],
|
31 |
"task_type": "CAUSAL_LM",
|
32 |
"use_dora": false,
|
|
|
20 |
"rank_pattern": {},
|
21 |
"revision": null,
|
22 |
"target_modules": [
|
23 |
+
"down_proj",
|
|
|
|
|
|
|
|
|
24 |
"k_proj",
|
25 |
+
"v_proj",
|
26 |
+
"o_proj",
|
27 |
+
"q_proj",
|
28 |
+
"up_proj",
|
29 |
+
"gate_proj"
|
30 |
],
|
31 |
"task_type": "CAUSAL_LM",
|
32 |
"use_dora": false,
|
last-checkpoint/adapter_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 232169792
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0a8df42a2c05cead50bc256fc821227a1c685d9421a56e6c6c225f8a79d954a0
|
3 |
size 232169792
|
last-checkpoint/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 117446154
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9fd201181b6924563f49d1bab056ca8efb3154ceec6ba4e87c992e8c957190e6
|
3 |
size 117446154
|
last-checkpoint/rng_state.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14244
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eaee5b57bceca0a9dd281cd9ac702d8c230d90e4a749a0f30fcacc9028ab8d66
|
3 |
size 14244
|
last-checkpoint/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1064
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4bd095dae7ffbf005aa92a66a4077dd3d117f3f949f0ac377ea50e1a29fda449
|
3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
@@ -1,9 +1,9 @@
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
-
"epoch": 2.
|
5 |
"eval_steps": 500,
|
6 |
-
"global_step":
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
@@ -35647,6 +35647,78 @@
|
|
35647 |
"rewards/margins": 0.32313817739486694,
|
35648 |
"rewards/rejected": -0.3992757499217987,
|
35649 |
"step": 1980
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
35650 |
}
|
35651 |
],
|
35652 |
"logging_steps": 1,
|
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
+
"epoch": 2.870787659622556,
|
5 |
"eval_steps": 500,
|
6 |
+
"global_step": 1984,
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
|
|
35647 |
"rewards/margins": 0.32313817739486694,
|
35648 |
"rewards/rejected": -0.3992757499217987,
|
35649 |
"step": 1980
|
35650 |
+
},
|
35651 |
+
{
|
35652 |
+
"epoch": 2.8664481862357327,
|
35653 |
+
"grad_norm": 0.5579022169113159,
|
35654 |
+
"learning_rate": 2.4259573945100144e-07,
|
35655 |
+
"log_odds_chosen": 2.1421194076538086,
|
35656 |
+
"log_odds_ratio": -0.5158656239509583,
|
35657 |
+
"logits/chosen": -1.849534511566162,
|
35658 |
+
"logits/rejected": -1.6556165218353271,
|
35659 |
+
"logps/chosen": -0.8209269642829895,
|
35660 |
+
"logps/rejected": -2.6318562030792236,
|
35661 |
+
"loss": 1.0822,
|
35662 |
+
"nll_loss": 1.0306111574172974,
|
35663 |
+
"rewards/accuracies": 0.65625,
|
35664 |
+
"rewards/chosen": -0.08209270238876343,
|
35665 |
+
"rewards/margins": 0.18109291791915894,
|
35666 |
+
"rewards/rejected": -0.26318562030792236,
|
35667 |
+
"step": 1981
|
35668 |
+
},
|
35669 |
+
{
|
35670 |
+
"epoch": 2.867894677364674,
|
35671 |
+
"grad_norm": 0.5723074674606323,
|
35672 |
+
"learning_rate": 2.3735889697382996e-07,
|
35673 |
+
"log_odds_chosen": 3.1368532180786133,
|
35674 |
+
"log_odds_ratio": -0.4154900312423706,
|
35675 |
+
"logits/chosen": -1.7287541627883911,
|
35676 |
+
"logits/rejected": -1.3899829387664795,
|
35677 |
+
"logps/chosen": -0.7958812713623047,
|
35678 |
+
"logps/rejected": -3.4790496826171875,
|
35679 |
+
"loss": 0.9691,
|
35680 |
+
"nll_loss": 0.9275829792022705,
|
35681 |
+
"rewards/accuracies": 0.8125,
|
35682 |
+
"rewards/chosen": -0.07958813011646271,
|
35683 |
+
"rewards/margins": 0.2683168351650238,
|
35684 |
+
"rewards/rejected": -0.3479049801826477,
|
35685 |
+
"step": 1982
|
35686 |
+
},
|
35687 |
+
{
|
35688 |
+
"epoch": 2.869341168493615,
|
35689 |
+
"grad_norm": 0.5695856809616089,
|
35690 |
+
"learning_rate": 2.3217892643381256e-07,
|
35691 |
+
"log_odds_chosen": 1.77284574508667,
|
35692 |
+
"log_odds_ratio": -0.4833868145942688,
|
35693 |
+
"logits/chosen": -1.7728116512298584,
|
35694 |
+
"logits/rejected": -1.57659113407135,
|
35695 |
+
"logps/chosen": -0.7696139216423035,
|
35696 |
+
"logps/rejected": -2.138911008834839,
|
35697 |
+
"loss": 1.0594,
|
35698 |
+
"nll_loss": 1.0110141038894653,
|
35699 |
+
"rewards/accuracies": 0.703125,
|
35700 |
+
"rewards/chosen": -0.07696139067411423,
|
35701 |
+
"rewards/margins": 0.1369297057390213,
|
35702 |
+
"rewards/rejected": -0.21389110386371613,
|
35703 |
+
"step": 1983
|
35704 |
+
},
|
35705 |
+
{
|
35706 |
+
"epoch": 2.870787659622556,
|
35707 |
+
"grad_norm": 0.5508972406387329,
|
35708 |
+
"learning_rate": 2.2705583972770783e-07,
|
35709 |
+
"log_odds_chosen": 3.5796892642974854,
|
35710 |
+
"log_odds_ratio": -0.39506861567497253,
|
35711 |
+
"logits/chosen": -1.8140000104904175,
|
35712 |
+
"logits/rejected": -1.4643973112106323,
|
35713 |
+
"logps/chosen": -0.8209943771362305,
|
35714 |
+
"logps/rejected": -3.885220527648926,
|
35715 |
+
"loss": 1.0249,
|
35716 |
+
"nll_loss": 0.9854146242141724,
|
35717 |
+
"rewards/accuracies": 0.765625,
|
35718 |
+
"rewards/chosen": -0.08209944516420364,
|
35719 |
+
"rewards/margins": 0.3064225912094116,
|
35720 |
+
"rewards/rejected": -0.38852202892303467,
|
35721 |
+
"step": 1984
|
35722 |
}
|
35723 |
],
|
35724 |
"logging_steps": 1,
|
last-checkpoint/training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5496
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:068f9f17f37a0b6c5693d6feb99bb88153b523b8cdd47d5dc7a2c2ceae6f4d45
|
3 |
size 5496
|