thobauma committed on
Commit
feae149
·
verified ·
1 Parent(s): b31f783

Model save

Browse files
README.md CHANGED
@@ -1,7 +1,7 @@
1
  ---
2
  tags:
3
  - trl
4
- - dpo
5
  - generated_from_trainer
6
  model-index:
7
  - name: opt-350m
 
1
  ---
2
  tags:
3
  - trl
4
+ - reward-trainer
5
  - generated_from_trainer
6
  model-index:
7
  - name: opt-350m
all_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 1.0,
3
- "train_loss": 0.8458248774210612,
4
- "train_runtime": 38.2645,
5
  "train_samples": 42,
6
- "train_samples_per_second": 1.098,
7
- "train_steps_per_second": 0.078
8
  }
 
1
  {
2
  "epoch": 1.0,
3
+ "train_loss": 0.8802837530771891,
4
+ "train_runtime": 29.5366,
5
  "train_samples": 42,
6
+ "train_samples_per_second": 1.422,
7
+ "train_steps_per_second": 0.102
8
  }
config.json CHANGED
@@ -4,7 +4,7 @@
4
  "activation_dropout": 0.0,
5
  "activation_function": "relu",
6
  "architectures": [
7
- "OPTForCausalLM"
8
  ],
9
  "attention_dropout": 0.0,
10
  "bos_token_id": 2,
@@ -14,7 +14,13 @@
14
  "eos_token_id": 2,
15
  "ffn_dim": 4096,
16
  "hidden_size": 1024,
 
 
 
17
  "init_std": 0.02,
 
 
 
18
  "layer_norm_elementwise_affine": true,
19
  "layerdrop": 0.0,
20
  "max_position_embeddings": 2048,
 
4
  "activation_dropout": 0.0,
5
  "activation_function": "relu",
6
  "architectures": [
7
+ "OPTForSequenceClassification"
8
  ],
9
  "attention_dropout": 0.0,
10
  "bos_token_id": 2,
 
14
  "eos_token_id": 2,
15
  "ffn_dim": 4096,
16
  "hidden_size": 1024,
17
+ "id2label": {
18
+ "0": "LABEL_0"
19
+ },
20
  "init_std": 0.02,
21
+ "label2id": {
22
+ "LABEL_0": 0
23
+ },
24
  "layer_norm_elementwise_affine": true,
25
  "layerdrop": 0.0,
26
  "max_position_embeddings": 2048,
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:96757bee906119aac800b9f547e51e7c5ce2ccce2d4097f0dc0f59a533e2b3f6
3
- size 1324830880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5c806859e833e81d5b6cdd2855af6e39e3c4ee38e323a169bba6278af096a35c
3
+ size 1324833016
runs/Apr25_11-53-16_MacBook-Pro-3.local/events.out.tfevents.1714038821.MacBook-Pro-3.local.39724.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cba84c12cfbf3327a8119c1970eb529c48384b8c921e428486c478851eba8f4a
3
+ size 4790
runs/Apr25_11-56-04_MacBook-Pro-3.local/events.out.tfevents.1714038969.MacBook-Pro-3.local.42437.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:861b865147a18089a72d026b052ad42c9bf1d2a2c3a86af2e2ed99fad9d3961d
3
+ size 4790
runs/Apr25_12-02-11_MacBook-Pro-3.local/events.out.tfevents.1714039360.MacBook-Pro-3.local.48181.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:38890d11aba1534b849e52d5c9293ded553dd4ef7d1907ba01e2597829968485
3
+ size 5138
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 1.0,
3
- "train_loss": 0.8458248774210612,
4
- "train_runtime": 38.2645,
5
  "train_samples": 42,
6
- "train_samples_per_second": 1.098,
7
- "train_steps_per_second": 0.078
8
  }
 
1
  {
2
  "epoch": 1.0,
3
+ "train_loss": 0.8802837530771891,
4
+ "train_runtime": 29.5366,
5
  "train_samples": 42,
6
+ "train_samples_per_second": 1.422,
7
+ "train_steps_per_second": 0.102
8
  }
trainer_state.json CHANGED
@@ -8,29 +8,14 @@
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
- {
12
- "epoch": 0.33,
13
- "grad_norm": 10.981945037841797,
14
- "learning_rate": 5e-07,
15
- "logits/chosen": -0.6707152128219604,
16
- "logits/rejected": -0.8389236927032471,
17
- "logps/chosen": -465.56787109375,
18
- "logps/rejected": -1116.6866455078125,
19
- "loss": 1.1531,
20
- "rewards/accuracies": 0.4375,
21
- "rewards/chosen": 0.2850288152694702,
22
- "rewards/margins": 0.3632635474205017,
23
- "rewards/rejected": -0.07823469489812851,
24
- "step": 1
25
- },
26
  {
27
  "epoch": 1.0,
28
  "step": 3,
29
  "total_flos": 0.0,
30
- "train_loss": 0.8458248774210612,
31
- "train_runtime": 38.2645,
32
- "train_samples_per_second": 1.098,
33
- "train_steps_per_second": 0.078
34
  }
35
  ],
36
  "logging_steps": 10,
 
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
11
  {
12
  "epoch": 1.0,
13
  "step": 3,
14
  "total_flos": 0.0,
15
+ "train_loss": 0.8802837530771891,
16
+ "train_runtime": 29.5366,
17
+ "train_samples_per_second": 1.422,
18
+ "train_steps_per_second": 0.102
19
  }
20
  ],
21
  "logging_steps": 10,
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f3f7f97f31ef1eb375dd9b7308555e225d5387fb7fe51d12f7410ebb4a4eb480
3
- size 5048
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:266c603d9bd4ca09eb2054cb68cd0b1c9bc9c5d6f6cebd43a95fe484aef40d38
3
+ size 4920