archit11 committed on
Commit
902242a
1 Parent(s): 81b7c42

End of training

Browse files
README.md CHANGED
@@ -20,9 +20,9 @@ It achieves the following results on the evaluation set:
20
  - eval_precision: 0.2362
21
  - eval_recall: 0.1921
22
  - eval_f1: 0.1788
23
- - eval_runtime: 1016.7587
24
- - eval_samples_per_second: 4.878
25
- - eval_steps_per_second: 1.22
26
  - step: 0
27
 
28
  ## Model description
 
20
  - eval_precision: 0.2362
21
  - eval_recall: 0.1921
22
  - eval_f1: 0.1788
23
+ - eval_runtime: 1015.705
24
+ - eval_samples_per_second: 4.883
25
+ - eval_steps_per_second: 1.221
26
  - step: 0
27
 
28
  ## Model description
all_results.json CHANGED
@@ -4,7 +4,7 @@
4
  "eval_loss": 2.501384973526001,
5
  "eval_precision": 0.23617900665745273,
6
  "eval_recall": 0.19213899602329576,
7
- "eval_runtime": 1016.7587,
8
- "eval_samples_per_second": 4.878,
9
- "eval_steps_per_second": 1.22
10
  }
 
4
  "eval_loss": 2.501384973526001,
5
  "eval_precision": 0.23617900665745273,
6
  "eval_recall": 0.19213899602329576,
7
+ "eval_runtime": 1015.705,
8
+ "eval_samples_per_second": 4.883,
9
+ "eval_steps_per_second": 1.221
10
  }
runs/Apr02_15-59-10_31ea9200f14f/events.out.tfevents.1712077121.31ea9200f14f.34.1 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:79f0bf8f4b81093e75329c3cd07555cff7a3506e67d0e9d0d0e23cdd32b61b4f
3
- size 486
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3b9597853b5923576c4899cf6fbfd9bd79b43da01554e0650ab24d5c4ed99a05
3
+ size 884
test_results.json CHANGED
@@ -4,7 +4,7 @@
4
  "eval_loss": 2.501384973526001,
5
  "eval_precision": 0.23617900665745273,
6
  "eval_recall": 0.19213899602329576,
7
- "eval_runtime": 1016.7587,
8
- "eval_samples_per_second": 4.878,
9
- "eval_steps_per_second": 1.22
10
  }
 
4
  "eval_loss": 2.501384973526001,
5
  "eval_precision": 0.23617900665745273,
6
  "eval_recall": 0.19213899602329576,
7
+ "eval_runtime": 1015.705,
8
+ "eval_samples_per_second": 4.883,
9
+ "eval_steps_per_second": 1.221
10
  }
trainer_state.json ADDED
@@ -0,0 +1,43 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": null,
3
+ "best_model_checkpoint": null,
4
+ "epoch": null,
5
+ "eval_steps": 500,
6
+ "global_step": 0,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "eval_accuracy": 0.225,
13
+ "eval_f1": 0.17882905387355633,
14
+ "eval_loss": 2.501384973526001,
15
+ "eval_precision": 0.23617900665745273,
16
+ "eval_recall": 0.19213899602329576,
17
+ "eval_runtime": 1016.7587,
18
+ "eval_samples_per_second": 4.878,
19
+ "eval_steps_per_second": 1.22,
20
+ "step": 0
21
+ },
22
+ {
23
+ "eval_accuracy": 0.225,
24
+ "eval_f1": 0.17882905387355633,
25
+ "eval_loss": 2.501384973526001,
26
+ "eval_precision": 0.23617900665745273,
27
+ "eval_recall": 0.19213899602329576,
28
+ "eval_runtime": 1015.705,
29
+ "eval_samples_per_second": 4.883,
30
+ "eval_steps_per_second": 1.221,
31
+ "step": 0
32
+ }
33
+ ],
34
+ "logging_steps": 500,
35
+ "max_steps": 0,
36
+ "num_input_tokens_seen": 0,
37
+ "num_train_epochs": 0,
38
+ "save_steps": 500,
39
+ "total_flos": 0,
40
+ "train_batch_size": null,
41
+ "trial_name": null,
42
+ "trial_params": null
43
+ }