neihc committed on
Commit
ddd02d3
·
verified ·
1 Parent(s): cb80547

neihc/miniCPM_finetune

Browse files
README.md CHANGED
@@ -38,7 +38,7 @@ The following hyperparameters were used during training:
38
  - seed: 42
39
  - gradient_accumulation_steps: 4
40
  - total_train_batch_size: 16
41
- - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
42
  - lr_scheduler_type: linear
43
  - num_epochs: 2
44
  - mixed_precision_training: Native AMP
@@ -50,7 +50,7 @@ The following hyperparameters were used during training:
50
  ### Framework versions
51
 
52
  - PEFT 0.14.0
53
- - Transformers 4.44.2
54
- - Pytorch 2.4.1+cu121
55
- - Datasets 3.2.0
56
- - Tokenizers 0.19.1
 
38
  - seed: 42
39
  - gradient_accumulation_steps: 4
40
  - total_train_batch_size: 16
41
+ - optimizer: Use adamw_torch with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments
42
  - lr_scheduler_type: linear
43
  - num_epochs: 2
44
  - mixed_precision_training: Native AMP
 
50
  ### Framework versions
51
 
52
  - PEFT 0.14.0
53
+ - Transformers 4.46.3
54
+ - Pytorch 2.4.0
55
+ - Datasets 3.1.0
56
+ - Tokenizers 0.20.3
adapter_config.json CHANGED
@@ -24,8 +24,8 @@
24
  "revision": null,
25
  "target_modules": [
26
  "k_proj",
27
- "o_proj",
28
  "v_proj",
 
29
  "q_proj"
30
  ],
31
  "task_type": "CAUSAL_LM",
 
24
  "revision": null,
25
  "target_modules": [
26
  "k_proj",
 
27
  "v_proj",
28
+ "o_proj",
29
  "q_proj"
30
  ],
31
  "task_type": "CAUSAL_LM",
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:afef72b72afc5354303e27cf7e95dbad8f810252e65efc312b98d71041d991a9
3
  size 34134464
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9a0834b9e719b37ac8bff5f64d662e35aa2da35d7dfb2cb8a16e2e7d73ff2c26
3
  size 34134464
runs/Jan10_01-58-56_384bedf9702e/events.out.tfevents.1736474337.384bedf9702e.23.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7e3ea6032380286d354c54044848b7fdfa4cf80d90890c33395eca6b96a1b022
3
+ size 7706
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ad5d9a6efb8a5501b5ef31c7e1843680f6643f6a146aadf6c7195ab5d18eb253
3
- size 5176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3373e538f6d2b1bd17825aa39f4c2e616649fe72227a0b0da8f0c778261f95fa
3
+ size 5240