neihc committed on
Commit
8045cc0
·
verified ·
1 Parent(s): d4ab8d4

neihc/miniCPM_finetune

Browse files
README.md CHANGED
@@ -38,7 +38,7 @@ The following hyperparameters were used during training:
38
  - seed: 42
39
  - gradient_accumulation_steps: 4
40
  - total_train_batch_size: 16
41
- - optimizer: Use adamw_torch with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments
42
  - lr_scheduler_type: linear
43
  - num_epochs: 2
44
  - mixed_precision_training: Native AMP
@@ -50,7 +50,7 @@ The following hyperparameters were used during training:
50
  ### Framework versions
51
 
52
  - PEFT 0.14.0
53
- - Transformers 4.46.3
54
- - Pytorch 2.4.0
55
- - Datasets 3.1.0
56
- - Tokenizers 0.20.3
 
38
  - seed: 42
39
  - gradient_accumulation_steps: 4
40
  - total_train_batch_size: 16
41
+ - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
42
  - lr_scheduler_type: linear
43
  - num_epochs: 2
44
  - mixed_precision_training: Native AMP
 
50
  ### Framework versions
51
 
52
  - PEFT 0.14.0
53
+ - Transformers 4.44.2
54
+ - Pytorch 2.4.1+cu121
55
+ - Datasets 3.2.0
56
+ - Tokenizers 0.19.1
adapter_config.json CHANGED
@@ -23,9 +23,9 @@
23
  "rank_pattern": {},
24
  "revision": null,
25
  "target_modules": [
26
- "v_proj",
27
- "o_proj",
28
  "q_proj",
 
 
29
  "k_proj"
30
  ],
31
  "task_type": "CAUSAL_LM",
 
23
  "rank_pattern": {},
24
  "revision": null,
25
  "target_modules": [
 
 
26
  "q_proj",
27
+ "o_proj",
28
+ "v_proj",
29
  "k_proj"
30
  ],
31
  "task_type": "CAUSAL_LM",
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:16439eca64be48994506fa9e362a71e1e694c8f6eb935be905692c466f408334
3
  size 34134464
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a8b2a9e30f1cd2f51ba056f6db8adb4b830d7e954bf6293cdfd8bd25ccf511ea
3
  size 34134464
runs/Jan13_17-07-07_e7d85d5b8601/events.out.tfevents.1736788028.e7d85d5b8601.21.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:18663f1d9f565e8a75cae0b283018a6067b20819c3b9fda4b3b5ee1a8a2517bb
3
+ size 7566
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b266e8526ff0f51e736a7e149fad82bfcbabdb104d4ead74c30f1bbe4de68cc4
3
- size 5240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9de4a5cc4f99fbba88d135806133d238a8045c0eca2487bb591f056acd9a50b5
3
+ size 5176