End of training

Browse files

Files changed (5) hide show

README.md +32 -12
adapter_config.json +2 -2
adapter_model.safetensors +1 -1
tokenizer.json +1 -6
training_args.bin +1 -1

README.md CHANGED Viewed

@@ -18,7 +18,7 @@ should probably proofread and complete it, then remove this comment. -->
 This model is a fine-tuned version of [LoftQ/Meta-Llama-3-8B-Instruct-4bit-64rank](https://huggingface.co/LoftQ/Meta-Llama-3-8B-Instruct-4bit-64rank) on an unknown dataset.
 It achieves the following results on the evaluation set:
-- Loss: 1.0052
 ## Model description
@@ -43,22 +43,42 @@ The following hyperparameters were used during training:
 - seed: 42
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 - lr_scheduler_type: cosine
-- num_epochs: 10
 ### Training results
 | Training Loss | Epoch | Step | Validation Loss |
 |:-------------:|:-----:|:----:|:---------------:|
-| 2.3911        | 1.0   | 53   | 1.5495          |
-| 2.1963        | 2.0   | 106  | 1.2801          |
-| 2.1026        | 3.0   | 159  | 1.1126          |
-| 2.0158        | 4.0   | 212  | 1.0529          |
-| 1.9591        | 5.0   | 265  | 1.0237          |
-| 1.9115        | 6.0   | 318  | 1.0124          |
-| 1.8671        | 7.0   | 371  | 1.0084          |
-| 1.8498        | 8.0   | 424  | 1.0052          |
-| 1.831         | 9.0   | 477  | 1.0056          |
-| 1.8301        | 10.0  | 530  | 1.0052          |
 ### Framework versions

 This model is a fine-tuned version of [LoftQ/Meta-Llama-3-8B-Instruct-4bit-64rank](https://huggingface.co/LoftQ/Meta-Llama-3-8B-Instruct-4bit-64rank) on an unknown dataset.
 It achieves the following results on the evaluation set:
+- Loss: 0.8668
 ## Model description
 - seed: 42
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 - lr_scheduler_type: cosine
+- num_epochs: 30
 ### Training results
 | Training Loss | Epoch | Step | Validation Loss |
 |:-------------:|:-----:|:----:|:---------------:|
+| 2.3909        | 1.0   | 53   | 1.5473          |
+| 2.1937        | 2.0   | 106  | 1.2690          |
+| 2.0915        | 3.0   | 159  | 1.0977          |
+| 1.9927        | 4.0   | 212  | 1.0320          |
+| 1.9058        | 5.0   | 265  | 1.0046          |
+| 1.8032        | 6.0   | 318  | 0.9885          |
+| 1.6688        | 7.0   | 371  | 0.9754          |
+| 1.5215        | 8.0   | 424  | 0.9745          |
+| 1.3617        | 9.0   | 477  | 0.9640          |
+| 1.2074        | 10.0  | 530  | 0.9579          |
+| 1.0429        | 11.0  | 583  | 0.9441          |
+| 0.9013        | 12.0  | 636  | 0.9355          |
+| 0.7969        | 13.0  | 689  | 0.9278          |
+| 0.7092        | 14.0  | 742  | 0.9171          |
+| 0.6272        | 15.0  | 795  | 0.9070          |
+| 0.5688        | 16.0  | 848  | 0.9052          |
+| 0.5128        | 17.0  | 901  | 0.8942          |
+| 0.469         | 18.0  | 954  | 0.8894          |
+| 0.4294        | 19.0  | 1007 | 0.8871          |
+| 0.3953        | 20.0  | 1060 | 0.8807          |
+| 0.371         | 21.0  | 1113 | 0.8756          |
+| 0.3533        | 22.0  | 1166 | 0.8750          |
+| 0.3335        | 23.0  | 1219 | 0.8730          |
+| 0.3212        | 24.0  | 1272 | 0.8699          |
+| 0.3108        | 25.0  | 1325 | 0.8687          |
+| 0.3089        | 26.0  | 1378 | 0.8676          |
+| 0.3031        | 27.0  | 1431 | 0.8678          |
+| 0.3014        | 28.0  | 1484 | 0.8675          |
+| 0.3013        | 29.0  | 1537 | 0.8666          |
+| 0.2978        | 30.0  | 1590 | 0.8668          |
 ### Framework versions

adapter_config.json CHANGED Viewed

@@ -20,11 +20,11 @@
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
     "all-linear",
     "q_proj",
     "v_proj",
-    "k_proj",
-    "o_proj"
   ],
   "task_type": "CAUSAL_LM",
   "use_dora": false,

   "rank_pattern": {},
   "revision": null,
   "target_modules": [
+    "o_proj",
     "all-linear",
     "q_proj",
     "v_proj",
+    "k_proj"
   ],
   "task_type": "CAUSAL_LM",
   "use_dora": false,

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7c05061ab3d9f3f6e9aad31c1a0b96ae2e3da5468a73a43d2946b36d3f003082
 size 218138576

 version https://git-lfs.github.com/spec/v1
+oid sha256:6845c582b4cee8404cbc4538ef581d423cd0c2b23006af1e8ffb3735ff88fb8f
 size 218138576

tokenizer.json CHANGED Viewed

@@ -1,11 +1,6 @@
 {
   "version": "1.0",
-  "truncation": {
-    "direction": "Right",
-    "max_length": 1024,
-    "strategy": "LongestFirst",
-    "stride": 0
-  },
   "padding": null,
   "added_tokens": [
     {

 {
   "version": "1.0",
+  "truncation": null,
   "padding": null,
   "added_tokens": [
     {

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:508ef04d248d3ca361ccf90aea9f309f1084f6c4206885e043ab9e69ef1d759f
 size 5048

 version https://git-lfs.github.com/spec/v1
+oid sha256:144e158846b8b07db045419a88ebc514d6630d59c4798dfa0e4b5643632a50c1
 size 5048