greatakela committed on
Commit
2cdc6c9
1 Parent(s): 661293f

greatakela/mistral_instruct_classify10k_adapters

Browse files
README.md CHANGED
@@ -1,8 +1,13 @@
1
  ---
2
  license: apache-2.0
3
- base_model: mistralai/Mistral-7B-Instruct-v0.1
4
  tags:
 
 
5
  - generated_from_trainer
 
 
 
6
  model-index:
7
  - name: mistral_instruct_classify10k
8
  results: []
@@ -13,9 +18,9 @@ should probably proofread and complete it, then remove this comment. -->
13
 
14
  # mistral_instruct_classify10k
15
 
16
- This model is a fine-tuned version of [mistralai/Mistral-7B-Instruct-v0.1](https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.1) on an unknown dataset.
17
  It achieves the following results on the evaluation set:
18
- - Loss: 0.6008
19
 
20
  ## Model description
21
 
@@ -47,16 +52,17 @@ The following hyperparameters were used during training:
47
 
48
  | Training Loss | Epoch | Step | Validation Loss |
49
  |:-------------:|:-----:|:----:|:---------------:|
50
- | 0.7492 | 0.04 | 48 | 0.7265 |
51
- | 0.6609 | 1.04 | 96 | 0.6719 |
52
- | 0.5933 | 2.04 | 144 | 0.6383 |
53
- | 0.5361 | 3.04 | 192 | 0.6149 |
54
- | 0.475 | 4.04 | 240 | 0.6008 |
55
 
56
 
57
  ### Framework versions
58
 
59
- - Transformers 4.35.2
60
- - Pytorch 2.1.1+cu121
61
- - Datasets 2.15.0
62
- - Tokenizers 0.15.0
 
 
1
  ---
2
  license: apache-2.0
3
+ library_name: peft
4
  tags:
5
+ - trl
6
+ - sft
7
  - generated_from_trainer
8
+ datasets:
9
+ - generator
10
+ base_model: mistralai/Mistral-7B-Instruct-v0.1
11
  model-index:
12
  - name: mistral_instruct_classify10k
13
  results: []
 
18
 
19
  # mistral_instruct_classify10k
20
 
21
+ This model is a fine-tuned version of [mistralai/Mistral-7B-Instruct-v0.1](https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.1) on the generator dataset.
22
  It achieves the following results on the evaluation set:
23
+ - Loss: 0.6021
24
 
25
  ## Model description
26
 
 
52
 
53
  | Training Loss | Epoch | Step | Validation Loss |
54
  |:-------------:|:-----:|:----:|:---------------:|
55
+ | 0.7548 | 1.0 | 49 | 0.7252 |
56
+ | 0.6684 | 2.0 | 98 | 0.6725 |
57
+ | 0.5849 | 3.0 | 147 | 0.6398 |
58
+ | 0.5236 | 4.0 | 196 | 0.6159 |
59
+ | 0.4733 | 5.0 | 245 | 0.6021 |
60
 
61
 
62
  ### Framework versions
63
 
64
+ - PEFT 0.8.2
65
+ - Transformers 4.37.2
66
+ - Pytorch 2.2.0+cu121
67
+ - Datasets 2.17.0
68
+ - Tokenizers 0.15.2
adapter_config.json CHANGED
@@ -19,10 +19,11 @@
19
  "rank_pattern": {},
20
  "revision": null,
21
  "target_modules": [
22
- "k_proj",
23
- "o_proj",
24
  "v_proj",
25
- "q_proj"
 
 
26
  ],
27
- "task_type": "CAUSAL_LM"
 
28
  }
 
19
  "rank_pattern": {},
20
  "revision": null,
21
  "target_modules": [
 
 
22
  "v_proj",
23
+ "q_proj",
24
+ "o_proj",
25
+ "k_proj"
26
  ],
27
+ "task_type": "CAUSAL_LM",
28
+ "use_rslora": false
29
  }
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:18d9cfb741585d64078882e23c778fc87493090e3b89251b89814d8e0a8a4dc8
3
  size 218138576
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:170fe642770cdfddeb9c5b302a20e1706ac5e4b2d6ff86f8bdb1eac6d989e862
3
  size 218138576
tokenizer.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dadfd56d766715c61d2ef780a525ab43b8e6da4de6865bda3d95fdef5e134055
3
+ size 493443
tokenizer_config.json CHANGED
@@ -1,4 +1,6 @@
1
  {
 
 
2
  "added_tokens_decoder": {
3
  "0": {
4
  "content": "<unk>",
@@ -37,5 +39,5 @@
37
  "spaces_between_special_tokens": false,
38
  "tokenizer_class": "LlamaTokenizer",
39
  "unk_token": "<unk>",
40
- "use_default_system_prompt": true
41
  }
 
1
  {
2
+ "add_bos_token": true,
3
+ "add_eos_token": false,
4
  "added_tokens_decoder": {
5
  "0": {
6
  "content": "<unk>",
 
39
  "spaces_between_special_tokens": false,
40
  "tokenizer_class": "LlamaTokenizer",
41
  "unk_token": "<unk>",
42
+ "use_default_system_prompt": false
43
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0460fd214e311723889719080cc888269aeda57150e4224ba7f702b5ab6dcb77
3
- size 4600
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2647418726458fe8c42ad91926ebc4d538d170a90a91458aab481d6c4c5a44f8
3
+ size 4728