lfhe committed on
Commit
2c6683b
·
1 Parent(s): 067e569
adapter_config.json CHANGED
@@ -10,18 +10,20 @@
10
  "layers_pattern": null,
11
  "layers_to_transform": null,
12
  "loftq_config": {},
13
- "lora_alpha": 64,
14
  "lora_dropout": 0.05,
15
  "megatron_config": null,
16
  "megatron_core": "megatron.core",
17
  "modules_to_save": null,
18
  "peft_type": "LORA",
19
- "r": 32,
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
 
 
23
  "o_proj",
24
- "qkv_proj"
25
  ],
26
  "task_type": "CAUSAL_LM",
27
  "use_dora": false,
 
10
  "layers_pattern": null,
11
  "layers_to_transform": null,
12
  "loftq_config": {},
13
+ "lora_alpha": 512,
14
  "lora_dropout": 0.05,
15
  "megatron_config": null,
16
  "megatron_core": "megatron.core",
17
  "modules_to_save": null,
18
  "peft_type": "LORA",
19
+ "r": 256,
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
23
+ "qkv_proj",
24
+ "down_proj",
25
  "o_proj",
26
+ "gate_up_proj"
27
  ],
28
  "task_type": "CAUSAL_LM",
29
  "use_dora": false,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8ba95ba615d126bc740db5435a586950939c55086297b064a96ae74433ae29e2
3
- size 75514840
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:501b9ca5d28184bbd39e74a180d77baa93bd349645019236d0dc6fbca98f0c0d
3
+ size 1610648152
special_tokens_map.json CHANGED
@@ -1,4 +1,13 @@
1
  {
 
 
 
 
 
 
 
 
 
2
  "bos_token": {
3
  "content": "<s>",
4
  "lstrip": false,
 
1
  {
2
+ "additional_special_tokens": [
3
+ {
4
+ "content": "<|end|>",
5
+ "lstrip": false,
6
+ "normalized": false,
7
+ "rstrip": false,
8
+ "single_word": false
9
+ }
10
+ ],
11
  "bos_token": {
12
  "content": "<s>",
13
  "lstrip": false,
tokenizer.json CHANGED
@@ -98,7 +98,7 @@
98
  "content": "<|end|>",
99
  "single_word": false,
100
  "lstrip": false,
101
- "rstrip": true,
102
  "normalized": false,
103
  "special": true
104
  },
 
98
  "content": "<|end|>",
99
  "single_word": false,
100
  "lstrip": false,
101
+ "rstrip": false,
102
  "normalized": false,
103
  "special": true
104
  },
tokenizer_config.json CHANGED
@@ -87,7 +87,7 @@
87
  "content": "<|end|>",
88
  "lstrip": false,
89
  "normalized": false,
90
- "rstrip": true,
91
  "single_word": false,
92
  "special": true
93
  },
@@ -116,15 +116,19 @@
116
  "special": true
117
  }
118
  },
 
 
 
119
  "bos_token": "<s>",
120
  "chat_template": "{% for message in messages %}{% if message['role'] == 'system' and message['content'] %}{{'<|system|>\n' + message['content'] + '<|end|>\n'}}{% elif message['role'] == 'user' %}{{'<|user|>\n' + message['content'] + '<|end|>\n'}}{% elif message['role'] == 'assistant' %}{{'<|assistant|>\n' + message['content'] + '<|end|>\n'}}{% endif %}{% endfor %}{% if add_generation_prompt %}{{ '<|assistant|>\n' }}{% else %}{{ eos_token }}{% endif %}",
121
  "clean_up_tokenization_spaces": false,
122
  "eos_token": "<|endoftext|>",
123
  "legacy": false,
124
- "model_max_length": 131072,
125
  "pad_token": "<|endoftext|>",
126
- "padding_side": "left",
127
  "sp_model_kwargs": {},
 
128
  "tokenizer_class": "LlamaTokenizer",
129
  "unk_token": "<unk>",
130
  "use_default_system_prompt": false
 
87
  "content": "<|end|>",
88
  "lstrip": false,
89
  "normalized": false,
90
+ "rstrip": false,
91
  "single_word": false,
92
  "special": true
93
  },
 
116
  "special": true
117
  }
118
  },
119
+ "additional_special_tokens": [
120
+ "<|end|>"
121
+ ],
122
  "bos_token": "<s>",
123
  "chat_template": "{% for message in messages %}{% if message['role'] == 'system' and message['content'] %}{{'<|system|>\n' + message['content'] + '<|end|>\n'}}{% elif message['role'] == 'user' %}{{'<|user|>\n' + message['content'] + '<|end|>\n'}}{% elif message['role'] == 'assistant' %}{{'<|assistant|>\n' + message['content'] + '<|end|>\n'}}{% endif %}{% endfor %}{% if add_generation_prompt %}{{ '<|assistant|>\n' }}{% else %}{{ eos_token }}{% endif %}",
124
  "clean_up_tokenization_spaces": false,
125
  "eos_token": "<|endoftext|>",
126
  "legacy": false,
127
+ "model_max_length": 8192,
128
  "pad_token": "<|endoftext|>",
129
+ "padding_side": "right",
130
  "sp_model_kwargs": {},
131
+ "split_special_tokens": false,
132
  "tokenizer_class": "LlamaTokenizer",
133
  "unk_token": "<unk>",
134
  "use_default_system_prompt": false
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4462b5dd4e76ba26575494c18855e9b1d5aba875fa1f1645672478a0e18c3172
3
- size 5432
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:79a3bf4181978fb2ed511243adf5e45caa870dd3eb02522ab6dfb5a9fd43ebed
3
+ size 5496