veronica-girolimetti committed on
Commit
0f3f44b
1 Parent(s): 4fd1c0d

Training in progress, step 265

Browse files
adapter_config.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "alpha_pattern": {},
3
  "auto_mapping": null,
4
- "base_model_name_or_path": "epfl-llm/meditron-7b",
5
  "bias": "none",
6
  "fan_in_fan_out": false,
7
  "inference_mode": true,
@@ -20,13 +20,13 @@
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
23
- "k_proj",
24
- "down_proj",
25
  "up_proj",
26
- "o_proj",
27
- "v_proj",
28
  "q_proj",
29
- "gate_proj"
 
 
 
30
  ],
31
  "task_type": "CAUSAL_LM",
32
  "use_dora": false,
 
1
  {
2
  "alpha_pattern": {},
3
  "auto_mapping": null,
4
+ "base_model_name_or_path": "unsloth/llama-2-7b-chat-bnb-4bit",
5
  "bias": "none",
6
  "fan_in_fan_out": false,
7
  "inference_mode": true,
 
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
 
 
23
  "up_proj",
24
+ "k_proj",
 
25
  "q_proj",
26
+ "gate_proj",
27
+ "v_proj",
28
+ "down_proj",
29
+ "o_proj"
30
  ],
31
  "task_type": "CAUSAL_LM",
32
  "use_dora": false,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9809602631f53f593605bdc35d559c88bd9496ff59f012c3c26d7e75e45de6ba
3
  size 5117112704
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:18b97d1c23158519bf1ae810d3922a872561ba30e8beb2584aa04baec5c2e7a7
3
  size 5117112704
runs/Oct18_19-56-32_b9c4e637b51c/events.out.tfevents.1729281396.b9c4e637b51c.6221.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bee92d62519a4d1fa04bb7ec0baabf7025218efd2075c4fcf175926514613bcf
3
+ size 11557
special_tokens_map.json CHANGED
@@ -1,28 +1,7 @@
1
  {
2
- "additional_special_tokens": [
3
- "[bib_ref]",
4
- "[/bib_ref]",
5
- "[fig_ref]",
6
- "[/fig_ref]",
7
- "[bib]",
8
- "[/bib]",
9
- "[fig]",
10
- "[/fig]",
11
- "[table]",
12
- "[/table]",
13
- "[formula]",
14
- "[/formula]"
15
- ],
16
  "bos_token": {
17
  "content": "<s>",
18
  "lstrip": false,
19
- "normalized": true,
20
- "rstrip": false,
21
- "single_word": false
22
- },
23
- "cls_token": {
24
- "content": "<CLS>",
25
- "lstrip": false,
26
  "normalized": false,
27
  "rstrip": false,
28
  "single_word": false
@@ -30,26 +9,12 @@
30
  "eos_token": {
31
  "content": "</s>",
32
  "lstrip": false,
33
- "normalized": true,
34
- "rstrip": false,
35
- "single_word": false
36
- },
37
- "mask_token": {
38
- "content": "<MASK>",
39
- "lstrip": false,
40
  "normalized": false,
41
  "rstrip": false,
42
  "single_word": false
43
  },
44
  "pad_token": {
45
- "content": "<PAD>",
46
- "lstrip": false,
47
- "normalized": false,
48
- "rstrip": false,
49
- "single_word": false
50
- },
51
- "sep_token": {
52
- "content": "<SEP>",
53
  "lstrip": false,
54
  "normalized": false,
55
  "rstrip": false,
@@ -58,7 +23,7 @@
58
  "unk_token": {
59
  "content": "<unk>",
60
  "lstrip": false,
61
- "normalized": true,
62
  "rstrip": false,
63
  "single_word": false
64
  }
 
1
  {
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2
  "bos_token": {
3
  "content": "<s>",
4
  "lstrip": false,
 
 
 
 
 
 
 
5
  "normalized": false,
6
  "rstrip": false,
7
  "single_word": false
 
9
  "eos_token": {
10
  "content": "</s>",
11
  "lstrip": false,
 
 
 
 
 
 
 
12
  "normalized": false,
13
  "rstrip": false,
14
  "single_word": false
15
  },
16
  "pad_token": {
17
+ "content": "<unk>",
 
 
 
 
 
 
 
18
  "lstrip": false,
19
  "normalized": false,
20
  "rstrip": false,
 
23
  "unk_token": {
24
  "content": "<unk>",
25
  "lstrip": false,
26
+ "normalized": false,
27
  "rstrip": false,
28
  "single_word": false
29
  }
tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json CHANGED
@@ -1,12 +1,12 @@
1
  {
2
  "add_bos_token": true,
3
  "add_eos_token": false,
4
- "add_prefix_space": true,
5
  "added_tokens_decoder": {
6
  "0": {
7
  "content": "<unk>",
8
  "lstrip": false,
9
- "normalized": true,
10
  "rstrip": false,
11
  "single_word": false,
12
  "special": true
@@ -14,7 +14,7 @@
14
  "1": {
15
  "content": "<s>",
16
  "lstrip": false,
17
- "normalized": true,
18
  "rstrip": false,
19
  "single_word": false,
20
  "special": true
@@ -22,174 +22,21 @@
22
  "2": {
23
  "content": "</s>",
24
  "lstrip": false,
25
- "normalized": true,
26
- "rstrip": false,
27
- "single_word": false,
28
- "special": true
29
- },
30
- "32000": {
31
- "content": "<CLS>",
32
- "lstrip": false,
33
- "normalized": false,
34
- "rstrip": false,
35
- "single_word": false,
36
- "special": true
37
- },
38
- "32001": {
39
- "content": "<SEP>",
40
- "lstrip": false,
41
- "normalized": false,
42
- "rstrip": false,
43
- "single_word": false,
44
- "special": true
45
- },
46
- "32002": {
47
- "content": "<EOD>",
48
- "lstrip": false,
49
- "normalized": false,
50
- "rstrip": false,
51
- "single_word": false,
52
- "special": true
53
- },
54
- "32003": {
55
- "content": "<MASK>",
56
- "lstrip": false,
57
- "normalized": false,
58
- "rstrip": false,
59
- "single_word": false,
60
- "special": true
61
- },
62
- "32004": {
63
- "content": "<PAD>",
64
- "lstrip": false,
65
- "normalized": false,
66
- "rstrip": false,
67
- "single_word": false,
68
- "special": true
69
- },
70
- "32005": {
71
- "content": "[bib_ref]",
72
- "lstrip": false,
73
- "normalized": false,
74
- "rstrip": false,
75
- "single_word": false,
76
- "special": true
77
- },
78
- "32006": {
79
- "content": "[/bib_ref]",
80
- "lstrip": false,
81
- "normalized": false,
82
- "rstrip": false,
83
- "single_word": false,
84
- "special": true
85
- },
86
- "32007": {
87
- "content": "[fig_ref]",
88
- "lstrip": false,
89
- "normalized": false,
90
- "rstrip": false,
91
- "single_word": false,
92
- "special": true
93
- },
94
- "32008": {
95
- "content": "[/fig_ref]",
96
- "lstrip": false,
97
- "normalized": false,
98
- "rstrip": false,
99
- "single_word": false,
100
- "special": true
101
- },
102
- "32009": {
103
- "content": "[bib]",
104
- "lstrip": false,
105
- "normalized": false,
106
- "rstrip": false,
107
- "single_word": false,
108
- "special": true
109
- },
110
- "32010": {
111
- "content": "[/bib]",
112
- "lstrip": false,
113
- "normalized": false,
114
- "rstrip": false,
115
- "single_word": false,
116
- "special": true
117
- },
118
- "32011": {
119
- "content": "[fig]",
120
- "lstrip": false,
121
- "normalized": false,
122
- "rstrip": false,
123
- "single_word": false,
124
- "special": true
125
- },
126
- "32012": {
127
- "content": "[/fig]",
128
- "lstrip": false,
129
- "normalized": false,
130
- "rstrip": false,
131
- "single_word": false,
132
- "special": true
133
- },
134
- "32013": {
135
- "content": "[table]",
136
- "lstrip": false,
137
- "normalized": false,
138
- "rstrip": false,
139
- "single_word": false,
140
- "special": true
141
- },
142
- "32014": {
143
- "content": "[/table]",
144
- "lstrip": false,
145
- "normalized": false,
146
- "rstrip": false,
147
- "single_word": false,
148
- "special": true
149
- },
150
- "32015": {
151
- "content": "[formula]",
152
- "lstrip": false,
153
- "normalized": false,
154
- "rstrip": false,
155
- "single_word": false,
156
- "special": true
157
- },
158
- "32016": {
159
- "content": "[/formula]",
160
- "lstrip": false,
161
  "normalized": false,
162
  "rstrip": false,
163
  "single_word": false,
164
  "special": true
165
  }
166
  },
167
- "additional_special_tokens": [
168
- "[bib_ref]",
169
- "[/bib_ref]",
170
- "[fig_ref]",
171
- "[/fig_ref]",
172
- "[bib]",
173
- "[/bib]",
174
- "[fig]",
175
- "[/fig]",
176
- "[table]",
177
- "[/table]",
178
- "[formula]",
179
- "[/formula]"
180
- ],
181
  "bos_token": "<s>",
 
182
  "clean_up_tokenization_spaces": false,
183
- "cls_token": "<CLS>",
184
  "eos_token": "</s>",
185
  "legacy": false,
186
- "mask_token": "<MASK>",
187
  "model_max_length": 4096,
188
- "pad_token": "<PAD>",
189
  "padding_side": "right",
190
- "sep_token": "<SEP>",
191
  "sp_model_kwargs": {},
192
- "spaces_between_special_tokens": false,
193
  "tokenizer_class": "LlamaTokenizer",
194
  "unk_token": "<unk>",
195
  "use_default_system_prompt": false
 
1
  {
2
  "add_bos_token": true,
3
  "add_eos_token": false,
4
+ "add_prefix_space": null,
5
  "added_tokens_decoder": {
6
  "0": {
7
  "content": "<unk>",
8
  "lstrip": false,
9
+ "normalized": false,
10
  "rstrip": false,
11
  "single_word": false,
12
  "special": true
 
14
  "1": {
15
  "content": "<s>",
16
  "lstrip": false,
17
+ "normalized": false,
18
  "rstrip": false,
19
  "single_word": false,
20
  "special": true
 
22
  "2": {
23
  "content": "</s>",
24
  "lstrip": false,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
25
  "normalized": false,
26
  "rstrip": false,
27
  "single_word": false,
28
  "special": true
29
  }
30
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
31
  "bos_token": "<s>",
32
+ "chat_template": "{% if messages[0]['role'] == 'system' %}{% set loop_messages = messages[1:] %}{% set system_message = messages[0]['content'] %}{% else %}{% set loop_messages = messages %}{% set system_message = false %}{% endif %}{% for message in loop_messages %}{% if (message['role'] == 'user') != (loop.index0 % 2 == 0) %}{{ raise_exception('Conversation roles must alternate user/assistant/user/assistant/...') }}{% endif %}{% if loop.index0 == 0 and system_message != false %}{% set content = '<<SYS>>\\n' + system_message + '\\n<</SYS>>\\n\\n' + message['content'] %}{% else %}{% set content = message['content'] %}{% endif %}{% if message['role'] == 'user' %}{{ bos_token + '[INST] ' + content.strip() + ' [/INST]' }}{% elif message['role'] == 'assistant' %}{{ ' ' + content.strip() + ' ' + eos_token }}{% endif %}{% endfor %}",
33
  "clean_up_tokenization_spaces": false,
 
34
  "eos_token": "</s>",
35
  "legacy": false,
 
36
  "model_max_length": 4096,
37
+ "pad_token": "<unk>",
38
  "padding_side": "right",
 
39
  "sp_model_kwargs": {},
 
40
  "tokenizer_class": "LlamaTokenizer",
41
  "unk_token": "<unk>",
42
  "use_default_system_prompt": false
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:236bb0f2118cd2d2cc800861787f9d3c9c2d447b0a8b79b4777de831321f9e7d
3
  size 5496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c60f9cfc7e9c83a0c06145e2a7609cca95ba652065569a1cee831cd648f1fcd3
3
  size 5496