joanllop committed on
Commit
110c55b
·
1 Parent(s): b609125
.gitattributes CHANGED
@@ -35,3 +35,8 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
  images/salamandra_header.png filter=lfs diff=lfs merge=lfs -text
37
  tokenizer.json filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
  images/salamandra_header.png filter=lfs diff=lfs merge=lfs -text
37
  tokenizer.json filter=lfs diff=lfs merge=lfs -text
38
+ model-00002-of-00004.safetensors filter=lfs diff=lfs merge=lfs -text
39
+ model-00003-of-00004.safetensors filter=lfs diff=lfs merge=lfs -text
40
+ model-00004-of-00004.safetensors filter=lfs diff=lfs merge=lfs -text
41
+ model-00001-of-00004.safetensors filter=lfs diff=lfs merge=lfs -text
42
+ tokenizer.model filter=lfs diff=lfs merge=lfs -text
config.json CHANGED
@@ -6,6 +6,7 @@
6
  "attention_dropout": 0.0,
7
  "bos_token_id": 1,
8
  "eos_token_id": 2,
 
9
  "hidden_act": "silu",
10
  "hidden_size": 4096,
11
  "initializer_range": 0.02,
@@ -17,12 +18,12 @@
17
  "num_hidden_layers": 32,
18
  "num_key_value_heads": 8,
19
  "pretraining_tp": 1,
20
- "rms_norm_eps": 1e-06,
21
  "rope_scaling": null,
22
  "rope_theta": 10000.0,
23
  "tie_word_embeddings": false,
24
  "torch_dtype": "bfloat16",
25
- "transformers_version": "4.41.1",
26
  "use_cache": true,
27
  "vocab_size": 256000
28
  }
 
6
  "attention_dropout": 0.0,
7
  "bos_token_id": 1,
8
  "eos_token_id": 2,
9
+ "head_dim": 128,
10
  "hidden_act": "silu",
11
  "hidden_size": 4096,
12
  "initializer_range": 0.02,
 
18
  "num_hidden_layers": 32,
19
  "num_key_value_heads": 8,
20
  "pretraining_tp": 1,
21
+ "rms_norm_eps": 1e-05,
22
  "rope_scaling": null,
23
  "rope_theta": 10000.0,
24
  "tie_word_embeddings": false,
25
  "torch_dtype": "bfloat16",
26
+ "transformers_version": "4.45.2",
27
  "use_cache": true,
28
  "vocab_size": 256000
29
  }
generation_config.json CHANGED
@@ -7,5 +7,5 @@
7
  "top_p": 0.95,
8
  "max_new_tokens": 25,
9
  "repetition_penalty": 1.2,
10
- "transformers_version": "4.40.2"
11
  }
 
7
  "top_p": 0.95,
8
  "max_new_tokens": 25,
9
  "repetition_penalty": 1.2,
10
+ "transformers_version": "4.45.2"
11
  }
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:476aa35f9b2251b2e15b9d9107bc63b8506d219e999817fe9d870fb410c2145d
3
  size 4982973048
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:37605bf126644abb6e195034fae986f5248aed453b3579047e3a475aaf2387ab
3
  size 4982973048
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:58c1450233d3453c9faafdbfa1d4f96f5c29e669f3f7e69ccdd1a7b53ad934d1
3
  size 4995660232
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:de573b93500a81744174cbfdbcd54465ab5e1e5d76dccd32d53382ad54a3d337
3
  size 4995660232
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d7c5c41380f2f7b4caea1c011a4170270d33e76190135faae2bde104d1946fe2
3
  size 3460482936
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f507941af2449c9f24c776ffa379ea78995b94c2d370202a786ac6d5642888d9
3
  size 3460482936
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dbfdbb42a23f684cc00c560209fa0256881f6ff8eade4f3c0d9c8f13d3825989
3
  size 2097152128
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c4944914fb33caad0b42c1591478d6fe95dd07811a899ea7ac6b3bfcbd3c2052
3
  size 2097152128
tokenizer.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:990527d1e7b98c027d386c742250b2f8517bd3adf98c46cc6c1c2f35b234c224
3
- size 37007559
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e90b85b3e3b3ebfc6b9bafeb954b37f2435eed595738337e53f2a746d23d5a2
3
+ size 37007416
tokenizer.model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fa490e57cebce5cb1a0a5b1a5d3fa4de05aee53dc3a44791f1c3401db44d802d
3
- size 4813274
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab94ddf46d14f0279254858d53770c5319c5129d47291ee2bada530271cb1292
3
+ size 4813276
tokenizer_config.json CHANGED
@@ -31,8 +31,9 @@
31
  "bos_token": "<s>",
32
  "clean_up_tokenization_spaces": false,
33
  "eos_token": "</s>",
34
- "legacy": true,
35
- "model_max_length": 8192,
 
36
  "pad_token": null,
37
  "sp_model_kwargs": {},
38
  "spaces_between_special_tokens": false,
 
31
  "bos_token": "<s>",
32
  "clean_up_tokenization_spaces": false,
33
  "eos_token": "</s>",
34
+ "legacy": false,
35
+ "local_files_only": true,
36
+ "model_max_length": 1000000000000000019884624838656,
37
  "pad_token": null,
38
  "sp_model_kwargs": {},
39
  "spaces_between_special_tokens": false,