joanllop committed on
Commit
1812f38
·
1 Parent(s): e26e974
.gitattributes CHANGED
@@ -35,3 +35,5 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
  images/salamandra_header.png filter=lfs diff=lfs merge=lfs -text
37
  tokenizer.json filter=lfs diff=lfs merge=lfs -text
 
 
 
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
  images/salamandra_header.png filter=lfs diff=lfs merge=lfs -text
37
  tokenizer.json filter=lfs diff=lfs merge=lfs -text
38
+ model.safetensors filter=lfs diff=lfs merge=lfs -text
39
+ tokenizer.model filter=lfs diff=lfs merge=lfs -text
config.json CHANGED
@@ -6,6 +6,7 @@
6
  "attention_dropout": 0.0,
7
  "bos_token_id": 1,
8
  "eos_token_id": 2,
 
9
  "hidden_act": "silu",
10
  "hidden_size": 2048,
11
  "initializer_range": 0.02,
@@ -16,14 +17,13 @@
16
  "num_attention_heads": 16,
17
  "num_hidden_layers": 24,
18
  "num_key_value_heads": 16,
19
- "num_layers": 24,
20
  "pretraining_tp": 1,
21
  "rms_norm_eps": 1e-05,
22
  "rope_scaling": null,
23
  "rope_theta": 10000.0,
24
  "tie_word_embeddings": false,
25
  "torch_dtype": "bfloat16",
26
- "transformers_version": "4.41.1",
27
  "use_cache": true,
28
  "vocab_size": 256000
29
  }
 
6
  "attention_dropout": 0.0,
7
  "bos_token_id": 1,
8
  "eos_token_id": 2,
9
+ "head_dim": 128,
10
  "hidden_act": "silu",
11
  "hidden_size": 2048,
12
  "initializer_range": 0.02,
 
17
  "num_attention_heads": 16,
18
  "num_hidden_layers": 24,
19
  "num_key_value_heads": 16,
 
20
  "pretraining_tp": 1,
21
  "rms_norm_eps": 1e-05,
22
  "rope_scaling": null,
23
  "rope_theta": 10000.0,
24
  "tie_word_embeddings": false,
25
  "torch_dtype": "bfloat16",
26
+ "transformers_version": "4.45.2",
27
  "use_cache": true,
28
  "vocab_size": 256000
29
  }
generation_config.json CHANGED
@@ -7,5 +7,5 @@
7
  "top_p": 0.95,
8
  "max_new_tokens": 25,
9
  "repetition_penalty": 1.2,
10
- "transformers_version": "4.40.2"
11
  }
 
7
  "top_p": 0.95,
8
  "max_new_tokens": 25,
9
  "repetition_penalty": 1.2,
10
+ "transformers_version": "4.45.2"
11
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7ec596bbf8f95408a120b009f320621cdcd2f861b3e373e770fe5a12754de66b
3
  size 4507005744
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:895a734b23869bfa3fdca1956cfc3de4bba500c4e8c7d958067c74cf807406f3
3
  size 4507005744
tokenizer.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:990527d1e7b98c027d386c742250b2f8517bd3adf98c46cc6c1c2f35b234c224
3
- size 37007559
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e90b85b3e3b3ebfc6b9bafeb954b37f2435eed595738337e53f2a746d23d5a2
3
+ size 37007416
tokenizer.model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fa490e57cebce5cb1a0a5b1a5d3fa4de05aee53dc3a44791f1c3401db44d802d
3
- size 4813274
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab94ddf46d14f0279254858d53770c5319c5129d47291ee2bada530271cb1292
3
+ size 4813276
tokenizer_config.json CHANGED
@@ -31,8 +31,9 @@
31
  "bos_token": "<s>",
32
  "clean_up_tokenization_spaces": false,
33
  "eos_token": "</s>",
34
- "legacy": true,
35
- "model_max_length": 8192,
 
36
  "pad_token": null,
37
  "sp_model_kwargs": {},
38
  "spaces_between_special_tokens": false,
 
31
  "bos_token": "<s>",
32
  "clean_up_tokenization_spaces": false,
33
  "eos_token": "</s>",
34
+ "legacy": false,
35
+ "local_files_only": true,
36
+ "model_max_length": 1000000000000000019884624838656,
37
  "pad_token": null,
38
  "sp_model_kwargs": {},
39
  "spaces_between_special_tokens": false,