bachvudinh
committed on
Commit
•
ba80fc5
1
Parent(s):
793ae42
Initialize Llama3.1 with Whisper Tokenizer
Browse files
- config.json +1 -1
- model-00001-of-00004.safetensors +2 -2
- model-00004-of-00004.safetensors +2 -2
- model.safetensors.index.json +1 -1
- tokenizer.json +9 -0
- tokenizer_config.json +8 -0
config.json
CHANGED
@@ -35,5 +35,5 @@
|
|
35 |
"torch_dtype": "bfloat16",
|
36 |
"transformers_version": "4.43.1",
|
37 |
"use_cache": true,
|
38 |
-
"vocab_size":
|
39 |
}
|
|
|
35 |
"torch_dtype": "bfloat16",
|
36 |
"transformers_version": "4.43.1",
|
37 |
"use_cache": true,
|
38 |
+
"vocab_size": 128771
|
39 |
}
|
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e185eae1705d58503daf684339d5d5838c61d86fbc6f421dd7a9471d084b38a4
|
3 |
+
size 4980917552
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e84166fbae2e692893ba5773474a2f5bfa37e9839f32c19a8725d33e10abffa7
|
3 |
+
size 1172357688
|
model.safetensors.index.json
CHANGED
@@ -1,6 +1,6 @@
|
|
1 |
{
|
2 |
"metadata": {
|
3 |
-
"total_size":
|
4 |
},
|
5 |
"weight_map": {
|
6 |
"lm_head.weight": "model-00004-of-00004.safetensors",
|
|
|
1 |
{
|
2 |
"metadata": {
|
3 |
+
"total_size": 16068960256
|
4 |
},
|
5 |
"weight_map": {
|
6 |
"lm_head.weight": "model-00004-of-00004.safetensors",
|
tokenizer.json
CHANGED
@@ -6932,6 +6932,15 @@
|
|
6932 |
"rstrip": false,
|
6933 |
"normalized": false,
|
6934 |
"special": true
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
6935 |
}
|
6936 |
],
|
6937 |
"normalizer": null,
|
|
|
6932 |
"rstrip": false,
|
6933 |
"normalized": false,
|
6934 |
"special": true
|
6935 |
+
},
|
6936 |
+
{
|
6937 |
+
"id": 128770,
|
6938 |
+
"content": "<|sound_0512|>",
|
6939 |
+
"single_word": false,
|
6940 |
+
"lstrip": false,
|
6941 |
+
"rstrip": false,
|
6942 |
+
"normalized": false,
|
6943 |
+
"special": true
|
6944 |
}
|
6945 |
],
|
6946 |
"normalizer": null,
|
tokenizer_config.json
CHANGED
@@ -6159,6 +6159,14 @@
|
|
6159 |
"rstrip": false,
|
6160 |
"single_word": false,
|
6161 |
"special": true
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
6162 |
}
|
6163 |
},
|
6164 |
"bos_token": "<|begin_of_text|>",
|
|
|
6159 |
"rstrip": false,
|
6160 |
"single_word": false,
|
6161 |
"special": true
|
6162 |
+
},
|
6163 |
+
"128770": {
|
6164 |
+
"content": "<|sound_0512|>",
|
6165 |
+
"lstrip": false,
|
6166 |
+
"normalized": false,
|
6167 |
+
"rstrip": false,
|
6168 |
+
"single_word": false,
|
6169 |
+
"special": true
|
6170 |
}
|
6171 |
},
|
6172 |
"bos_token": "<|begin_of_text|>",
|