Upload folder using huggingface_hub
Browse files- .gitattributes +12 -0
- compiled/2379555668bd87cb73b9.neff +3 -0
- compiled/625cbc9fc30bdfe4655d.neff +3 -0
- compiled/69408ea3072d734f7cf8.neff +3 -0
- compiled/7375794dc87a0944abae.neff +3 -0
- compiled/87b623157d3eb2153d48.neff +3 -0
- compiled/b2319ba4002d5c6923d4.neff +3 -0
- compiled/bac86e22321a7b448b83.neff +3 -0
- compiled/bafbb75c5fd94fa672f5.neff +3 -0
- compiled/c57922bd0bf9fc22305f.neff +3 -0
- compiled/c7174ca2aa90bd6d258a.neff +3 -0
- compiled/ca301776358bb24e0b67.neff +3 -0
- compiled/f33663d7426faf0a46e4.neff +3 -0
- config.json +42 -0
- generation_config.json +6 -0
- special_tokens_map.json +23 -0
- tokenizer.json +0 -0
- tokenizer.model +3 -0
- tokenizer_config.json +0 -0
.gitattributes
CHANGED
@@ -33,3 +33,15 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
36 |
+
compiled/2379555668bd87cb73b9.neff filter=lfs diff=lfs merge=lfs -text
|
37 |
+
compiled/625cbc9fc30bdfe4655d.neff filter=lfs diff=lfs merge=lfs -text
|
38 |
+
compiled/69408ea3072d734f7cf8.neff filter=lfs diff=lfs merge=lfs -text
|
39 |
+
compiled/7375794dc87a0944abae.neff filter=lfs diff=lfs merge=lfs -text
|
40 |
+
compiled/87b623157d3eb2153d48.neff filter=lfs diff=lfs merge=lfs -text
|
41 |
+
compiled/b2319ba4002d5c6923d4.neff filter=lfs diff=lfs merge=lfs -text
|
42 |
+
compiled/bac86e22321a7b448b83.neff filter=lfs diff=lfs merge=lfs -text
|
43 |
+
compiled/bafbb75c5fd94fa672f5.neff filter=lfs diff=lfs merge=lfs -text
|
44 |
+
compiled/c57922bd0bf9fc22305f.neff filter=lfs diff=lfs merge=lfs -text
|
45 |
+
compiled/c7174ca2aa90bd6d258a.neff filter=lfs diff=lfs merge=lfs -text
|
46 |
+
compiled/ca301776358bb24e0b67.neff filter=lfs diff=lfs merge=lfs -text
|
47 |
+
compiled/f33663d7426faf0a46e4.neff filter=lfs diff=lfs merge=lfs -text
|
compiled/2379555668bd87cb73b9.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cb12607aa397e370639b067126c728e76b40075acc343d49c18a48c6cecfaf6c
|
3 |
+
size 1321984
|
compiled/625cbc9fc30bdfe4655d.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a7379c6aa990febd9c5b8fcfa7c1fef2cfd9e7ea5f99d3f968d013d1510075d0
|
3 |
+
size 8418304
|
compiled/69408ea3072d734f7cf8.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:06be480f77e8b4007645bec3d31a75c70cb488c8e9d97020f3e7585204de6a12
|
3 |
+
size 15750144
|
compiled/7375794dc87a0944abae.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e669fea3849cebeb897159e432ea400e66129e93197ec99052e6c669b0e877a1
|
3 |
+
size 11879424
|
compiled/87b623157d3eb2153d48.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:36d00296f2fe171507887905504d6c58f82fa33c9ee32973fc0b7a3c0a531988
|
3 |
+
size 12053504
|
compiled/b2319ba4002d5c6923d4.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f0d8427c749726816c1ec0b047cb6481be903f7b74ab62c5b342730db957b19c
|
3 |
+
size 11920384
|
compiled/bac86e22321a7b448b83.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b504695e84e0c0252046d8cd39b29cc63357b86bfab96e0880c16ef1daa6201f
|
3 |
+
size 2171904
|
compiled/bafbb75c5fd94fa672f5.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fdde827594fb2c25b8cdb91c3e7179b411aea84b505f51ea85a2c6a3d626b557
|
3 |
+
size 12268544
|
compiled/c57922bd0bf9fc22305f.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ce57e940cdb5d1759d4edbec086cc7da1857351631b57454b3d5af032bf6bd73
|
3 |
+
size 12616704
|
compiled/c7174ca2aa90bd6d258a.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:39687c8d300e764ba24f9b57cc2a706f681acb94a1748188d2ad276984e09db2
|
3 |
+
size 18740224
|
compiled/ca301776358bb24e0b67.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f77ea64bc48bbeecf52da782d46b1120038b75d46f3a8134f845c9df0e466f06
|
3 |
+
size 4506624
|
compiled/f33663d7426faf0a46e4.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:98e2f0c3f34b3f24468aa4e7058a0eaf2a4a64509cd022cbb080526b426331cb
|
3 |
+
size 11961344
|
config.json
ADDED
@@ -0,0 +1,42 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "mistralai/Mixtral-8x22B-Instruct-v0.1",
|
3 |
+
"architectures": [
|
4 |
+
"MixtralForCausalLM"
|
5 |
+
],
|
6 |
+
"attention_dropout": 0.0,
|
7 |
+
"bos_token_id": 1,
|
8 |
+
"eos_token_id": 2,
|
9 |
+
"hidden_act": "silu",
|
10 |
+
"hidden_size": 6144,
|
11 |
+
"initializer_range": 0.02,
|
12 |
+
"intermediate_size": 16384,
|
13 |
+
"max_position_embeddings": 65536,
|
14 |
+
"model_type": "mixtral",
|
15 |
+
"neuron": {
|
16 |
+
"auto_cast_type": "fp16",
|
17 |
+
"batch_size": 4,
|
18 |
+
"checkpoint_id": "mistralai/Mixtral-8x22B-Instruct-v0.1",
|
19 |
+
"checkpoint_revision": "a46959a1a02a9247294f5e141a4f3270059c6b32",
|
20 |
+
"compiler_type": "neuronx-cc",
|
21 |
+
"compiler_version": "2.15.128.0+56dc5a86",
|
22 |
+
"num_cores": 24,
|
23 |
+
"sequence_length": 4096,
|
24 |
+
"task": "text-generation"
|
25 |
+
},
|
26 |
+
"num_attention_heads": 48,
|
27 |
+
"num_experts_per_tok": 2,
|
28 |
+
"num_hidden_layers": 56,
|
29 |
+
"num_key_value_heads": 8,
|
30 |
+
"num_local_experts": 8,
|
31 |
+
"output_router_logits": false,
|
32 |
+
"rms_norm_eps": 1e-05,
|
33 |
+
"rope_theta": 1000000.0,
|
34 |
+
"router_aux_loss_coef": 0.001,
|
35 |
+
"router_jitter_noise": 0.0,
|
36 |
+
"sliding_window": null,
|
37 |
+
"tie_word_embeddings": false,
|
38 |
+
"torch_dtype": "bfloat16",
|
39 |
+
"transformers_version": "4.43.2",
|
40 |
+
"use_cache": true,
|
41 |
+
"vocab_size": 32768
|
42 |
+
}
|
generation_config.json
ADDED
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_from_model_config": true,
|
3 |
+
"bos_token_id": 1,
|
4 |
+
"eos_token_id": 2,
|
5 |
+
"transformers_version": "4.43.2"
|
6 |
+
}
|
special_tokens_map.json
ADDED
@@ -0,0 +1,23 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"bos_token": {
|
3 |
+
"content": "<s>",
|
4 |
+
"lstrip": false,
|
5 |
+
"normalized": false,
|
6 |
+
"rstrip": false,
|
7 |
+
"single_word": false
|
8 |
+
},
|
9 |
+
"eos_token": {
|
10 |
+
"content": "</s>",
|
11 |
+
"lstrip": false,
|
12 |
+
"normalized": false,
|
13 |
+
"rstrip": false,
|
14 |
+
"single_word": false
|
15 |
+
},
|
16 |
+
"unk_token": {
|
17 |
+
"content": "<unk>",
|
18 |
+
"lstrip": false,
|
19 |
+
"normalized": false,
|
20 |
+
"rstrip": false,
|
21 |
+
"single_word": false
|
22 |
+
}
|
23 |
+
}
|
tokenizer.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
tokenizer.model
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:37f00374dea48658ee8f5d0f21895b9bc55cb0103939607c8185bfd1c6ca1f89
|
3 |
+
size 587404
|
tokenizer_config.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|