nithiyn committed on
Commit
a122f2a
·
verified ·
1 Parent(s): cd1f639

Upload folder using huggingface_hub

Browse files
.gitattributes CHANGED
@@ -33,3 +33,15 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ compiled/2379555668bd87cb73b9.neff filter=lfs diff=lfs merge=lfs -text
37
+ compiled/625cbc9fc30bdfe4655d.neff filter=lfs diff=lfs merge=lfs -text
38
+ compiled/69408ea3072d734f7cf8.neff filter=lfs diff=lfs merge=lfs -text
39
+ compiled/7375794dc87a0944abae.neff filter=lfs diff=lfs merge=lfs -text
40
+ compiled/87b623157d3eb2153d48.neff filter=lfs diff=lfs merge=lfs -text
41
+ compiled/b2319ba4002d5c6923d4.neff filter=lfs diff=lfs merge=lfs -text
42
+ compiled/bac86e22321a7b448b83.neff filter=lfs diff=lfs merge=lfs -text
43
+ compiled/bafbb75c5fd94fa672f5.neff filter=lfs diff=lfs merge=lfs -text
44
+ compiled/c57922bd0bf9fc22305f.neff filter=lfs diff=lfs merge=lfs -text
45
+ compiled/c7174ca2aa90bd6d258a.neff filter=lfs diff=lfs merge=lfs -text
46
+ compiled/ca301776358bb24e0b67.neff filter=lfs diff=lfs merge=lfs -text
47
+ compiled/f33663d7426faf0a46e4.neff filter=lfs diff=lfs merge=lfs -text
compiled/2379555668bd87cb73b9.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cb12607aa397e370639b067126c728e76b40075acc343d49c18a48c6cecfaf6c
3
+ size 1321984
compiled/625cbc9fc30bdfe4655d.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a7379c6aa990febd9c5b8fcfa7c1fef2cfd9e7ea5f99d3f968d013d1510075d0
3
+ size 8418304
compiled/69408ea3072d734f7cf8.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:06be480f77e8b4007645bec3d31a75c70cb488c8e9d97020f3e7585204de6a12
3
+ size 15750144
compiled/7375794dc87a0944abae.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e669fea3849cebeb897159e432ea400e66129e93197ec99052e6c669b0e877a1
3
+ size 11879424
compiled/87b623157d3eb2153d48.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:36d00296f2fe171507887905504d6c58f82fa33c9ee32973fc0b7a3c0a531988
3
+ size 12053504
compiled/b2319ba4002d5c6923d4.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f0d8427c749726816c1ec0b047cb6481be903f7b74ab62c5b342730db957b19c
3
+ size 11920384
compiled/bac86e22321a7b448b83.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b504695e84e0c0252046d8cd39b29cc63357b86bfab96e0880c16ef1daa6201f
3
+ size 2171904
compiled/bafbb75c5fd94fa672f5.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fdde827594fb2c25b8cdb91c3e7179b411aea84b505f51ea85a2c6a3d626b557
3
+ size 12268544
compiled/c57922bd0bf9fc22305f.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ce57e940cdb5d1759d4edbec086cc7da1857351631b57454b3d5af032bf6bd73
3
+ size 12616704
compiled/c7174ca2aa90bd6d258a.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:39687c8d300e764ba24f9b57cc2a706f681acb94a1748188d2ad276984e09db2
3
+ size 18740224
compiled/ca301776358bb24e0b67.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f77ea64bc48bbeecf52da782d46b1120038b75d46f3a8134f845c9df0e466f06
3
+ size 4506624
compiled/f33663d7426faf0a46e4.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:98e2f0c3f34b3f24468aa4e7058a0eaf2a4a64509cd022cbb080526b426331cb
3
+ size 11961344
config.json ADDED
@@ -0,0 +1,42 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "mistralai/Mixtral-8x22B-Instruct-v0.1",
3
+ "architectures": [
4
+ "MixtralForCausalLM"
5
+ ],
6
+ "attention_dropout": 0.0,
7
+ "bos_token_id": 1,
8
+ "eos_token_id": 2,
9
+ "hidden_act": "silu",
10
+ "hidden_size": 6144,
11
+ "initializer_range": 0.02,
12
+ "intermediate_size": 16384,
13
+ "max_position_embeddings": 65536,
14
+ "model_type": "mixtral",
15
+ "neuron": {
16
+ "auto_cast_type": "fp16",
17
+ "batch_size": 4,
18
+ "checkpoint_id": "mistralai/Mixtral-8x22B-Instruct-v0.1",
19
+ "checkpoint_revision": "a46959a1a02a9247294f5e141a4f3270059c6b32",
20
+ "compiler_type": "neuronx-cc",
21
+ "compiler_version": "2.15.128.0+56dc5a86",
22
+ "num_cores": 24,
23
+ "sequence_length": 4096,
24
+ "task": "text-generation"
25
+ },
26
+ "num_attention_heads": 48,
27
+ "num_experts_per_tok": 2,
28
+ "num_hidden_layers": 56,
29
+ "num_key_value_heads": 8,
30
+ "num_local_experts": 8,
31
+ "output_router_logits": false,
32
+ "rms_norm_eps": 1e-05,
33
+ "rope_theta": 1000000.0,
34
+ "router_aux_loss_coef": 0.001,
35
+ "router_jitter_noise": 0.0,
36
+ "sliding_window": null,
37
+ "tie_word_embeddings": false,
38
+ "torch_dtype": "bfloat16",
39
+ "transformers_version": "4.43.2",
40
+ "use_cache": true,
41
+ "vocab_size": 32768
42
+ }
generation_config.json ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ {
2
+ "_from_model_config": true,
3
+ "bos_token_id": 1,
4
+ "eos_token_id": 2,
5
+ "transformers_version": "4.43.2"
6
+ }
special_tokens_map.json ADDED
@@ -0,0 +1,23 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": {
3
+ "content": "<s>",
4
+ "lstrip": false,
5
+ "normalized": false,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "eos_token": {
10
+ "content": "</s>",
11
+ "lstrip": false,
12
+ "normalized": false,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "unk_token": {
17
+ "content": "<unk>",
18
+ "lstrip": false,
19
+ "normalized": false,
20
+ "rstrip": false,
21
+ "single_word": false
22
+ }
23
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:37f00374dea48658ee8f5d0f21895b9bc55cb0103939607c8185bfd1c6ca1f89
3
+ size 587404
tokenizer_config.json ADDED
The diff for this file is too large to render. See raw diff