Upload folder using huggingface_hub
Browse files. This view is limited to 50 files because it contains too many changes.
See raw diff
- mlc-chat-config.json +87 -0
- ndarray-cache-b16.json +0 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_100.bin +3 -0
- params_shard_101.bin +3 -0
- params_shard_102.bin +3 -0
- params_shard_103.bin +3 -0
- params_shard_104.bin +3 -0
- params_shard_105.bin +3 -0
- params_shard_106.bin +3 -0
- params_shard_107.bin +3 -0
- params_shard_108.bin +3 -0
- params_shard_109.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_110.bin +3 -0
- params_shard_111.bin +3 -0
- params_shard_112.bin +3 -0
- params_shard_113.bin +3 -0
- params_shard_114.bin +3 -0
- params_shard_115.bin +3 -0
- params_shard_116.bin +3 -0
- params_shard_117.bin +3 -0
- params_shard_118.bin +3 -0
- params_shard_119.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_120.bin +3 -0
- params_shard_121.bin +3 -0
- params_shard_122.bin +3 -0
- params_shard_123.bin +3 -0
- params_shard_124.bin +3 -0
- params_shard_125.bin +3 -0
- params_shard_126.bin +3 -0
- params_shard_127.bin +3 -0
- params_shard_128.bin +3 -0
- params_shard_129.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_130.bin +3 -0
- params_shard_131.bin +3 -0
- params_shard_132.bin +3 -0
- params_shard_133.bin +3 -0
- params_shard_134.bin +3 -0
- params_shard_135.bin +3 -0
- params_shard_136.bin +3 -0
- params_shard_137.bin +3 -0
- params_shard_138.bin +3 -0
- params_shard_139.bin +3 -0
- params_shard_14.bin +3 -0
mlc-chat-config.json
ADDED
@@ -0,0 +1,87 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"version": "0.1.0",
|
3 |
+
"model_type": "llama",
|
4 |
+
"quantization": "q4f32_1",
|
5 |
+
"model_config": {
|
6 |
+
"hidden_size": 8192,
|
7 |
+
"intermediate_size": 28672,
|
8 |
+
"num_attention_heads": 64,
|
9 |
+
"num_hidden_layers": 80,
|
10 |
+
"rms_norm_eps": 1e-05,
|
11 |
+
"vocab_size": 128256,
|
12 |
+
"tie_word_embeddings": false,
|
13 |
+
"position_embedding_base": 500000.0,
|
14 |
+
"rope_scaling": {
|
15 |
+
"factor": 8.0,
|
16 |
+
"high_freq_factor": 4.0,
|
17 |
+
"low_freq_factor": 1.0,
|
18 |
+
"original_max_position_embeddings": 8192,
|
19 |
+
"rope_type": "llama3"
|
20 |
+
},
|
21 |
+
"context_window_size": 131072,
|
22 |
+
"prefill_chunk_size": 8192,
|
23 |
+
"num_key_value_heads": 8,
|
24 |
+
"head_dim": 128,
|
25 |
+
"tensor_parallel_shards": 1,
|
26 |
+
"pipeline_parallel_stages": 1,
|
27 |
+
"max_batch_size": 128,
|
28 |
+
"disaggregation": false
|
29 |
+
},
|
30 |
+
"vocab_size": 128256,
|
31 |
+
"context_window_size": 131072,
|
32 |
+
"sliding_window_size": -1,
|
33 |
+
"prefill_chunk_size": 8192,
|
34 |
+
"attention_sink_size": -1,
|
35 |
+
"tensor_parallel_shards": 1,
|
36 |
+
"pipeline_parallel_stages": 1,
|
37 |
+
"temperature": 1.0,
|
38 |
+
"presence_penalty": 0.0,
|
39 |
+
"frequency_penalty": 0.0,
|
40 |
+
"repetition_penalty": 1.0,
|
41 |
+
"top_p": 1.0,
|
42 |
+
"tokenizer_files": [
|
43 |
+
"tokenizer.json",
|
44 |
+
"tokenizer_config.json"
|
45 |
+
],
|
46 |
+
"tokenizer_info": {
|
47 |
+
"token_postproc_method": "byte_level",
|
48 |
+
"prepend_space_in_encode": false,
|
49 |
+
"strip_space_in_decode": false
|
50 |
+
},
|
51 |
+
"conv_template": {
|
52 |
+
"name": "deepseek_v3",
|
53 |
+
"system_template": "<\uff5cbegin\u2581of\u2581sentence\uff5c>{system_message}",
|
54 |
+
"system_message": "You are a helpful assistant.",
|
55 |
+
"system_prefix_token_ids": null,
|
56 |
+
"add_role_after_system_message": true,
|
57 |
+
"roles": {
|
58 |
+
"user": "<\uff5cUser\uff5c>",
|
59 |
+
"assistant": "<\uff5cAssistant\uff5c>"
|
60 |
+
},
|
61 |
+
"role_templates": {
|
62 |
+
"user": "{user_message}",
|
63 |
+
"assistant": "{assistant_message}",
|
64 |
+
"tool": "{tool_message}"
|
65 |
+
},
|
66 |
+
"messages": [],
|
67 |
+
"seps": [
|
68 |
+
"",
|
69 |
+
"<\uff5cend\u2581of\u2581sentence\uff5c>"
|
70 |
+
],
|
71 |
+
"role_content_sep": "",
|
72 |
+
"role_empty_sep": "",
|
73 |
+
"stop_str": [],
|
74 |
+
"stop_token_ids": [
|
75 |
+
128001
|
76 |
+
],
|
77 |
+
"function_string": "",
|
78 |
+
"use_function_calling": false
|
79 |
+
},
|
80 |
+
"pad_token_id": 0,
|
81 |
+
"bos_token_id": 128000,
|
82 |
+
"eos_token_id": [
|
83 |
+
128001,
|
84 |
+
128008,
|
85 |
+
128009
|
86 |
+
]
|
87 |
+
}
|
ndarray-cache-b16.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5f06c49ec973144f3bb407cb37a1d20f157d59c11aeefbf034a506d09565ce4a
|
3 |
+
size 525336576
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:de198c859282d07e302964c39cc56fb945efb86e1b4702ac2f4dedd6faace2e2
|
3 |
+
size 65667072
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b491290f229b7fdfc4d434d832c2d0c5b66fe9e108fa410c26322fe7ce6e7476
|
3 |
+
size 234881024
|
params_shard_100.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:52596a8ce9588eb777f663e3f98789308bd70db2056be332dd8cca84d34482e6
|
3 |
+
size 29360128
|
params_shard_101.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9b3a7334639f873efa6e66a92d568a6011a98a698dc2531869b0183e810441da
|
3 |
+
size 117440512
|
params_shard_102.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a58dbdb5a782ce874b0df662d2f487c1d1f0289a7a758b4af77e3da33dd60d38
|
3 |
+
size 24150016
|
params_shard_103.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:70d9f6e2d3a6162418e2f404ec14c0db85ddfed3bd1e143ca820b428a521f535
|
3 |
+
size 41943040
|
params_shard_104.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4c8188114191521ffd512c990602d9b29a57dac4548035a51808660d3e3dfa73
|
3 |
+
size 33554432
|
params_shard_105.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0810abf4e1a45157b4a8aab7aedcece7d139abb6bb194aaec028b4ca16af8029
|
3 |
+
size 234881024
|
params_shard_106.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3563a5a62de1a70dabe9a13ca4c664c9471911b070f347340c2a0ba5cd35f7dd
|
3 |
+
size 29360128
|
params_shard_107.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:072e0408c2763c40f5b7ff73aa790fdf69288263b5858aa1993cf37e864a4db8
|
3 |
+
size 117440512
|
params_shard_108.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:721cb657946b6b2a92c2e756a25a1a67bb5781ec2838e7cc93ee49799daf049d
|
3 |
+
size 24150016
|
params_shard_109.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:06c2fc07ee4a01f73fa90ec4c1397335e484ae26bfd3b10e03423469b5bbedc1
|
3 |
+
size 41943040
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7b1b3f1bb0bce26b6422ee02999108a88c74f9e637124b1f347157b8632fb0c3
|
3 |
+
size 29360128
|
params_shard_110.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:740f7b8beb92976a574b984ba43eea061da965b10d9e3af52d5618097a2ce257
|
3 |
+
size 33554432
|
params_shard_111.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ff342cd518af5ab830dd42b044f379af56dcfdb549e5d0c2c304d5c95e4cf60c
|
3 |
+
size 234881024
|
params_shard_112.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4ab2cca2afb121d1cfac4681c37980a2cdb19627209d86e4edd0ea789c76ed57
|
3 |
+
size 29360128
|
params_shard_113.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d538c8df5ed4381c69ba61f568f7be890d98b7cec47d0d25788ed924fe35e68e
|
3 |
+
size 117440512
|
params_shard_114.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:227f0ef6c2de6f74c0fba1c1220b5315856d2b7d60e8edae0cf644ceb1f2c0cb
|
3 |
+
size 24150016
|
params_shard_115.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:80ac99e5c0cfed4c71431c908b9441f87ece53159bd69106e0d75a1253ad8e69
|
3 |
+
size 41943040
|
params_shard_116.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d694c4bf9095a12f66ed61ba9708bf9cd5bcfee5b02e8dfa6e75d57da83591de
|
3 |
+
size 33554432
|
params_shard_117.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aa1ec753c5de887ab9fd5ceaa7d98b0851867b79e80ea345c5bac66e7eb6369b
|
3 |
+
size 234881024
|
params_shard_118.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:613b77d65a81f724e66b01e9436d4b1eb80e65d4f702fbcde1b6d54775be961d
|
3 |
+
size 29360128
|
params_shard_119.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e9b1713e84ea9d98b67a62ea540cbf6df46ab0b389ebee407920a9aaf22b9b6a
|
3 |
+
size 117440512
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1a65930efa2593f2605f6986ccea46036a1f311c2be672b87a454562b8ff0b75
|
3 |
+
size 117440512
|
params_shard_120.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3523c3c2281297440b224117a53b20ef019ae5945237b4b34835d05477e4ca2a
|
3 |
+
size 24150016
|
params_shard_121.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0b7cb6bf928d2e970050b7981aed9aa09a214ff22057301e9739760e697d6a6f
|
3 |
+
size 41943040
|
params_shard_122.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2cc045e6234215c3f2ca4f3cba9a712dfe3044797d0a7a2fc3bca4945fa7dac3
|
3 |
+
size 33554432
|
params_shard_123.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bd486edbad5f3534ae1e5ae35b588fcbc9d98a3abf31e3c45c0e69fae094d324
|
3 |
+
size 234881024
|
params_shard_124.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4117d7b7e6f264aee86da7a55348a21424e0264ddeb7341e7971f0d8f1532d26
|
3 |
+
size 29360128
|
params_shard_125.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5ef76583a942e575936cd8ccb378d0154c857c94ae1eb4bfe47cb4c99edff271
|
3 |
+
size 117440512
|
params_shard_126.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:662f4d00bf7eb1b36c6b7da19afc59d87e845b68eef155a149c7d82d513c9f9a
|
3 |
+
size 24150016
|
params_shard_127.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c0947fc5b9c677832bd12a590e3de8289fdd8c2bde8261a7c45396db605d4cf7
|
3 |
+
size 41943040
|
params_shard_128.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0e0bdf4643278b87e02350a8984567ae1d7a218f73198371ac88f230f225d8dd
|
3 |
+
size 33554432
|
params_shard_129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:089434e0802f9e8edcb41a287e21d54eea618f399307b116e1c8a184d4d3fe0d
|
3 |
+
size 234881024
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4516288dc15756c349c34bdfde47cf74390c9340c0e9b39ebf8e35eb46be063f
|
3 |
+
size 41943040
|
params_shard_130.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:be107305fa3179cb34a8d8ff62399c1a5e36eaaf465a2b471fb580c05ac12475
|
3 |
+
size 29360128
|
params_shard_131.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:65bc20b1878eea63eed93c142284a87de56abccc93fe82349bdf6d8b0def6364
|
3 |
+
size 117440512
|
params_shard_132.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1fe38c74de656d97a7e3fa4e9e068e4750a1955ac4800eec42a08240c2a4206f
|
3 |
+
size 24150016
|
params_shard_133.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:37b1ace92132f0b4ad52777021a412c32762025c5fb72604ad5a6bc0b50fe975
|
3 |
+
size 41943040
|
params_shard_134.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aa72d08bdf084090a1f07d08b26df346835cb37a92c32daf5f24751857b1dfee
|
3 |
+
size 33554432
|
params_shard_135.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cc708eea0a71e69caf8a24a4ad55e104b36a5de57747d3804a14a7c26c3a805d
|
3 |
+
size 234881024
|
params_shard_136.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1696e0cf512990f8906bb03bd95ea5a4ab147e6623ef3d50af4e33c25499a976
|
3 |
+
size 29360128
|
params_shard_137.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:be24d99d33db858fdaebebf725d3480f1bfd1236449fba59d3a5f1a1d447f03a
|
3 |
+
size 117440512
|
params_shard_138.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cd0bf176d530fdc3e6ef8994638e1d104009d04e3a16b0e725cdbd2fd6a00fc0
|
3 |
+
size 24150016
|
params_shard_139.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:48a0456b539b68efb4233cbd33be15dcab386ddd38c2b706c14f7ae2127672b6
|
3 |
+
size 41943040
|
params_shard_14.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dd8bcf619427a3f85220c1b1b1701ce19eb35ab4b5c29fd816d217c55e943485
|
3 |
+
size 33554432
|