Upload folder using huggingface_hub
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- mlc-chat-config.json +76 -0
- ndarray-cache-b16.json +0 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_14.bin +3 -0
- params_shard_15.bin +3 -0
- params_shard_16.bin +3 -0
- params_shard_17.bin +3 -0
- params_shard_18.bin +3 -0
- params_shard_19.bin +3 -0
- params_shard_2.bin +3 -0
- params_shard_20.bin +3 -0
- params_shard_21.bin +3 -0
- params_shard_22.bin +3 -0
- params_shard_23.bin +3 -0
- params_shard_24.bin +3 -0
- params_shard_25.bin +3 -0
- params_shard_26.bin +3 -0
- params_shard_27.bin +3 -0
- params_shard_28.bin +3 -0
- params_shard_29.bin +3 -0
- params_shard_3.bin +3 -0
- params_shard_30.bin +3 -0
- params_shard_31.bin +3 -0
- params_shard_32.bin +3 -0
- params_shard_33.bin +3 -0
- params_shard_34.bin +3 -0
- params_shard_35.bin +3 -0
- params_shard_36.bin +3 -0
- params_shard_37.bin +3 -0
- params_shard_38.bin +3 -0
- params_shard_39.bin +3 -0
- params_shard_4.bin +3 -0
- params_shard_40.bin +3 -0
- params_shard_41.bin +3 -0
- params_shard_42.bin +3 -0
- params_shard_43.bin +3 -0
- params_shard_44.bin +3 -0
- params_shard_45.bin +3 -0
- params_shard_46.bin +3 -0
- params_shard_47.bin +3 -0
- params_shard_48.bin +3 -0
- params_shard_49.bin +3 -0
- params_shard_5.bin +3 -0
- params_shard_50.bin +3 -0
mlc-chat-config.json
ADDED
@@ -0,0 +1,76 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"version": "0.1.0",
|
3 |
+
"model_type": "qwen2",
|
4 |
+
"quantization": "q4f32_1",
|
5 |
+
"model_config": {
|
6 |
+
"hidden_act": "silu",
|
7 |
+
"hidden_size": 3584,
|
8 |
+
"intermediate_size": 18944,
|
9 |
+
"num_attention_heads": 28,
|
10 |
+
"num_hidden_layers": 28,
|
11 |
+
"num_key_value_heads": 4,
|
12 |
+
"rms_norm_eps": 1e-06,
|
13 |
+
"rope_theta": 10000,
|
14 |
+
"vocab_size": 152064,
|
15 |
+
"tie_word_embeddings": false,
|
16 |
+
"context_window_size": 131072,
|
17 |
+
"prefill_chunk_size": 8192,
|
18 |
+
"tensor_parallel_shards": 1,
|
19 |
+
"head_dim": 128,
|
20 |
+
"dtype": "float32",
|
21 |
+
"max_batch_size": 128
|
22 |
+
},
|
23 |
+
"vocab_size": 152064,
|
24 |
+
"context_window_size": 131072,
|
25 |
+
"sliding_window_size": -1,
|
26 |
+
"prefill_chunk_size": 8192,
|
27 |
+
"attention_sink_size": -1,
|
28 |
+
"tensor_parallel_shards": 1,
|
29 |
+
"pipeline_parallel_stages": 1,
|
30 |
+
"temperature": 1.0,
|
31 |
+
"presence_penalty": 0.0,
|
32 |
+
"frequency_penalty": 0.0,
|
33 |
+
"repetition_penalty": 1.0,
|
34 |
+
"top_p": 1.0,
|
35 |
+
"tokenizer_files": [
|
36 |
+
"tokenizer.json",
|
37 |
+
"tokenizer_config.json"
|
38 |
+
],
|
39 |
+
"tokenizer_info": {
|
40 |
+
"token_postproc_method": "byte_level",
|
41 |
+
"prepend_space_in_encode": false,
|
42 |
+
"strip_space_in_decode": false
|
43 |
+
},
|
44 |
+
"conv_template": {
|
45 |
+
"name": "deepseek_v3",
|
46 |
+
"system_template": "<\uff5cbegin\u2581of\u2581sentence\uff5c>{system_message}",
|
47 |
+
"system_message": "You are a helpful assistant.",
|
48 |
+
"system_prefix_token_ids": null,
|
49 |
+
"add_role_after_system_message": true,
|
50 |
+
"roles": {
|
51 |
+
"user": "<\uff5cUser\uff5c>",
|
52 |
+
"assistant": "<\uff5cAssistant\uff5c>"
|
53 |
+
},
|
54 |
+
"role_templates": {
|
55 |
+
"user": "{user_message}",
|
56 |
+
"assistant": "{assistant_message}",
|
57 |
+
"tool": "{tool_message}"
|
58 |
+
},
|
59 |
+
"messages": [],
|
60 |
+
"seps": [
|
61 |
+
"",
|
62 |
+
"<\uff5cend\u2581of\u2581sentence\uff5c>"
|
63 |
+
],
|
64 |
+
"role_content_sep": "",
|
65 |
+
"role_empty_sep": "",
|
66 |
+
"stop_str": [],
|
67 |
+
"stop_token_ids": [
|
68 |
+
151643
|
69 |
+
],
|
70 |
+
"function_string": "",
|
71 |
+
"use_function_calling": false
|
72 |
+
},
|
73 |
+
"pad_token_id": 0,
|
74 |
+
"bos_token_id": 151643,
|
75 |
+
"eos_token_id": 151643
|
76 |
+
}
|
ndarray-cache-b16.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9f8cc84038e8523b802677f4e2dbbf8e49bc0e129e9df6fbb8c43cf8b6218f4a
|
3 |
+
size 272498688
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a5bf6ac1a0abd881191c7666a43999ef868547f034010288678d7c8e8335566a
|
3 |
+
size 34062336
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f6d6e8cf46604d6f0443d31082ebaf3b5541030b35ff860c992b97557a71c3bc
|
3 |
+
size 29268992
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7dcb5d9221a2a474fc09d11b17e927a5509edef35992a2363e0f2d3afa8e182c
|
3 |
+
size 67895296
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c897d17a5de7f21e69bd237fafeaf1b8ba211952af361d1c59364bcc40c66330
|
3 |
+
size 33947648
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:41a297bbae858e782d2b87b917592494d4674bb2d47c2e9be3b00f70fc7b58e8
|
3 |
+
size 29268992
|
params_shard_14.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c243b337321a106d79026d1774b734fe00f7e2aafea5242e9325478126307546
|
3 |
+
size 67895296
|
params_shard_15.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a03349a358488ab9fb209b00b1b89cc8d479fbe7578bd0e73cb90e3e55c84bf7
|
3 |
+
size 33947648
|
params_shard_16.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7fdaa93935d8621699dc68fbdb7508a1a685d12bf9a17c6e7d4f2f6e531b482b
|
3 |
+
size 29268992
|
params_shard_17.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a77ce00c076fb0f1408d88d1240668e84506d40af983a8bc533201fc2d16fefe
|
3 |
+
size 67895296
|
params_shard_18.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c4f7bb72d49752750f5ff7f43c77f4a02f39333baf5ab7dd3bbafe1809dc7424
|
3 |
+
size 33947648
|
params_shard_19.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4b65b8cc3dbda6ab6a9c90ab85698b33eae509eaaa0438c4e94ccb235e5934fd
|
3 |
+
size 29268992
|
params_shard_2.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6626469a188a06be97c511e28cbdafece569c28e06f5f2e346ebfcb766de5409
|
3 |
+
size 67895296
|
params_shard_20.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a31d2e718966578ca93337b35190da349d56dc3541e2fab010486ac3a236ff6d
|
3 |
+
size 67895296
|
params_shard_21.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a971e5606b5aaeeed23ab6a7f976bc4c59afdf5f3fde42ed1a0f268a1d0e42aa
|
3 |
+
size 33947648
|
params_shard_22.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:06a123b7d0de287dbcd0bd3215cb290fefce5aaa8319fa4115c87693cc40b498
|
3 |
+
size 29268992
|
params_shard_23.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0a99d4033411b79c7ceb2cb94cb5de1f9817ef27a82900ed3959ba008249857f
|
3 |
+
size 67895296
|
params_shard_24.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ab9b8f18f1c3c7fffb7bf900ebbd5997eeef6d7f68642458184d732636216f02
|
3 |
+
size 33947648
|
params_shard_25.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ccf5e2e00822e2916950282837a1fbe469e0861b0afd5d0e94289dc2fed54d9d
|
3 |
+
size 29268992
|
params_shard_26.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:432bda5577ae25f83884a7acef1026132a61b9d63c8ca6dd4634e4a67b8b9ea2
|
3 |
+
size 67895296
|
params_shard_27.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0379355297c1a9976474116c129a0f08f2655e238b97171e322de51f0c923cd9
|
3 |
+
size 33947648
|
params_shard_28.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3b7bc6e900707c0c4ff5a969963d02dea80e0c75f04352a70b89a7653096495a
|
3 |
+
size 29268992
|
params_shard_29.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7b92d7d7d035f631a1a973bbdbe0e6370fbb1c2f8794862e03a084e835053aa6
|
3 |
+
size 67895296
|
params_shard_3.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:90057b01221fc820d85168d749ebf5928693f3aa633d14b77fa1a6c0ae97a2b4
|
3 |
+
size 33947648
|
params_shard_30.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:24743b0006e50b2995c0d6d6cbc2007b3725dc6c0da7750ffdbdd41471be4add
|
3 |
+
size 33947648
|
params_shard_31.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:95b86fb40495fa97b24fd54fa311a61201a4a077a6d955c8919e81768c4fdd3f
|
3 |
+
size 29268992
|
params_shard_32.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7d3300b6651bbca31fae88360184a97019a4d4a5f22f2e82ff1dc195fe2921a5
|
3 |
+
size 67895296
|
params_shard_33.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8f496715ec3362b325a77cb21488ec0933925eb00da3fd404d3cd5001b70da22
|
3 |
+
size 33947648
|
params_shard_34.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3dfb934f7f420d6eac6d4518edfba1a04c2e80658765e4bd14dfce08ad28450e
|
3 |
+
size 29268992
|
params_shard_35.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:149185a664e1236d2eb406a2a751462961430cb349d29ffbf00dce3d1588f2a5
|
3 |
+
size 67895296
|
params_shard_36.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bae7193ea218b5ac4f6da7297bc3000611f56371d881d9074b61597624401a88
|
3 |
+
size 33947648
|
params_shard_37.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:62b30a876f0a203cbbe0c436b95429638ec166a89262879b05bd004e8c7a638a
|
3 |
+
size 29268992
|
params_shard_38.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2c3d503c3dc32a2b3b7335868e06577759f7953415a094b0b33b7b7cd8eb69f8
|
3 |
+
size 67895296
|
params_shard_39.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6dfb5e3016b1457e8c8bfe9c63cda4fc48ba9dbf23ecb6994baf648ebf9f3fc9
|
3 |
+
size 33947648
|
params_shard_4.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:11fb97da90e7f1bac0492e1f03141a7300b0f1df5117b8a381ddd936b13e26f7
|
3 |
+
size 29278208
|
params_shard_40.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6da5cd40f50b4385de8d58fc215db9e7ae73b6c19dffa50e8050492290db0122
|
3 |
+
size 29268992
|
params_shard_41.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6c46836e3e32c23a4dc72142c338d290a6e202375a02acda7302a0811bd2a0ba
|
3 |
+
size 67895296
|
params_shard_42.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:28f2ed0048a5bab04e5fcfbcf517433e29d7bb5655e8428e44a9ced57b5b4246
|
3 |
+
size 33947648
|
params_shard_43.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:72fef46b69181bce2380c6352502466e9a4236cb595248dfbd21e4189637338f
|
3 |
+
size 29268992
|
params_shard_44.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4c254252af308d25408178a3673f46a60935b00c98001b1a29434d60fcf71fd1
|
3 |
+
size 67895296
|
params_shard_45.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0427d5e73cc63fb8605e817dcfd8a9dacdc0bd63e52bc7f30c82b965730d415d
|
3 |
+
size 33947648
|
params_shard_46.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:22bbe837a51ddcb2c0476441aa042282d87e20c00d3ad8a7d31102e2c441ad23
|
3 |
+
size 29268992
|
params_shard_47.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:96f8c32fcbb30a490e94974fe49d1af6143a3b0eaabf1b016b66c1f55dce051b
|
3 |
+
size 67895296
|
params_shard_48.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cad654fe1554a1f94285f958acf2a49e3a7a541fa16865731f8b8b9a02b4462b
|
3 |
+
size 33947648
|
params_shard_49.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d4827694ce0bbabc4a0086bd16ef9509c738bb9eb14fabbb08e5e1a11b64fed9
|
3 |
+
size 29268992
|
params_shard_5.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aca7de6593754a5841d69e6642a84693ee95a8daaeb741a698e72696c1ae6c3a
|
3 |
+
size 67895296
|
params_shard_50.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cca92e4f48f9625479c3e0d0204062577f3239575eedddfcdb5f732feef0a26c
|
3 |
+
size 67895296
|