Upload folder using huggingface_hub
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- mlc-chat-config.json +76 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_100.bin +3 -0
- params_shard_101.bin +3 -0
- params_shard_102.bin +3 -0
- params_shard_103.bin +3 -0
- params_shard_104.bin +3 -0
- params_shard_105.bin +3 -0
- params_shard_106.bin +3 -0
- params_shard_107.bin +3 -0
- params_shard_108.bin +3 -0
- params_shard_109.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_110.bin +3 -0
- params_shard_111.bin +3 -0
- params_shard_112.bin +3 -0
- params_shard_113.bin +3 -0
- params_shard_114.bin +3 -0
- params_shard_115.bin +3 -0
- params_shard_116.bin +3 -0
- params_shard_117.bin +3 -0
- params_shard_118.bin +3 -0
- params_shard_119.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_120.bin +3 -0
- params_shard_121.bin +3 -0
- params_shard_122.bin +3 -0
- params_shard_123.bin +3 -0
- params_shard_124.bin +3 -0
- params_shard_125.bin +3 -0
- params_shard_126.bin +3 -0
- params_shard_127.bin +3 -0
- params_shard_128.bin +3 -0
- params_shard_129.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_130.bin +3 -0
- params_shard_131.bin +3 -0
- params_shard_132.bin +3 -0
- params_shard_133.bin +3 -0
- params_shard_134.bin +3 -0
- params_shard_135.bin +3 -0
- params_shard_136.bin +3 -0
- params_shard_137.bin +3 -0
- params_shard_138.bin +3 -0
- params_shard_139.bin +3 -0
- params_shard_14.bin +3 -0
- params_shard_140.bin +3 -0
mlc-chat-config.json
ADDED
@@ -0,0 +1,76 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"version": "0.1.0",
|
3 |
+
"model_type": "qwen2",
|
4 |
+
"quantization": "q0f16",
|
5 |
+
"model_config": {
|
6 |
+
"hidden_act": "silu",
|
7 |
+
"hidden_size": 5120,
|
8 |
+
"intermediate_size": 13824,
|
9 |
+
"num_attention_heads": 40,
|
10 |
+
"num_hidden_layers": 48,
|
11 |
+
"num_key_value_heads": 8,
|
12 |
+
"rms_norm_eps": 1e-05,
|
13 |
+
"rope_theta": 1000000.0,
|
14 |
+
"vocab_size": 152064,
|
15 |
+
"tie_word_embeddings": false,
|
16 |
+
"context_window_size": 131072,
|
17 |
+
"prefill_chunk_size": 8192,
|
18 |
+
"tensor_parallel_shards": 1,
|
19 |
+
"head_dim": 128,
|
20 |
+
"dtype": "float32",
|
21 |
+
"max_batch_size": 128
|
22 |
+
},
|
23 |
+
"vocab_size": 152064,
|
24 |
+
"context_window_size": 131072,
|
25 |
+
"sliding_window_size": -1,
|
26 |
+
"prefill_chunk_size": 8192,
|
27 |
+
"attention_sink_size": -1,
|
28 |
+
"tensor_parallel_shards": 1,
|
29 |
+
"pipeline_parallel_stages": 1,
|
30 |
+
"temperature": 1.0,
|
31 |
+
"presence_penalty": 0.0,
|
32 |
+
"frequency_penalty": 0.0,
|
33 |
+
"repetition_penalty": 1.0,
|
34 |
+
"top_p": 1.0,
|
35 |
+
"tokenizer_files": [
|
36 |
+
"tokenizer.json",
|
37 |
+
"tokenizer_config.json"
|
38 |
+
],
|
39 |
+
"tokenizer_info": {
|
40 |
+
"token_postproc_method": "byte_level",
|
41 |
+
"prepend_space_in_encode": false,
|
42 |
+
"strip_space_in_decode": false
|
43 |
+
},
|
44 |
+
"conv_template": {
|
45 |
+
"name": "deepseek_v3",
|
46 |
+
"system_template": "<\uff5cbegin\u2581of\u2581sentence\uff5c>{system_message}",
|
47 |
+
"system_message": "You are a helpful assistant.",
|
48 |
+
"system_prefix_token_ids": null,
|
49 |
+
"add_role_after_system_message": true,
|
50 |
+
"roles": {
|
51 |
+
"user": "<\uff5cUser\uff5c>",
|
52 |
+
"assistant": "<\uff5cAssistant\uff5c>"
|
53 |
+
},
|
54 |
+
"role_templates": {
|
55 |
+
"user": "{user_message}",
|
56 |
+
"assistant": "{assistant_message}",
|
57 |
+
"tool": "{tool_message}"
|
58 |
+
},
|
59 |
+
"messages": [],
|
60 |
+
"seps": [
|
61 |
+
"",
|
62 |
+
"<\uff5cend\u2581of\u2581sentence\uff5c>"
|
63 |
+
],
|
64 |
+
"role_content_sep": "",
|
65 |
+
"role_empty_sep": "",
|
66 |
+
"stop_str": [],
|
67 |
+
"stop_token_ids": [
|
68 |
+
151643
|
69 |
+
],
|
70 |
+
"function_string": "",
|
71 |
+
"use_function_calling": false
|
72 |
+
},
|
73 |
+
"pad_token_id": 0,
|
74 |
+
"bos_token_id": 151643,
|
75 |
+
"eos_token_id": 151643
|
76 |
+
}
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:335cc247586fe9125d7f4699c5afdd438f08f60cb44e69a8318e50add1d8e94b
|
3 |
+
size 1557135360
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ec04b6e1cc047ece50b4900265269eba664545770449454c689da4fcada67449
|
3 |
+
size 73400320
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4be1c2f0193fda0cc3e47699ddbac064d18591573df0d7c20375e9a44ede721b
|
3 |
+
size 52428800
|
params_shard_100.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c8cb559ab4385578d3b51f7a8be19c7070546e4ef9c1bf656452f494697399a4
|
3 |
+
size 141557760
|
params_shard_101.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:594512711d9bb7c09477ba83f8c1a3976e85be351c798d07c85ad2f41014c06f
|
3 |
+
size 73400320
|
params_shard_102.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f95560dce696e844438c640d9b909651a507b7cebf4d70858a7dfc9a6dd28f55
|
3 |
+
size 52428800
|
params_shard_103.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:15077d097256c5c38f4f1be750fb5c8e0590ff7c1a08e1dbac137b9e3f3adb25
|
3 |
+
size 283115520
|
params_shard_104.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9fcab2540b9c65b37b874d4e1c1b1113a88a150503a02b091c3f3ea939a607c0
|
3 |
+
size 141557760
|
params_shard_105.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b7be0c507a258ba42ba51a3f590a0f93be666b0d6856b27f063fd67953466d80
|
3 |
+
size 73400320
|
params_shard_106.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3113cc3a9f660ce4f769157624a1a1dfe72552566fe2fb40b7c7c4bca49cc1b9
|
3 |
+
size 52428800
|
params_shard_107.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6d58f5674119421dcebdbc00f7562776e22c633ca7235b540521e9631d1c0174
|
3 |
+
size 283115520
|
params_shard_108.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f4da03dc305b5106bfa0899d307d42a16a1ac654d9127cfc6730f930c1aa46ca
|
3 |
+
size 141557760
|
params_shard_109.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bfb0045a760790d1bb1f3c27d486e7be73ce70487e8591ff6dd0ddd583974e50
|
3 |
+
size 73400320
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:938904c93a3ab4008fafc63d82adf99698e0207318948a3fa4a124b1359c90c4
|
3 |
+
size 283115520
|
params_shard_110.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:443d2c4eda958a6390b3eaa3b3e00fab8f62f179021ff7c082c8e11fe582da6c
|
3 |
+
size 52428800
|
params_shard_111.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:33fd72d87ee5428760064d7ede2fb810a66e83931868a9b171081086882c6d21
|
3 |
+
size 283115520
|
params_shard_112.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:601f2c83ed167737e2975e0226cca008e8c28f40ecd9179489bb2bfe9b240290
|
3 |
+
size 141557760
|
params_shard_113.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f73a513f1f169ded816ccfd9dcd3097e5b8a98ea1cae6b51258c562c86089611
|
3 |
+
size 73400320
|
params_shard_114.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:11831009a368f2b30b0955c8738a3982cd420c1788f9b8344e21a487541ea0a8
|
3 |
+
size 52428800
|
params_shard_115.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:de623de49c845b9c50143de71dc90ba226412c6a50ad9d536b86f081f4b365e8
|
3 |
+
size 283115520
|
params_shard_116.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:70bc25c270f8aa9e950a2778e96595ff73061d7ad626cf364600f7502440eeff
|
3 |
+
size 141557760
|
params_shard_117.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7c4a325fb504f3f8ce09d5c03971476a135902e3d1009de9e224141d78a77173
|
3 |
+
size 73400320
|
params_shard_118.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:97b39a61d60cc4856f4e0fb6939bde77a1309876e77df9a9c1afa7726fbf5a25
|
3 |
+
size 52428800
|
params_shard_119.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f567de7f4b63f12735cc3dded6825f3b6a596c236d3a61a9baee0253442e482c
|
3 |
+
size 283115520
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2a0050b28f87e5b3c182cc6bf4baeb6ec78cab9c88dda93333da2e8cfcdac3e3
|
3 |
+
size 141557760
|
params_shard_120.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7c89869ad6f3892bfd463f179c8b00b15ea1fe9648406c09f6fdc26063cf0353
|
3 |
+
size 141557760
|
params_shard_121.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:01a2894f27141ac0374ecbe8078dbaeff43886de1bcae99d9f1f825430e37137
|
3 |
+
size 73400320
|
params_shard_122.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:82cdfe10a7826a5bc55f54e61e3e244dfcdbcece4fd764dde05b178eb455bcc1
|
3 |
+
size 52428800
|
params_shard_123.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:66dad0b39b774c0b755283dbf6a2a43b335fbb7666aebe0ea69794bec02fe2a5
|
3 |
+
size 283115520
|
params_shard_124.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9faecfbe268a60c708dfbc20db3c99a990a8cd58e1ddc0b184f3983ddb983885
|
3 |
+
size 141557760
|
params_shard_125.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f7353db87d949889b89c9d411f45b85933177a200ce87ac32ffab44432725548
|
3 |
+
size 73400320
|
params_shard_126.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8c8805858237e78d0cd1927843b6ed4a2c08d3ce6caf0765304f3059efe6b6db
|
3 |
+
size 52428800
|
params_shard_127.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:52b5914bfade891ed9189b546032104bc2f92f429894a901f994bb0b2ce1ad13
|
3 |
+
size 283115520
|
params_shard_128.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:24cd3a7390d944a81418f2d3759ac8983d30f3b80902c8206348b8d485a9a418
|
3 |
+
size 141557760
|
params_shard_129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:761cb4cbfd0ce5f2f8ed703dd0560500d18f01625270e36b64bccdc70636c8d1
|
3 |
+
size 73400320
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9fd43fe30d6690495b7976fb66cecd0e2782f51c5deb520305b892501c87f926
|
3 |
+
size 73400320
|
params_shard_130.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0dcccf82aceaeffa76f20a079189b9a2f7b7c5af727857bc07af120a272318ac
|
3 |
+
size 52428800
|
params_shard_131.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:47e32aa6006b9923f01a6b19b340c45ab4cb802a5429b306273fccdbd7660161
|
3 |
+
size 283115520
|
params_shard_132.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f31af1428f327734e8efa48e258aae0f14510446ccca5755933dd4375304bce1
|
3 |
+
size 141557760
|
params_shard_133.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c5d5bcf8cfa3d242bde170ed3c5e33cf0a3b86f093388351d2d25bdcc579e1b3
|
3 |
+
size 73400320
|
params_shard_134.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8718b29d65bfb40a77ae5296bc49cf4e1c7d9e73c3ecb49475ca4f574f8cb334
|
3 |
+
size 52428800
|
params_shard_135.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5d8010f342f810567a2facd5e27a04e12674e67364f83cd2c98f861e9d726023
|
3 |
+
size 283115520
|
params_shard_136.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b6b1acaa577cce194314429b9656914022ce87fa058b437babdcbdd3507ee040
|
3 |
+
size 141557760
|
params_shard_137.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:037647b5f138ab2364527613a90ab666322f05dbfa30f9d176a98a4a0de99a0c
|
3 |
+
size 73400320
|
params_shard_138.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a7c0c1dde5e47d21b3445392eafdfe9ac49a997c796adc370dbb5b91192e92f0
|
3 |
+
size 52428800
|
params_shard_139.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a60efe31d6c86a0e0d09268dc05820a51801c0994b125bc0b17e54660f3ae8f6
|
3 |
+
size 283115520
|
params_shard_14.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8f21b3d5ec963a64a0766498766e824926a59b2ab8558c20ef1ec659caeed10a
|
3 |
+
size 52428800
|
params_shard_140.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0f2ac2d3b8a36f88224db4163c106b4b2619a93d07f4af1b46cc52d17226c882
|
3 |
+
size 141557760
|