Upload 105 files
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- mlc-chat-config.json +82 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_14.bin +3 -0
- params_shard_15.bin +3 -0
- params_shard_16.bin +3 -0
- params_shard_17.bin +3 -0
- params_shard_18.bin +3 -0
- params_shard_19.bin +3 -0
- params_shard_2.bin +3 -0
- params_shard_20.bin +3 -0
- params_shard_21.bin +3 -0
- params_shard_22.bin +3 -0
- params_shard_23.bin +3 -0
- params_shard_24.bin +3 -0
- params_shard_25.bin +3 -0
- params_shard_26.bin +3 -0
- params_shard_27.bin +3 -0
- params_shard_28.bin +3 -0
- params_shard_29.bin +3 -0
- params_shard_3.bin +3 -0
- params_shard_30.bin +3 -0
- params_shard_31.bin +3 -0
- params_shard_32.bin +3 -0
- params_shard_33.bin +3 -0
- params_shard_34.bin +3 -0
- params_shard_35.bin +3 -0
- params_shard_36.bin +3 -0
- params_shard_37.bin +3 -0
- params_shard_38.bin +3 -0
- params_shard_39.bin +3 -0
- params_shard_4.bin +3 -0
- params_shard_40.bin +3 -0
- params_shard_41.bin +3 -0
- params_shard_42.bin +3 -0
- params_shard_43.bin +3 -0
- params_shard_44.bin +3 -0
- params_shard_45.bin +3 -0
- params_shard_46.bin +3 -0
- params_shard_47.bin +3 -0
- params_shard_48.bin +3 -0
- params_shard_49.bin +3 -0
- params_shard_5.bin +3 -0
- params_shard_50.bin +3 -0
- params_shard_51.bin +3 -0
mlc-chat-config.json
ADDED
@@ -0,0 +1,82 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"version": "0.1.0",
|
3 |
+
"model_type": "llama",
|
4 |
+
"quantization": "q4f16_0",
|
5 |
+
"model_config": {
|
6 |
+
"hidden_size": 4096,
|
7 |
+
"intermediate_size": 11008,
|
8 |
+
"num_attention_heads": 32,
|
9 |
+
"num_hidden_layers": 32,
|
10 |
+
"rms_norm_eps": 1e-05,
|
11 |
+
"vocab_size": 32000,
|
12 |
+
"tie_word_embeddings": false,
|
13 |
+
"position_embedding_base": 10000.0,
|
14 |
+
"rope_scaling": null,
|
15 |
+
"context_window_size": 4096,
|
16 |
+
"prefill_chunk_size": 4096,
|
17 |
+
"num_key_value_heads": 32,
|
18 |
+
"head_dim": 128,
|
19 |
+
"tensor_parallel_shards": 1,
|
20 |
+
"pipeline_parallel_stages": 1,
|
21 |
+
"max_batch_size": 128
|
22 |
+
},
|
23 |
+
"vocab_size": 32000,
|
24 |
+
"context_window_size": 4096,
|
25 |
+
"sliding_window_size": -1,
|
26 |
+
"prefill_chunk_size": 4096,
|
27 |
+
"attention_sink_size": -1,
|
28 |
+
"tensor_parallel_shards": 1,
|
29 |
+
"pipeline_parallel_stages": 1,
|
30 |
+
"temperature": 0.6,
|
31 |
+
"presence_penalty": 0.0,
|
32 |
+
"frequency_penalty": 0.0,
|
33 |
+
"repetition_penalty": 1.0,
|
34 |
+
"top_p": 0.9,
|
35 |
+
"tokenizer_files": [
|
36 |
+
"tokenizer.model",
|
37 |
+
"tokenizer.json",
|
38 |
+
"tokenizer_config.json"
|
39 |
+
],
|
40 |
+
"tokenizer_info": {
|
41 |
+
"token_postproc_method": "byte_fallback",
|
42 |
+
"prepend_space_in_encode": true,
|
43 |
+
"strip_space_in_decode": true
|
44 |
+
},
|
45 |
+
"conv_template": {
|
46 |
+
"name": "llama-2",
|
47 |
+
"system_template": "[INST] <<SYS>>\n{system_message}\n<</SYS>>\n\n",
|
48 |
+
"system_message": "You are a helpful, respectful and honest assistant.",
|
49 |
+
"system_prefix_token_ids": [
|
50 |
+
1
|
51 |
+
],
|
52 |
+
"add_role_after_system_message": false,
|
53 |
+
"roles": {
|
54 |
+
"user": "<s>[INST]",
|
55 |
+
"assistant": "[/INST]",
|
56 |
+
"tool": "[INST]"
|
57 |
+
},
|
58 |
+
"role_templates": {
|
59 |
+
"user": "{user_message}",
|
60 |
+
"assistant": "{assistant_message}",
|
61 |
+
"tool": "{tool_message}"
|
62 |
+
},
|
63 |
+
"messages": [],
|
64 |
+
"seps": [
|
65 |
+
" ",
|
66 |
+
" </s>"
|
67 |
+
],
|
68 |
+
"role_content_sep": " ",
|
69 |
+
"role_empty_sep": " ",
|
70 |
+
"stop_str": [
|
71 |
+
"[INST]"
|
72 |
+
],
|
73 |
+
"stop_token_ids": [
|
74 |
+
2
|
75 |
+
],
|
76 |
+
"function_string": "",
|
77 |
+
"use_function_calling": false
|
78 |
+
},
|
79 |
+
"pad_token_id": 0,
|
80 |
+
"bos_token_id": 1,
|
81 |
+
"eos_token_id": 2
|
82 |
+
}
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4a08a9af87db7ef06ad141f526c0478b642e002da26b8df7aab92102723e8e16
|
3 |
+
size 65536000
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f67996b1e419cd3e38a42243bb47393250b2a3dd0e5390e1d7d55551898e7323
|
3 |
+
size 28516288
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0adc56c9f7dc7c6122fa2dd2f8f474687fdd936ea6a2585fe2866b7fe911c688
|
3 |
+
size 31357952
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f6f4cc211d35c424e1621b2b2f2dd248cc80a4f6c29e666af8d54f9cc1ae7154
|
3 |
+
size 32135168
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:50a16bbf7eb5fc4a57d86f9ae6c36bb4a8e265758295b77090fc422559d35148
|
3 |
+
size 29647296
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:87845a38b56d5db51782b62adfd0f315948701135618ec7df51f6a94c1165ea7
|
3 |
+
size 33480704
|
params_shard_14.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:44f3c884cc7d9ff0de368bc23f14ca4e86835fb9315a772567ac29f1dfd96efc
|
3 |
+
size 28361216
|
params_shard_15.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:94537c3fd8663e575e57529392de4303b2e90931e9c33f85bb1573eb0f9ced25
|
3 |
+
size 29647296
|
params_shard_16.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b30467dc3ee9d989d790ec263ae533ff6ed5e11b0dc500eebbcfd8f6c84cf48d
|
3 |
+
size 33480704
|
params_shard_17.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eae47a0bd74ac395edb1cb689363db860fa9fe3c30f9f8bb3d6d3fa497b1d8e9
|
3 |
+
size 28361216
|
params_shard_18.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c1d52b9e01a41406efb05d559e20a833c3e351b514966384bcb07084a551d1a7
|
3 |
+
size 29647296
|
params_shard_19.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a92fc3bb48d66a150a35d29dbcc6bdf480cfaa11fc06869ab045e7203fa2a3fe
|
3 |
+
size 33480704
|
params_shard_2.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d8ef596ed88c50a7c8ce2c4356d684ff1336e1a5f20435f78bc6d979e83944c8
|
3 |
+
size 20362752
|
params_shard_20.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:af2afe77e83733d9e560e8e5cf53ce90bede1897bf029b7bb85581b5388cbb0a
|
3 |
+
size 28361216
|
params_shard_21.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:65a50d3021e4ebdde4213793a2daf2f9dc0998801b27c825998f1ff6d3369c5b
|
3 |
+
size 29647296
|
params_shard_22.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b183fdefff4b2aa5790f26a6bdb939d3cc880e4e475d759bc7ac9f165aa6eeb1
|
3 |
+
size 33480704
|
params_shard_23.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:139f1b65d4a94f0f499d721a4505fbc4d9db03c90393be1e5d7b4a7de5303460
|
3 |
+
size 28361216
|
params_shard_24.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:73fca47d2b1edbf9f1c6e120960f116d7b2e43d30f08835508b2bcebaed4ed9a
|
3 |
+
size 29647296
|
params_shard_25.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f2c2fc8b735598e901450ced02f6225e0d1de02c8605280e29e377c224164006
|
3 |
+
size 33480704
|
params_shard_26.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f75bdcefff674e56400454226babe2a80f69a5292b38f9eeea921913487f3294
|
3 |
+
size 28353024
|
params_shard_27.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:09847e1228969c78d84e768ac1e4ee97d52d16d5e29935a92504b4bcbf84dda4
|
3 |
+
size 31804416
|
params_shard_28.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:96064ced43a2ec3365c8b0254eefc15133bfa3a85131b3afb0bc4ed8efdbdd2f
|
3 |
+
size 24527360
|
params_shard_29.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3bc6150d89a6c06be08cce1407623eda4e25f04dd6d67337239a5a137cf4def0
|
3 |
+
size 29647296
|
params_shard_3.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:54f331d991a8243d8273256f63bd2234505f3d0109f1fe86972d2c83ca661b74
|
3 |
+
size 31812608
|
params_shard_30.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5a74d9e7b1e3fc07e9f726acb421e613774c2651b811e934eb239ba812b40403
|
3 |
+
size 33480704
|
params_shard_31.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:21f680bff4ab5207dc09d9094a4284ea7e4449fbaba0c1ecece30223bc47891f
|
3 |
+
size 28361216
|
params_shard_32.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f0d446e93a0d24ade17ced8e4155ab6a72d0d6232a3249f8b5359d42d3624207
|
3 |
+
size 29647296
|
params_shard_33.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0c9e8dbfbe3d4a379feb3e7c75ebedf2565a502c4f9e8a88158e7b136ba27d0c
|
3 |
+
size 33480704
|
params_shard_34.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8098a5747574188a3e0bc5e0da3b8e727d8f9c5d7950268d74c857e4dce26ccc
|
3 |
+
size 28361216
|
params_shard_35.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b9033b6775c0cc5570bc90765789b2337965663ff9d32b69580ad7189a2a9947
|
3 |
+
size 29647296
|
params_shard_36.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dd057b40d2e2b193322804cd5cd88e4823bd221a1f2dd88af3c2775ecfab8efd
|
3 |
+
size 33480704
|
params_shard_37.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cf680991e2ea76e4b39972f0c783855f6cf3b11d0d76512f8f0ba3031f057206
|
3 |
+
size 28361216
|
params_shard_38.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f2ca2bda542b25839747c051b4e39c5c1549bf24214d36b5baccfe98fb0638a2
|
3 |
+
size 29647296
|
params_shard_39.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c543d0fb726848dfae35a6a7736518f27c2ffaf7edd594b9ef4a03cc0f405585
|
3 |
+
size 33480704
|
params_shard_4.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d3715937055671d4cc67feec54ac07a6166c7242dd194689c796340c9a5c93c0
|
3 |
+
size 20693504
|
params_shard_40.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ada057075fe2085d032f16817484ff384837c1670873c7fcaffd0ad9fbbb17cc
|
3 |
+
size 28361216
|
params_shard_41.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:05a8ed8be9fc53d42ab7f7489ba06ddee65fc817e9ccd543a31be6b8bf84ebef
|
3 |
+
size 29647296
|
params_shard_42.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:558843e18dad2ca23b8d9c2388844b4c2c8126503d90d3d50fe10cdcc999ca94
|
3 |
+
size 33480704
|
params_shard_43.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9c8c335937e17cacdffd3a722b95cae54d11a28fa8bb3c75541f4774749ee366
|
3 |
+
size 28361216
|
params_shard_44.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8e1945bea13ca6e77e710100bff42d16c54665f1042ea4150231f5222310a5b2
|
3 |
+
size 29647296
|
params_shard_45.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c35a8e17a26516740e69aa162632be1a67dd106550c30121a621003c06229cd8
|
3 |
+
size 33480704
|
params_shard_46.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1e6863ecf5384a9d3d7b7c7c223f34b47a4f39dec934042062fd2fd9ad331ed6
|
3 |
+
size 28361216
|
params_shard_47.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cf5c072714875446f1f48de4e3921e77c466553e4f7c90719f9279dfc05cc49b
|
3 |
+
size 29647296
|
params_shard_48.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7e68af24b987c56be949ebb77c52acb3b5e7f70ca10c034dd0593ecb29759cd1
|
3 |
+
size 33480704
|
params_shard_49.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e5c20c2643c279a05c96318b24f998ae01426c2bdb96b8e0a64586575a1f9707
|
3 |
+
size 28361216
|
params_shard_5.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dd1f9953d48053550cec396ebac8125b6c180b6b304fc8c359e80b6010fdacc6
|
3 |
+
size 29647296
|
params_shard_50.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c0fa8f41e3a17dc7b85801b6352060951ff636ae7dbb1275d1f1c4bb05ee8137
|
3 |
+
size 29647296
|
params_shard_51.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:be79ba7e4f488820e50b3965c28b8a1aea8bf35ac81113d12adf28d882da9fd2
|
3 |
+
size 33480704
|