nerderlyne
committed on
Commit
·
37dd308
1
Parent(s):
a7dd7ad
add mlc weights
Browse files. This view is limited to 50 files because it contains too many changes.
See raw diff
- mlc-chat-config.json +83 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_100.bin +3 -0
- params_shard_101.bin +3 -0
- params_shard_102.bin +3 -0
- params_shard_103.bin +3 -0
- params_shard_104.bin +3 -0
- params_shard_105.bin +3 -0
- params_shard_106.bin +3 -0
- params_shard_107.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_14.bin +3 -0
- params_shard_15.bin +3 -0
- params_shard_16.bin +3 -0
- params_shard_17.bin +3 -0
- params_shard_18.bin +3 -0
- params_shard_19.bin +3 -0
- params_shard_2.bin +3 -0
- params_shard_20.bin +3 -0
- params_shard_21.bin +3 -0
- params_shard_22.bin +3 -0
- params_shard_23.bin +3 -0
- params_shard_24.bin +3 -0
- params_shard_25.bin +3 -0
- params_shard_26.bin +3 -0
- params_shard_27.bin +3 -0
- params_shard_28.bin +3 -0
- params_shard_29.bin +3 -0
- params_shard_3.bin +3 -0
- params_shard_30.bin +3 -0
- params_shard_31.bin +3 -0
- params_shard_32.bin +3 -0
- params_shard_33.bin +3 -0
- params_shard_34.bin +3 -0
- params_shard_35.bin +3 -0
- params_shard_36.bin +3 -0
- params_shard_37.bin +3 -0
- params_shard_38.bin +3 -0
- params_shard_39.bin +3 -0
- params_shard_4.bin +3 -0
- params_shard_40.bin +3 -0
- params_shard_41.bin +3 -0
- params_shard_42.bin +3 -0
- params_shard_43.bin +3 -0
- params_shard_44.bin +3 -0
mlc-chat-config.json
ADDED
@@ -0,0 +1,83 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"version": "0.1.0",
|
3 |
+
"field_model_type": "llama",
|
4 |
+
"quantization": "q4f16_1",
|
5 |
+
"field_model_config": {
|
6 |
+
"hidden_size": 4096,
|
7 |
+
"intermediate_size": 14336,
|
8 |
+
"num_attention_heads": 32,
|
9 |
+
"num_hidden_layers": 32,
|
10 |
+
"rms_norm_eps": 1e-05,
|
11 |
+
"vocab_size": 128256,
|
12 |
+
"position_embedding_base": 500000.0,
|
13 |
+
"context_window_size": 8192,
|
14 |
+
"prefill_chunk_size": 2048,
|
15 |
+
"num_key_value_heads": 8,
|
16 |
+
"head_dim": 128,
|
17 |
+
"tensor_parallel_shards": 1,
|
18 |
+
"max_batch_size": 80
|
19 |
+
},
|
20 |
+
"vocab_size": 128256,
|
21 |
+
"context_window_size": 8192,
|
22 |
+
"sliding_window_size": -1,
|
23 |
+
"prefill_chunk_size": 2048,
|
24 |
+
"attention_sink_size": -1,
|
25 |
+
"tensor_parallel_shards": 1,
|
26 |
+
"temperature": 0.6,
|
27 |
+
"presence_penalty": 0.0,
|
28 |
+
"frequency_penalty": 0.0,
|
29 |
+
"repetition_penalty": 1.0,
|
30 |
+
"top_p": 0.9,
|
31 |
+
"tokenizer_files": [
|
32 |
+
"tokenizer.json",
|
33 |
+
"tokenizer_config.json"
|
34 |
+
],
|
35 |
+
"tokenizer_info": {
|
36 |
+
"token_postproc_method": "byte_level",
|
37 |
+
"prepend_space_in_encode": false,
|
38 |
+
"strip_space_in_decode": false
|
39 |
+
},
|
40 |
+
"conv_template": {
|
41 |
+
"name": "llama-3",
|
42 |
+
"system_template": "<|start_header_id|>system<|end_header_id|>\n\n{system_message}",
|
43 |
+
"system_message": "You are a helpful, respectful and honest assistant.",
|
44 |
+
"system_prefix_token_ids": [
|
45 |
+
128000
|
46 |
+
],
|
47 |
+
"add_role_after_system_message": true,
|
48 |
+
"roles": {
|
49 |
+
"user": "user",
|
50 |
+
"assistant": "assistant"
|
51 |
+
},
|
52 |
+
"role_templates": {
|
53 |
+
"user": "{user_message}",
|
54 |
+
"assistant": "{assistant_message}",
|
55 |
+
"tool": "{tool_message}"
|
56 |
+
},
|
57 |
+
"messages": [],
|
58 |
+
"seps": [
|
59 |
+
"<|eot_id|><|start_header_id|>"
|
60 |
+
],
|
61 |
+
"role_content_sep": "<|end_header_id|>\n\n",
|
62 |
+
"role_empty_sep": "<|end_header_id|>\n\n",
|
63 |
+
"stop_str": [
|
64 |
+
"<|end_of_text|>",
|
65 |
+
"<|eot_id|>"
|
66 |
+
],
|
67 |
+
"stop_token_ids": [
|
68 |
+
128001,
|
69 |
+
128009
|
70 |
+
],
|
71 |
+
"function_string": "",
|
72 |
+
"use_function_calling": false
|
73 |
+
},
|
74 |
+
"pad_token_id": 0,
|
75 |
+
"bos_token_id": 128000,
|
76 |
+
"eos_token_id": [
|
77 |
+
128001,
|
78 |
+
128009
|
79 |
+
],
|
80 |
+
"mean_gen_len": 128,
|
81 |
+
"max_gen_len": 512,
|
82 |
+
"shift_fill_factor": 0.3
|
83 |
+
}
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:857135d05507431e76ef68864ca1e838f8c44db9e76070d49bc55ff3290745cb
|
3 |
+
size 262668288
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:32bb4c640f08430de4ef5aeee44aba6ca2513961ae5aa6ce38c55a8ef795f510
|
3 |
+
size 29360128
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3113debd5cb144463fb722940cbaeeba6c02a35630415230367cc0a736f023de
|
3 |
+
size 33046528
|
params_shard_100.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:23138e769636ebacebe160cbddb5b6dda6c3ab0c82e26fd2e0b884c1a38b6488
|
3 |
+
size 58720256
|
params_shard_101.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eefa85f77d8aa5542125b7f846e0bffe9b4c0a65c7069306edae9b6fd4ec45a6
|
3 |
+
size 25174016
|
params_shard_102.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:de4834f58f7c17f139ebe4b4e970c7c8aa786de393599f483e7121b90f4ae6c7
|
3 |
+
size 29360128
|
params_shard_103.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fdd75fa89a7eb548e609c6bdb32a320c95de308d0851d541d4db7241835a07a9
|
3 |
+
size 58720256
|
params_shard_104.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ef569c39a160c6d2ddb3ac3b673e8dbe2dcc82c1166ee325aa58f0ae5ac05607
|
3 |
+
size 33046528
|
params_shard_105.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:011d7b54897ecd070aa61091a241c33f3bab3223526d2d2d3ad397c59305f8f4
|
3 |
+
size 58720256
|
params_shard_106.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:59a50af753ca692e07ff9b7cf0d57d762ba6dd0677fc591542e81e0611a38987
|
3 |
+
size 32505856
|
params_shard_107.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c876d7dda82b1a45be15041ca4a08aaff1a338c1eaa1f606cef8f465ab243f6a
|
3 |
+
size 9437184
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4d0b82dc970cd1e729011a647b9456d610648bd1a19e7f43ed1448822d7941b9
|
3 |
+
size 29360128
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8b7a537c59f9a6fbefc0a182caf4a152be997aa96d6677fcbcb7dc317b65c3d0
|
3 |
+
size 58720256
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6ab36ce55c2ea569ada9c7d1dc94afd7593d7d6942cf7474c0543d6c4dabe4eb
|
3 |
+
size 22036480
|
params_shard_14.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0fda7bd7fa85199d4312fe9b81741996fdf58b4c039522a1870ebb2a23ec6702
|
3 |
+
size 29360128
|
params_shard_15.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eeb18791f603ca1179287a6f86eb73d91631f70fbba27e8928f6d2e05d3fe427
|
3 |
+
size 58720256
|
params_shard_16.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6280990996ca008f4294dec41941eaf06f769e9e1b7c8e84cce3e7735692d351
|
3 |
+
size 27271168
|
params_shard_17.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:db8c9fc8ab00cf1c74970a4ee54a665b4e8fa7f97f8adf16bb0a31a99cf1b916
|
3 |
+
size 29360128
|
params_shard_18.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:05a4c6d6f79757e594f2e1098b974462261e17500bc419e5e8c765224aee1dc8
|
3 |
+
size 30949376
|
params_shard_19.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aa205a817002deb0d3a4bd83887cee3222444ef6c1c56af34697f4f793fa6349
|
3 |
+
size 58720256
|
params_shard_2.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:63962a1a538ff2ecc296c6d07ff461247cfe1fa28950a97a7779dd80c4bb4d1e
|
3 |
+
size 32841728
|
params_shard_20.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:821426d2ecd0894768092bf097acfd945a116310841d22fcd5b490737593c456
|
3 |
+
size 25174016
|
params_shard_21.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a81872a9a50fe2b863f27152cde2fe06ff7342f9a2431ddd8bea80cd8558ae58
|
3 |
+
size 29360128
|
params_shard_22.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:09df1db31951ba2079f574751f9e600c274285d5d18035a1fd9e55e009fcfe03
|
3 |
+
size 58720256
|
params_shard_23.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c430932e2adb952ebab2207e256f550fc4e0f1ebc7bca0f339503ac0ec9fa0b1
|
3 |
+
size 33046528
|
params_shard_24.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f3e10d9d9b3c9a1b8455ac6db80d885b9148472e9350b02f3c1a4f05aa0396e4
|
3 |
+
size 29360128
|
params_shard_25.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f819c3c50b4c6e7a324e811bf63ad8e05c96291b608078e071d4a5b063b3d3ce
|
3 |
+
size 58720256
|
params_shard_26.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:70cbf8f4b31f1c748010c6c339f5c57ff80a2724d5ea410f9a24cb6c6be0d2ed
|
3 |
+
size 22036480
|
params_shard_27.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:85ba31099c12ea589c59fede0bc13858db07debf54e2b6d5b2d46db814b4aed7
|
3 |
+
size 29360128
|
params_shard_28.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:df7cf86f8737a99b78988fbce47678b3a1e8cadd71e005fb50a6d6f40ca017bb
|
3 |
+
size 58720256
|
params_shard_29.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a7c64f08e3f06ae38c16577c6d8ced726e491b093b6a6d4e295ebb49aa322955
|
3 |
+
size 27271168
|
params_shard_3.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:721892a1771fd7cc14f116366b08e4311cce9b4f36e747a260f84eea01046561
|
3 |
+
size 262668288
|
params_shard_30.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c33227273f264696a4c936c1731f2c53349cb2827af37863c2824d2bd0d54891
|
3 |
+
size 29360128
|
params_shard_31.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:097ea61b7330d9d4fd997306ec3cb3c34f4bcd55abfa6c9c7851c04e73b1ebb5
|
3 |
+
size 30949376
|
params_shard_32.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6a64285dd939df748c5f6f9d2cb928685a6b6e8a31379c0d4ff9d0a40a7467b2
|
3 |
+
size 58720256
|
params_shard_33.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:729e174ad4e8cfb63768a12f363c10370ede8631f18f5a5ecd3bcd0978fb19be
|
3 |
+
size 25174016
|
params_shard_34.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ec0b7526a7dc790413698dd1bdf8e38411401c4a4720800a81c899dbeb3e356b
|
3 |
+
size 29360128
|
params_shard_35.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e92c9eb0fc75f40834973350f42eef25d0fd6a2ec3e9f78a62bc00fc58986f71
|
3 |
+
size 58720256
|
params_shard_36.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:209a00ec235d7de73695f4d448c0ee87485b9bc7e35998e50f9621516fb48ff7
|
3 |
+
size 33046528
|
params_shard_37.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6256215b312a62397eb6d26061b4cdf08bb22cab537b2b8905a7f0cdb03a2ab5
|
3 |
+
size 29360128
|
params_shard_38.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5273c67ed08edcee180fddf88ba0e619b8b465124db569a330e1214e547c1deb
|
3 |
+
size 58720256
|
params_shard_39.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ee652ace3dcd14ea69e151ada835e18e4c2219d098fb54b20911cef79c4b0da5
|
3 |
+
size 22036480
|
params_shard_4.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2328a9e043f74b15f0843a8b02637a4b1b6e5925809c2dc53dd131aeefdc2958
|
3 |
+
size 32833536
|
params_shard_40.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0b3b70b51641f89d1e42eb44b739e2431873bc7cb94e58608ebcee6265b1ae5a
|
3 |
+
size 29360128
|
params_shard_41.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:932510721648b3964d674905d008dfeebdde6d3925f09b60f529dcca7f3e738d
|
3 |
+
size 58720256
|
params_shard_42.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:09340092155333b40a61cd5954e752720add151af9601066badf03643c277e1b
|
3 |
+
size 27271168
|
params_shard_43.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d1221c96a3c3a978e8c1a7ce21b71b3d5d8a234995c2a7a4d7fd39d2f453a81f
|
3 |
+
size 29360128
|
params_shard_44.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:41f2db46632c1c9ff17ed93b28458e9af0e1b0558e582e6a93f2b07ef69d0768
|
3 |
+
size 30949376
|