F451-q4f16_1-MLC / mlc-chat-config.json
HigherMind's picture
Upload mlc-chat-config.json with huggingface_hub
287a1f8 verified
raw
history blame
2.09 kB
{
"version": "0.1.0",
"model_type": "mistral",
"quantization": "q4f16_1",
"model_config": {
"hidden_size": 4096,
"intermediate_size": 14336,
"num_attention_heads": 32,
"num_hidden_layers": 32,
"rms_norm_eps": 1e-05,
"vocab_size": 32768,
"position_embedding_base": 1000000.0,
"num_key_value_heads": 8,
"head_dim": 128,
"context_window_size": 32768,
"sliding_window_size": 2048,
"prefill_chunk_size": 128,
"attention_sink_size": 4,
"tensor_parallel_shards": 1,
"max_batch_size": 128
},
"vocab_size": 32768,
"context_window_size": 32768,
"sliding_window_size": 2048,
"prefill_chunk_size": 128,
"attention_sink_size": 4,
"tensor_parallel_shards": 1,
"pipeline_parallel_stages": 1,
"temperature": 1.0,
"presence_penalty": 0.0,
"frequency_penalty": 0.0,
"repetition_penalty": 1.0,
"top_p": 1.0,
"tokenizer_files": [
"tokenizer.model",
"tokenizer.json",
"tokenizer_config.json"
],
"tokenizer_info": {
"token_postproc_method": "byte_fallback",
"prepend_space_in_encode": false,
"strip_space_in_decode": true
},
"conv_template": {
"name": "mistral_default",
"system_template": "[INST] {system_message}",
"system_message": "The following is a conversation with an AI assistant. She is smart and very honest. She wants to help the human understand whatever it is they want to understand using her insights and wisdom.",
"system_prefix_token_ids": [
1
],
"add_role_after_system_message": false,
"roles": {
"user": "[INST]",
"assistant": "[/INST]",
"tool": "[INST]"
},
"role_templates": {
"user": "{user_message}",
"assistant": "{assistant_message}",
"tool": "{tool_message}"
},
"messages": [],
"seps": [
" "
],
"role_content_sep": " ",
"role_empty_sep": "",
"stop_str": [
"</s>"
],
"stop_token_ids": [
2
],
"function_string": "",
"use_function_calling": false
},
"pad_token_id": 0,
"bos_token_id": 1,
"eos_token_id": 2
}