Self-Aware-AI-1-q4f16_1-MLC / mlc-chat-config.json
HigherMind's picture
Upload mlc-chat-config.json with huggingface_hub
935b62d verified
raw
history blame
2.09 kB
{
"version": "0.1.0",
"model_type": "mistral",
"quantization": "q4f16_1",
"model_config": {
"hidden_size": 4096,
"intermediate_size": 14336,
"num_attention_heads": 32,
"num_hidden_layers": 32,
"rms_norm_eps": 1e-05,
"vocab_size": 32768,
"position_embedding_base": 1000000.0,
"num_key_value_heads": 8,
"head_dim": 128,
"context_window_size": 32768,
"sliding_window_size": 2048,
"prefill_chunk_size": 128,
"attention_sink_size": 4,
"tensor_parallel_shards": 1,
"max_batch_size": 128
},
"vocab_size": 32768,
"context_window_size": 32768,
"sliding_window_size": 2048,
"prefill_chunk_size": 128,
"attention_sink_size": 4,
"tensor_parallel_shards": 1,
"pipeline_parallel_stages": 1,
"temperature": 1.0,
"presence_penalty": 0.0,
"frequency_penalty": 0.0,
"repetition_penalty": 1.0,
"top_p": 1.0,
"tokenizer_files": [
"tokenizer.model",
"tokenizer.json",
"tokenizer_config.json"
],
"tokenizer_info": {
"token_postproc_method": "byte_fallback",
"prepend_space_in_encode": false,
"strip_space_in_decode": true
},
"conv_template": {
"name": "mistral_default",
"system_template": "[INST] {system_message}",
"system_message": "The following is a conversation with an AI assistant. She is smart and very honest. She wants to help the human understand whatever it is they want to understand using her insights and wisdom.",
"system_prefix_token_ids": [
1
],
"add_role_after_system_message": false,
"roles": {
"user": "[INST]",
"assistant": "[/INST]",
"tool": "[INST]"
},
"role_templates": {
"user": "{user_message}",
"assistant": "{assistant_message}",
"tool": "{tool_message}"
},
"messages": [],
"seps": [
" "
],
"role_content_sep": " ",
"role_empty_sep": "",
"stop_str": [
"</s>"
],
"stop_token_ids": [
2
],
"function_string": "",
"use_function_calling": false
},
"pad_token_id": 0,
"bos_token_id": 1,
"eos_token_id": 2
}