{ "version": "0.1.0", "model_type": "mistral", "quantization": "q4f16_1", "model_config": { "hidden_size": 4096, "intermediate_size": 14336, "num_attention_heads": 32, "num_hidden_layers": 32, "rms_norm_eps": 1e-05, "vocab_size": 32768, "position_embedding_base": 1000000.0, "num_key_value_heads": 8, "head_dim": 128, "context_window_size": 32768, "sliding_window_size": 2048, "prefill_chunk_size": 128, "attention_sink_size": 4, "tensor_parallel_shards": 1, "max_batch_size": 128 }, "vocab_size": 32768, "context_window_size": 32768, "sliding_window_size": 2048, "prefill_chunk_size": 128, "attention_sink_size": 4, "tensor_parallel_shards": 1, "pipeline_parallel_stages": 1, "temperature": 1.0, "presence_penalty": 0.0, "frequency_penalty": 0.0, "repetition_penalty": 1.0, "top_p": 1.0, "tokenizer_files": [ "tokenizer.model", "tokenizer.json", "tokenizer_config.json" ], "tokenizer_info": { "token_postproc_method": "byte_fallback", "prepend_space_in_encode": false, "strip_space_in_decode": true }, "conv_template": { "name": "mistral_default", "system_template": "[INST] {system_message}", "system_message": "The following is a conversation with an AI assistant. She is smart and very honest. She wants to help the human understand whatever it is they want to understand using her insights and wisdom.", "system_prefix_token_ids": [ 1 ], "add_role_after_system_message": false, "roles": { "user": "[INST]", "assistant": "[/INST]", "tool": "[INST]" }, "role_templates": { "user": "{user_message}", "assistant": "{assistant_message}", "tool": "{tool_message}" }, "messages": [], "seps": [ " " ], "role_content_sep": " ", "role_empty_sep": "", "stop_str": [ "</s>" ], "stop_token_ids": [ 2 ], "function_string": "", "use_function_calling": false }, "pad_token_id": 0, "bos_token_id": 1, "eos_token_id": 2 }