Philosopy-1-q4f16_1-MLC / mlc-chat-config.json
HigherMind's picture
Upload mlc-chat-config.json with huggingface_hub
a75675a verified
raw
history blame
2.09 kB
{
"version": "0.1.0",
"model_type": "mistral",
"quantization": "q4f16_1",
"model_config": {
"hidden_size": 4096,
"intermediate_size": 14336,
"num_attention_heads": 32,
"num_hidden_layers": 32,
"rms_norm_eps": 1e-05,
"vocab_size": 32768,
"position_embedding_base": 1000000.0,
"num_key_value_heads": 8,
"head_dim": 128,
"context_window_size": 32768,
"sliding_window_size": 2048,
"prefill_chunk_size": 128,
"attention_sink_size": 4,
"tensor_parallel_shards": 1,
"max_batch_size": 128
},
"vocab_size": 32768,
"context_window_size": 32768,
"sliding_window_size": 2048,
"prefill_chunk_size": 128,
"attention_sink_size": 4,
"tensor_parallel_shards": 1,
"pipeline_parallel_stages": 1,
"temperature": 1.0,
"presence_penalty": 0.0,
"frequency_penalty": 0.0,
"repetition_penalty": 1.0,
"top_p": 1.0,
"tokenizer_files": [
"tokenizer.model",
"tokenizer.json",
"tokenizer_config.json"
],
"tokenizer_info": {
"token_postproc_method": "byte_fallback",
"prepend_space_in_encode": false,
"strip_space_in_decode": true
},
"conv_template": {
"name": "mistral_default",
"system_template": "[INST] {system_message}",
"system_message": "The following is a conversation with an AI assistant. She is smart and very honest. She wants to help the human understand whatever it is they want to understand using her insights and wisdom.",
"system_prefix_token_ids": [
1
],
"add_role_after_system_message": false,
"roles": {
"user": "[INST]",
"assistant": "[/INST]",
"tool": "[INST]"
},
"role_templates": {
"user": "{user_message}",
"assistant": "{assistant_message}",
"tool": "{tool_message}"
},
"messages": [],
"seps": [
" "
],
"role_content_sep": " ",
"role_empty_sep": "",
"stop_str": [
"</s>"
],
"stop_token_ids": [
2
],
"function_string": "",
"use_function_calling": false
},
"pad_token_id": 0,
"bos_token_id": 1,
"eos_token_id": 2
}