* fix: correct phi3 * redundant phi2 dolphin * add: hermes llama3 * add: ngl settings * correct ctx len * correct ngl * correct maxlen + ngl * disable phi3 * add ngl * add ngl * add ngl * add ngl * add ngl * add ngl * add ngl * remove redundant hermes pro * add ngl * add ngl * add ngl * remove miqu * add ngl * add ngl * add ngl * add ngl * remove redundant * add ngl * add ngl * add ngl * add ngl * add ngl * add ngl * add ngl * add ngl * add ngl * version package bump * feat: resolve issue of cannot found model in the extensions due to the removal * feat: completely remove hermes-pro-7b * feat: completely remove openhermes-neural-7b and miqu-70b, and add llama3-hermes-8b via renaming from Rex * fix: correct description --------- Co-authored-by: Van-QA <van@jan.ai>
36 lines
1001 B
JSON
36 lines
1001 B
JSON
{
  "sources": [
    {
      "filename": "yi-34b-chat.Q4_K_M.gguf",
      "url": "https://huggingface.co/TheBloke/Yi-34B-Chat-GGUF/resolve/main/yi-34b-chat.Q4_K_M.gguf"
    }
  ],
  "id": "yi-34b",
  "object": "model",
  "name": "Yi 34B Q4",
  "version": "1.0",
  "description": "Yi-34B, a specialized chat model, is known for its diverse and creative responses and excels across various NLP tasks and benchmarks.",
  "format": "gguf",
  "settings": {
    "ctx_len": 4096,
    "prompt_template": "<|im_start|>system\n{system_message}<|im_end|>\n<|im_start|>user\n{prompt}<|im_end|>\n<|im_start|>assistant",
    "llama_model_path": "yi-34b-chat.Q4_K_M.gguf",
    "ngl": 60
  },
  "parameters": {
    "temperature": 0.7,
    "top_p": 0.95,
    "stream": true,
    "max_tokens": 4096,
    "stop": [],
    "frequency_penalty": 0,
    "presence_penalty": 0
  },
  "metadata": {
    "author": "01-ai, The Bloke",
    "tags": ["34B", "Foundational Model"],
    "size": 20660000000
  },
  "engine": "nitro"
}