diff --git a/models/yi-34b/model.json b/models/yi-34b/model.json index 3697a9e22..4bc9b0ba1 100644 --- a/models/yi-34b/model.json +++ b/models/yi-34b/model.json @@ -1,20 +1,20 @@ { "sources": [ { - "filename": "yi-34b-chat.Q5_K_M.gguf", - "url": "https://huggingface.co/TheBloke/Yi-34B-Chat-GGUF/resolve/main/yi-34b-chat.Q5_K_M.gguf" + "filename": "yi-34b-chat.Q4_K_M.gguf", + "url": "https://huggingface.co/TheBloke/Yi-34B-Chat-GGUF/resolve/main/yi-34b-chat.Q4_K_M.gguf" } ], "id": "yi-34b", "object": "model", - "name": "Yi 34B Q5", + "name": "Yi 34B Q4", "version": "1.0", "description": "Yi-34B, a specialized chat model, is known for its diverse and creative responses and excels across various NLP tasks and benchmarks.", "format": "gguf", "settings": { "ctx_len": 4096, "prompt_template": "<|im_start|>system\n{system_message}<|im_end|>\n<|im_start|>user\n{prompt}<|im_end|>\n<|im_start|>assistant", - "llama_model_path": "yi-34b-chat.Q5_K_M.gguf" + "llama_model_path": "yi-34b-chat.Q4_K_M.gguf" }, "parameters": { "temperature": 0.7,