fix: #3703 - Deepseek-Coder-33B-Instruct is incompatible (#3732)

This commit is contained in:
Louis 2024-09-26 12:43:23 +07:00 committed by GitHub
parent f46ab45e0e
commit 7f08f0fa79
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194
3 changed files with 9 additions and 9 deletions

View File

@@ -1,7 +1,7 @@
{ {
"name": "@janhq/inference-cortex-extension", "name": "@janhq/inference-cortex-extension",
"productName": "Cortex Inference Engine", "productName": "Cortex Inference Engine",
"version": "1.0.17", "version": "1.0.18",
"description": "This extension embeds cortex.cpp, a lightweight inference engine written in C++. See https://jan.ai.\nAdditional dependencies could be installed to run without Cuda Toolkit installation.", "description": "This extension embeds cortex.cpp, a lightweight inference engine written in C++. See https://jan.ai.\nAdditional dependencies could be installed to run without Cuda Toolkit installation.",
"main": "dist/index.js", "main": "dist/index.js",
"node": "dist/node/index.cjs.js", "node": "dist/node/index.cjs.js",

View File

@@ -8,7 +8,7 @@
"id": "deepseek-coder-1.3b", "id": "deepseek-coder-1.3b",
"object": "model", "object": "model",
"name": "Deepseek Coder 1.3B Instruct Q8", "name": "Deepseek Coder 1.3B Instruct Q8",
"version": "1.3", "version": "1.4",
"description": "Deepseek Coder excelled in project-level code completion with advanced capabilities across multiple programming languages.", "description": "Deepseek Coder excelled in project-level code completion with advanced capabilities across multiple programming languages.",
"format": "gguf", "format": "gguf",
"settings": { "settings": {
@@ -22,13 +22,13 @@
"top_p": 0.95, "top_p": 0.95,
"stream": true, "stream": true,
"max_tokens": 16384, "max_tokens": 16384,
"stop": [], "stop": ["<|EOT|>"],
"frequency_penalty": 0, "frequency_penalty": 0,
"presence_penalty": 0 "presence_penalty": 0
}, },
"metadata": { "metadata": {
"author": "Deepseek, The Bloke", "author": "Deepseek, The Bloke",
"tags": ["Tiny", "Foundational Model"], "tags": ["Tiny"],
"size": 1430000000 "size": 1430000000
}, },
"engine": "nitro" "engine": "nitro"

View File

@@ -2,13 +2,13 @@
"sources": [ "sources": [
{ {
"filename": "deepseek-coder-33b-instruct.Q4_K_M.gguf", "filename": "deepseek-coder-33b-instruct.Q4_K_M.gguf",
"url": "https://huggingface.co/TheBloke/deepseek-coder-33B-instruct-GGUF/resolve/main/deepseek-coder-33b-instruct.Q4_K_M.gguf" "url": "https://huggingface.co/mradermacher/deepseek-coder-33b-instruct-GGUF/resolve/main/deepseek-coder-33b-instruct.Q4_K_M.gguf"
} }
], ],
"id": "deepseek-coder-34b", "id": "deepseek-coder-34b",
"object": "model", "object": "model",
"name": "Deepseek Coder 33B Instruct Q4", "name": "Deepseek Coder 33B Instruct Q4",
"version": "1.3", "version": "1.4",
"description": "Deepseek Coder excelled in project-level code completion with advanced capabilities across multiple programming languages.", "description": "Deepseek Coder excelled in project-level code completion with advanced capabilities across multiple programming languages.",
"format": "gguf", "format": "gguf",
"settings": { "settings": {
@@ -22,13 +22,13 @@
"top_p": 0.95, "top_p": 0.95,
"stream": true, "stream": true,
"max_tokens": 16384, "max_tokens": 16384,
"stop": [], "stop": ["<|EOT|>"],
"frequency_penalty": 0, "frequency_penalty": 0,
"presence_penalty": 0 "presence_penalty": 0
}, },
"metadata": { "metadata": {
"author": "Deepseek, The Bloke", "author": "Deepseek",
"tags": ["34B", "Foundational Model"], "tags": ["33B"],
"size": 19940000000 "size": 19940000000
}, },
"engine": "nitro" "engine": "nitro"