Chore: Add stop token for Gemma 2b (#3125)

* add stop token

* Bump version
This commit is contained in:
Hoang Ha 2024-07-01 18:36:08 +07:00 committed by Louis
parent 2f917dfcf3
commit 9fb95642df
No known key found for this signature in database
GPG Key ID: 44FA9F4D33C37DE2
2 changed files with 3 additions and 3 deletions

View File

@@ -1,7 +1,7 @@
{ {
"name": "@janhq/inference-cortex-extension", "name": "@janhq/inference-cortex-extension",
"productName": "Cortex Inference Engine", "productName": "Cortex Inference Engine",
"version": "1.0.13", "version": "1.0.14",
"description": "This extension embeds cortex.cpp, a lightweight inference engine written in C++. See https://nitro.jan.ai.\nAdditional dependencies could be installed to run without Cuda Toolkit installation.", "description": "This extension embeds cortex.cpp, a lightweight inference engine written in C++. See https://nitro.jan.ai.\nAdditional dependencies could be installed to run without Cuda Toolkit installation.",
"main": "dist/index.js", "main": "dist/index.js",
"node": "dist/node/index.cjs.js", "node": "dist/node/index.cjs.js",

View File

@@ -8,7 +8,7 @@
"id": "gemma-2b", "id": "gemma-2b",
"object": "model", "object": "model",
"name": "Gemma 2B Q4", "name": "Gemma 2B Q4",
"version": "1.2", "version": "1.3",
"description": "Gemma is built from the same technology with Google's Gemini.", "description": "Gemma is built from the same technology with Google's Gemini.",
"format": "gguf", "format": "gguf",
"settings": { "settings": {
@@ -22,7 +22,7 @@
"top_p": 0.95, "top_p": 0.95,
"stream": true, "stream": true,
"max_tokens": 8192, "max_tokens": 8192,
"stop": [], "stop": ["<end_of_turn>"],
"frequency_penalty": 0, "frequency_penalty": 0,
"presence_penalty": 0 "presence_penalty": 0
}, },