Merge pull request #3847 from janhq/fix/correct-stop-token-llava-models

fix: correct eos token of llava models
This commit is contained in:
Louis 2024-10-21 15:33:25 +07:00 committed by GitHub
commit e2d9533e79
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194
3 changed files with 7 additions and 5 deletions

View File

@@ -1,7 +1,7 @@
{
"name": "@janhq/inference-cortex-extension",
"productName": "Cortex Inference Engine",
"version": "1.0.19",
"version": "1.0.20",
"description": "This extension embeds cortex.cpp, a lightweight inference engine written in C++. See https://jan.ai.\nAdditional dependencies could be installed to run without Cuda Toolkit installation.",
"main": "dist/index.js",
"node": "dist/node/index.cjs.js",

View File

@@ -12,7 +12,7 @@
"id": "llava-13b",
"object": "model",
"name": "LlaVa 13B Q4",
"version": "1.1",
"version": "1.2",
"description": "LlaVa can bring vision understanding to Jan",
"format": "gguf",
"settings": {
@@ -24,7 +24,8 @@
"mmproj": "mmproj-model-f16.gguf"
},
"parameters": {
"max_tokens": 4096
"max_tokens": 4096,
"stop": ["</s>"]
},
"metadata": {
"author": "liuhaotian",

View File

@@ -12,7 +12,7 @@
"id": "llava-7b",
"object": "model",
"name": "LlaVa 7B",
"version": "1.1",
"version": "1.2",
"description": "LlaVa can bring vision understanding to Jan",
"format": "gguf",
"settings": {
@@ -24,7 +24,8 @@
"mmproj": "mmproj-model-f16.gguf"
},
"parameters": {
"max_tokens": 4096
"max_tokens": 4096,
"stop": ["</s>"]
},
"metadata": {
"author": "liuhaotian",