From 3903c10c5b6b06ac5663f796cb3ef06eb0acbcc7 Mon Sep 17 00:00:00 2001 From: hiro Date: Sun, 10 Dec 2023 20:16:05 +0700 Subject: [PATCH 1/3] fix: inference nitro accepts model parameters --- extensions/inference-nitro-extension/src/helpers/sse.ts | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/extensions/inference-nitro-extension/src/helpers/sse.ts b/extensions/inference-nitro-extension/src/helpers/sse.ts index d9d8712dd..978d9e3c5 100644 --- a/extensions/inference-nitro-extension/src/helpers/sse.ts +++ b/extensions/inference-nitro-extension/src/helpers/sse.ts @@ -16,7 +16,7 @@ export function requestInference( messages: recentMessages, model: model.id, stream: true, - // ...model.parameters, + ...model.parameters, }); fetch(INFERENCE_URL, { method: "POST", From 0522d2fe4d17e631e73d2f228d93e74998026080 Mon Sep 17 00:00:00 2001 From: hiro Date: Sun, 10 Dec 2023 20:16:19 +0700 Subject: [PATCH 2/3] fix: inference openai compatible accepts parameters --- extensions/inference-openai-extension/src/helpers/sse.ts | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/extensions/inference-openai-extension/src/helpers/sse.ts b/extensions/inference-openai-extension/src/helpers/sse.ts index c8ddefca6..dbbfc2cb2 100644 --- a/extensions/inference-openai-extension/src/helpers/sse.ts +++ b/extensions/inference-openai-extension/src/helpers/sse.ts @@ -22,8 +22,8 @@ export function requestInference( const requestBody = JSON.stringify({ messages: recentMessages, stream: true, - model: model_id - // ...model.parameters, + model: model_id, + ...model.parameters, }); fetch(`${engine.full_url}`, { method: "POST", From 97f3733a52847eb3f3f3a103d8f40f1889f1586a Mon Sep 17 00:00:00 2001 From: hiro Date: Sun, 10 Dec 2023 20:16:37 +0700 Subject: [PATCH 3/3] chore: remove default parameters for openai gpt models --- models/gpt-3.5-turbo-16k-0613/model.json | 4 +--- models/gpt-4/model.json | 8 +++----- 2 files changed, 4 insertions(+), 8 deletions(-) diff --git a/models/gpt-3.5-turbo-16k-0613/model.json b/models/gpt-3.5-turbo-16k-0613/model.json index c7e2f0d1e..93dfc79ba 100644 --- a/models/gpt-3.5-turbo-16k-0613/model.json +++ b/models/gpt-3.5-turbo-16k-0613/model.json @@ -7,9 +7,7 @@ "description": "OpenAI GPT 3.5 Turbo 16k 0613 model is extremely good", "format": "api", "settings": {}, - "parameters": { - "max_tokens": 4096 - }, + "parameters": {}, "metadata": { "author": "OpenAI", "tags": ["General", "Big Context Length"] diff --git a/models/gpt-4/model.json b/models/gpt-4/model.json index 8883fd8ef..4f1bb4021 100644 --- a/models/gpt-4/model.json +++ b/models/gpt-4/model.json @@ -2,14 +2,12 @@ "source_url": "https://openai.com", "id": "gpt-4", "object": "model", - "name": "OpenAI GPT 3.5", + "name": "OpenAI GPT 4", "version": 1.0, - "description": "OpenAI GPT 3.5 model is extremely good", + "description": "OpenAI GPT 4 model is extremely good", "format": "api", "settings": {}, - "parameters": { - "max_tokens": 4096 - }, + "parameters": {}, "metadata": { "author": "OpenAI", "tags": ["General", "Big Context Length"]