fix: correct OpenAI o1 model parameters

This commit is contained in:
Louis 2024-11-19 22:10:12 +07:00
parent c501641c91
commit 11637c5244
No known key found for this signature in database
GPG Key ID: 44FA9F4D33C37DE2
4 changed files with 12 additions and 14 deletions

View File

@ -45,7 +45,9 @@ export function requestInference(
subscriber.complete()
return
}
if (model.parameters?.stream === false) {
// The stream parameter may be overridden in the request body
// (the transformed payload), so check it as well as the model's own setting.
if (requestBody?.stream === false || model.parameters?.stream === false) {
const data = await response.json()
if (transformResponse) {
subscriber.next(transformResponse(data))

View File

@ -97,11 +97,9 @@
"format": "api",
"settings": {},
"parameters": {
"max_tokens": 4096,
"temperature": 0.7,
"top_p": 0.95,
"stream": true,
"stop": [],
"temperature": 1,
"top_p": 1,
"max_tokens": 32768,
"frequency_penalty": 0,
"presence_penalty": 0
},
@ -125,11 +123,9 @@
"format": "api",
"settings": {},
"parameters": {
"max_tokens": 4096,
"temperature": 0.7,
"top_p": 0.95,
"stream": true,
"stop": [],
"temperature": 1,
"top_p": 1,
"max_tokens": 65536,
"frequency_penalty": 0,
"presence_penalty": 0
},

View File

@ -76,11 +76,11 @@ export default class JanInferenceOpenAIExtension extends RemoteOAIEngine {
transformPayload = (payload: OpenAIPayloadType): OpenAIPayloadType => {
// Transform the payload for preview models
if (this.previewModels.includes(payload.model)) {
const { max_tokens, temperature, top_p, stop, ...params } = payload
const { max_tokens, stop, ...params } = payload
return {
...params,
max_completion_tokens: max_tokens,
stream: false // o1 only support stream = false
stream: false, // o1 only support stream = false
}
}
// Pass through for non-preview models

View File

@ -1,7 +1,7 @@
{
"name": "@janhq/model-extension",
"productName": "Model Management",
"version": "1.0.34",
"version": "1.0.35",
"description": "Model Management Extension provides model exploration and seamless downloads",
"main": "dist/index.js",
"author": "Jan <service@jan.ai>",