diff --git a/.github/workflows/publish-npm-core.yml b/.github/workflows/publish-npm-core.yml index 49eac8dd2..462dbdc8e 100644 --- a/.github/workflows/publish-npm-core.yml +++ b/.github/workflows/publish-npm-core.yml @@ -2,9 +2,9 @@ name: Publish core Package to npmjs on: push: tags: ["v[0-9]+.[0-9]+.[0-9]+-core"] - paths: ["core/**"] + paths: ["core/**", ".github/workflows/publish-npm-core.yml"] pull_request: - paths: ["core/**"] + paths: ["core/**", ".github/workflows/publish-npm-core.yml"] jobs: build-and-publish-plugins: environment: production @@ -45,7 +45,7 @@ jobs: node-version: "20.x" registry-url: "https://registry.npmjs.org" - - run: cd core && corepack enable && corepack prepare yarn@4.5.3 --activate && yarn --version && yarn install && yarn build + - run: cd core && corepack enable && corepack prepare yarn@4.5.3 --activate && yarn --version && yarn config set -H enableImmutableInstalls false && yarn install && yarn build - run: cd core && yarn publish --access public if: github.event_name == 'push' diff --git a/.github/workflows/publish-npm-joi.yml b/.github/workflows/publish-npm-joi.yml index 8c6ee6f68..867ad80fe 100644 --- a/.github/workflows/publish-npm-joi.yml +++ b/.github/workflows/publish-npm-joi.yml @@ -2,9 +2,9 @@ name: Publish joi Package to npmjs on: push: tags: ["v[0-9]+.[0-9]+.[0-9]+-joi"] - paths: ["joi/**"] + paths: ["joi/**", ".github/workflows/publish-npm-joi.yml"] pull_request: - paths: ["joi/**"] + paths: ["joi/**", ".github/workflows/publish-npm-joi.yml"] jobs: build-and-publish-plugins: environment: production @@ -45,7 +45,7 @@ jobs: node-version: "20.x" registry-url: "https://registry.npmjs.org" - - run: cd joi && corepack enable && corepack prepare yarn@4.5.3 --activate && yarn --version && yarn install && yarn build + - run: cd joi && corepack enable && corepack prepare yarn@4.5.3 --activate && yarn --version && yarn config set -H enableImmutableInstalls false && yarn install && yarn build - run: cd joi && yarn publish --access public if: github.event_name == 'push' diff --git a/core/src/browser/extensions/engines/helpers/sse.ts b/core/src/browser/extensions/engines/helpers/sse.ts index 153d741da..aaafbf7e5 100644 --- a/core/src/browser/extensions/engines/helpers/sse.ts +++ b/core/src/browser/extensions/engines/helpers/sse.ts @@ -22,7 +22,9 @@ export function requestInference( headers: { 'Content-Type': 'application/json', 'Access-Control-Allow-Origin': '*', - 'Accept': model.parameters?.stream ? 'text/event-stream' : 'application/json', + 'Accept': model.parameters?.stream + ? 'text/event-stream' + : 'application/json', ...headers, }, body: JSON.stringify(requestBody), @@ -47,12 +49,24 @@ export function requestInference( } // There could be an overridden stream parameter in the model // that is set in request body (transformed payload) - if (requestBody?.stream === false || model.parameters?.stream === false) { + if ( + requestBody?.stream === false || + model.parameters?.stream === false + ) { const data = await response.json() + if (data.error || data.message) { + subscriber.error(data.error ?? data) + subscriber.complete() + return + } if (transformResponse) { subscriber.next(transformResponse(data)) } else { - subscriber.next(data.choices[0]?.message?.content ?? '') + subscriber.next( + data.choices + ? data.choices[0]?.message?.content + : (data.content[0]?.text ?? 
'') + ) } } else { const stream = response.body diff --git a/core/src/browser/extensions/enginesManagement.ts b/core/src/browser/extensions/enginesManagement.ts index 524546b05..66dff87df 100644 --- a/core/src/browser/extensions/enginesManagement.ts +++ b/core/src/browser/extensions/enginesManagement.ts @@ -3,6 +3,7 @@ import { Engines, EngineVariant, EngineReleased, + EngineConfig, DefaultEngineVariant, } from '../../types' import { BaseExtension, ExtensionTypeEnum } from '../extension' @@ -55,8 +56,16 @@ export abstract class EngineManagementExtension extends BaseExtension { * @returns A Promise that resolves when the engine is installed. */ abstract installEngine( - name: InferenceEngine, - engineConfig: { variant: string; version?: string } + name: string, + engineConfig: EngineConfig + ): Promise<{ messages: string }> + + /** + * Add a new remote engine + * @returns A Promise that resolves once the remote engine is added. + */ + abstract addRemoteEngine( + engineConfig: EngineConfig ): Promise<{ messages: string }> /** @@ -65,14 +74,16 @@ */ abstract uninstallEngine( name: InferenceEngine, - engineConfig: { variant: string; version: string } + engineConfig: EngineConfig ): Promise<{ messages: string }> /** * @param name - Inference engine name. * @returns A Promise that resolves to the default engine variant. */ - abstract getDefaultEngineVariant(name: InferenceEngine): Promise<DefaultEngineVariant> + abstract getDefaultEngineVariant( + name: InferenceEngine + ): Promise<DefaultEngineVariant> /** * @body variant - string @@ -81,11 +92,19 @@ */ abstract setDefaultEngineVariant( name: InferenceEngine, - engineConfig: { variant: string; version: string } + engineConfig: EngineConfig ): Promise<{ messages: string }> /** * @returns A Promise that resolves when the engine is updated. */ - abstract updateEngine(name: InferenceEngine): Promise<{ messages: string }> + abstract updateEngine( + name: InferenceEngine, + engineConfig?: EngineConfig + ): Promise<{ messages: string }> + + /** + * @returns A Promise that resolves to the list of remote models. 
+ */ + abstract getRemoteModels(name: InferenceEngine | string): Promise<any> } diff --git a/core/src/node/helper/config.test.ts b/core/src/node/helper/config.test.ts index d46750d5f..617a8f7ef 100644 --- a/core/src/node/helper/config.test.ts +++ b/core/src/node/helper/config.test.ts @@ -1,28 +1,19 @@ -import { getEngineConfiguration } from './config'; -import { getAppConfigurations, defaultAppConfig } from './config'; - -import { getJanExtensionsPath } from './config'; -import { getJanDataFolderPath } from './config'; -it('should return undefined for invalid engine ID', async () => { - const config = await getEngineConfiguration('invalid_engine'); - expect(config).toBeUndefined(); -}); +import { getAppConfigurations, defaultAppConfig } from './config' +import { getJanExtensionsPath, getJanDataFolderPath } from './config' it('should return default config when CI is e2e', () => { - process.env.CI = 'e2e'; - const config = getAppConfigurations(); - expect(config).toEqual(defaultAppConfig()); -}); - + process.env.CI = 'e2e' + const config = getAppConfigurations() + expect(config).toEqual(defaultAppConfig()) +}) it('should return extensions path when retrieved successfully', () => { - const extensionsPath = getJanExtensionsPath(); - expect(extensionsPath).not.toBeUndefined(); -}); - + const extensionsPath = getJanExtensionsPath() + expect(extensionsPath).not.toBeUndefined() +}) it('should return data folder path when retrieved successfully', () => { - const dataFolderPath = getJanDataFolderPath(); - expect(dataFolderPath).not.toBeUndefined(); -}); + const dataFolderPath = getJanDataFolderPath() + expect(dataFolderPath).not.toBeUndefined() +}) diff --git a/core/src/node/helper/config.ts b/core/src/node/helper/config.ts index 8bf48d629..6fb28d01f 100644 --- a/core/src/node/helper/config.ts +++ b/core/src/node/helper/config.ts @@ -1,8 +1,7 @@ -import { AppConfiguration, SettingComponentProps } from '../../types' +import { AppConfiguration } from '../../types' import { join, resolve } from 'path' import fs from 'fs' import os from 'os' -import childProcess from 'child_process' const configurationFileName = 'settings.json' /** @@ -19,7 +18,9 @@ export const getAppConfigurations = (): AppConfiguration => { if (!fs.existsSync(configurationFile)) { // create default app config if we don't have one - console.debug(`App config not found, creating default config at ${configurationFile}`) + console.debug( + `App config not found, creating default config at ${configurationFile}` + ) fs.writeFileSync(configurationFile, JSON.stringify(appDefaultConfiguration)) return appDefaultConfiguration } @@ -30,20 +31,28 @@ export const getAppConfigurations = (): AppConfiguration => { ) return appConfigurations } catch (err) { - console.error(`Failed to read app config, return default config instead! Err: ${err}`) + console.error( + `Failed to read app config, return default config instead! Err: ${err}` + ) return defaultAppConfig() } } const getConfigurationFilePath = () => join( - global.core?.appPath() || process.env[process.platform == 'win32' ? 'USERPROFILE' : 'HOME'], + global.core?.appPath() || + process.env[process.platform == 'win32' ? 
'USERPROFILE' : 'HOME'], configurationFileName ) -export const updateAppConfiguration = (configuration: AppConfiguration): Promise<void> => { +export const updateAppConfiguration = ( + configuration: AppConfiguration +): Promise<void> => { const configurationFile = getConfigurationFilePath() - console.debug('updateAppConfiguration, configurationFile: ', configurationFile) + console.debug( + 'updateAppConfiguration, configurationFile: ', + configurationFile + ) fs.writeFileSync(configurationFile, JSON.stringify(configuration)) return Promise.resolve() @@ -69,86 +78,6 @@ export const getJanExtensionsPath = (): string => { return join(appConfigurations.data_folder, 'extensions') } -/** - * Utility function to physical cpu count - * - * @returns {number} The physical cpu count. - */ -export const physicalCpuCount = async (): Promise<number> => { - const platform = os.platform() - try { - if (platform === 'linux') { - const output = await exec('lscpu -p | egrep -v "^#" | sort -u -t, -k 2,4 | wc -l') - return parseInt(output.trim(), 10) - } else if (platform === 'darwin') { - const output = await exec('sysctl -n hw.physicalcpu_max') - return parseInt(output.trim(), 10) - } else if (platform === 'win32') { - const output = await exec('WMIC CPU Get NumberOfCores') - return output - .split(os.EOL) - .map((line: string) => parseInt(line)) - .filter((value: number) => !isNaN(value)) - .reduce((sum: number, number: number) => sum + number, 1) - } else { - const cores = os.cpus().filter((cpu: any, index: number) => { - const hasHyperthreading = cpu.model.includes('Intel') - const isOdd = index % 2 === 1 - return !hasHyperthreading || isOdd - }) - return cores.length - } - } catch (err) { - console.warn('Failed to get physical CPU count', err) - // Divide by 2 to get rid of hyper threading - const coreCount = Math.ceil(os.cpus().length / 2) - console.debug('Using node API to get physical CPU count:', coreCount) - return coreCount - } -} - -const exec = async (command: string): Promise<string> => { - return new Promise((resolve, reject) => { - childProcess.exec(command, { encoding: 'utf8' }, (error, stdout) => { - if (error) { - reject(error) - } else { - resolve(stdout) - } - }) - }) -} - -// a hacky way to get the api key. we should come up with a better -// way to handle this -export const getEngineConfiguration = async (engineId: string) => { - if (engineId !== 'openai' && engineId !== 'groq') return undefined - - const settingDirectoryPath = join( - getJanDataFolderPath(), - 'settings', - '@janhq', - engineId === 'openai' ? 'inference-openai-extension' : 'inference-groq-extension', - 'settings.json' - ) - - const content = fs.readFileSync(settingDirectoryPath, 'utf-8') - const settings: SettingComponentProps[] = JSON.parse(content) - const apiKeyId = engineId === 'openai' ? 'openai-api-key' : 'groq-api-key' - const keySetting = settings.find((setting) => setting.key === apiKeyId) - let fullUrl = settings.find((setting) => setting.key === 'chat-completions-endpoint') - ?.controllerProps.value - - let apiKey = keySetting?.controllerProps.value - if (typeof apiKey !== 'string') apiKey = '' - if (typeof fullUrl !== 'string') fullUrl = '' - - return { - api_key: apiKey, - full_url: fullUrl, - } -} - /** * Default app configurations * App Data Folder default to Electron's userData @@ -158,7 +87,10 @@ export const getEngineConfiguration = async (engineId: string) => { */ export const defaultAppConfig = (): AppConfiguration => { const { app } = require('electron') - const defaultJanDataFolder = join(app?.getPath('userData') ?? 
os?.homedir() ?? '', 'data') + const defaultJanDataFolder = join( + app?.getPath('userData') ?? os?.homedir() ?? '', + 'data' + ) return { data_folder: process.env.CI === 'e2e' diff --git a/core/src/node/helper/resource.test.ts b/core/src/node/helper/resource.test.ts index aaeab9d65..c82d481db 100644 --- a/core/src/node/helper/resource.test.ts +++ b/core/src/node/helper/resource.test.ts @@ -1,15 +1,9 @@ -import { getSystemResourceInfo } from './resource'; +import { getSystemResourceInfo } from './resource' it('should return the correct system resource information with a valid CPU count', async () => { - const mockCpuCount = 4; - jest.spyOn(require('./config'), 'physicalCpuCount').mockResolvedValue(mockCpuCount); - const logSpy = jest.spyOn(require('./logger'), 'log').mockImplementation(() => {}); - - const result = await getSystemResourceInfo(); + const result = await getSystemResourceInfo() expect(result).toEqual({ - numCpuPhysicalCore: mockCpuCount, memAvailable: 0, - }); - expect(logSpy).toHaveBeenCalledWith(`[CORTEX]::CPU information - ${mockCpuCount}`); -}); + }) +}) diff --git a/core/src/node/helper/resource.ts b/core/src/node/helper/resource.ts index c7bfbf20c..5d75e54eb 100644 --- a/core/src/node/helper/resource.ts +++ b/core/src/node/helper/resource.ts @@ -1,13 +1,7 @@ import { SystemResourceInfo } from '../../types' -import { physicalCpuCount } from './config' -import { log } from './logger' export const getSystemResourceInfo = async (): Promise<SystemResourceInfo> => { - const cpu = await physicalCpuCount() - log(`[CORTEX]::CPU information - ${cpu}`) - return { - numCpuPhysicalCore: cpu, memAvailable: 0, // TODO: this should not be 0 } } diff --git a/core/src/types/engine/index.ts b/core/src/types/engine/index.ts index 9e6f5c9c8..7c848a279 100644 --- a/core/src/types/engine/index.ts +++ b/core/src/types/engine/index.ts @@ -1,7 +1,23 @@ import { InferenceEngine } from '../../types' export type Engines = { - [key in InferenceEngine]: EngineVariant[] + [key in InferenceEngine]: (EngineVariant & EngineConfig)[] +} + +export type EngineMetadata = { + get_models_url?: string + header_template?: string + transform_req?: { + chat_completions?: { + url?: string + template?: string + } + } + transform_resp?: { + chat_completions?: { + template?: string + } + } } export type EngineVariant = { @@ -23,6 +39,16 @@ export type EngineReleased = { size: number } +export type EngineConfig = { + engine?: string + version?: string + variant?: string + type?: string + url?: string + api_key?: string + metadata?: EngineMetadata +} + export enum EngineEvent { OnEngineUpdate = 'OnEngineUpdate', } diff --git a/core/src/types/message/messageEntity.ts b/core/src/types/message/messageEntity.ts index 302b824ee..edd253a57 100644 --- a/core/src/types/message/messageEntity.ts +++ b/core/src/types/message/messageEntity.ts @@ -32,9 +32,8 @@ export type ThreadMessage = { completed_at: number /** The additional metadata of this message. **/ metadata?: Record<string, unknown> - + /** Type of the message */ type?: string - /** The error code which explains what error type. Used in conjunction with MessageStatus.Error */ error_code?: ErrorCode } @@ -72,6 +71,10 @@ export type MessageRequest = { // TODO: deprecate threadId field thread?: Thread + /** Engine name to process */ + engine?: string + + /** Message type */ type?: string } @@ -147,7 +150,9 @@ export interface Attachment { /** * The tools to add this file to. 
*/ - tools?: Array<CodeInterpreterTool | Attachment.AssistantToolsFileSearchTypeOnly> + tools?: Array< + CodeInterpreterTool | Attachment.AssistantToolsFileSearchTypeOnly + > } export namespace Attachment { @@ -166,5 +171,10 @@ export interface IncompleteDetails { /** * The reason the message is incomplete. */ - reason: 'content_filter' | 'max_tokens' | 'run_cancelled' | 'run_expired' | 'run_failed' + reason: + | 'content_filter' + | 'max_tokens' + | 'run_cancelled' + | 'run_expired' + | 'run_failed' } diff --git a/core/src/types/miscellaneous/systemResourceInfo.ts b/core/src/types/miscellaneous/systemResourceInfo.ts index 6ceea0822..82db5d941 100644 --- a/core/src/types/miscellaneous/systemResourceInfo.ts +++ b/core/src/types/miscellaneous/systemResourceInfo.ts @@ -1,5 +1,4 @@ export type SystemResourceInfo = { - numCpuPhysicalCore: number memAvailable: number } diff --git a/electron/package.json b/electron/package.json index 72163cb42..329f2b4c4 100644 --- a/electron/package.json +++ b/electron/package.json @@ -1,6 +1,6 @@ { "name": "jan", - "version": "0.1.3", + "version": "0.1.1736316956", "main": "./build/main.js", "author": "Jan ", "license": "MIT", diff --git a/extensions/engine-management-extension/engines.mjs b/extensions/engine-management-extension/engines.mjs new file mode 100644 index 000000000..e85035423 --- /dev/null +++ b/extensions/engine-management-extension/engines.mjs @@ -0,0 +1,39 @@ +import anthropic from './resources/anthropic.json' with { type: 'json' } +import cohere from './resources/cohere.json' with { type: 'json' } +import openai from './resources/openai.json' with { type: 'json' } +import openrouter from './resources/openrouter.json' with { type: 'json' } +import groq from './resources/groq.json' with { type: 'json' } +import martian from './resources/martian.json' with { type: 'json' } +import mistral from './resources/mistral.json' with { type: 'json' } +import nvidia from './resources/nvidia.json' with { type: 'json' } + +import anthropicModels from './models/anthropic.json' with { type: 'json' } +import cohereModels from './models/cohere.json' with { type: 'json' } +import openaiModels from './models/openai.json' with { type: 'json' } +import openrouterModels from './models/openrouter.json' with { type: 'json' } +import groqModels from './models/groq.json' with { type: 'json' } +import martianModels from './models/martian.json' with { type: 'json' } +import mistralModels from './models/mistral.json' with { type: 'json' } +import nvidiaModels from './models/nvidia.json' with { type: 'json' } + +const engines = [ + anthropic, + openai, + cohere, + openrouter, + groq, + mistral, + martian, + nvidia, +] +const models = [ + ...anthropicModels, + ...openaiModels, + ...cohereModels, + ...openrouterModels, + ...groqModels, + ...mistralModels, + ...martianModels, + ...nvidiaModels, +] +export { engines, models } diff --git a/extensions/inference-anthropic-extension/resources/models.json b/extensions/engine-management-extension/models/anthropic.json similarity index 54% rename from extensions/inference-anthropic-extension/resources/models.json rename to extensions/engine-management-extension/models/anthropic.json index 59e41245b..d35ba4c22 100644 --- a/extensions/inference-anthropic-extension/resources/models.json +++ b/extensions/engine-management-extension/models/anthropic.json @@ -1,74 +1,41 @@ [ { - "sources": [ - { - "url": "https://www.anthropic.com/" - } - ], - "id": "claude-3-opus-latest", + "model": "claude-3-opus-latest", "object": "model", "name": "Claude 3 Opus Latest", "version": "1.0", "description": "Claude 3 Opus is 
a powerful model suitable for highly complex tasks.", - "format": "api", - "settings": {}, - "parameters": { + "inference_params": { "max_tokens": 4096, "temperature": 0.7, "stream": false }, - "metadata": { - "author": "Anthropic", - "tags": ["General", "Big Context Length"] - }, "engine": "anthropic" }, { - "sources": [ - { - "url": "https://www.anthropic.com/" - } - ], - "id": "claude-3-5-haiku-latest", + "model": "claude-3-5-haiku-latest", "object": "model", "name": "Claude 3.5 Haiku Latest", "version": "1.0", "description": "Claude 3.5 Haiku is the fastest model, providing near-instant responsiveness.", - "format": "api", - "settings": {}, - "parameters": { + "inference_params": { "max_tokens": 8192, "temperature": 0.7, "stream": false }, - "metadata": { - "author": "Anthropic", - "tags": ["General", "Big Context Length"] - }, "engine": "anthropic" }, { - "sources": [ - { - "url": "https://www.anthropic.com/" - } - ], - "id": "claude-3-5-sonnet-latest", + "model": "claude-3-5-sonnet-latest", "object": "model", "name": "Claude 3.5 Sonnet Latest", "version": "1.0", "description": "Claude 3.5 Sonnet raises the industry bar for intelligence, outperforming competitor models and Claude 3 Opus on a wide range of evaluations, with the speed and cost of our mid-tier model, Claude 3 Sonnet.", - "format": "api", - "settings": {}, - "parameters": { + "inference_params": { "max_tokens": 8192, "temperature": 0.7, "stream": true }, - "metadata": { - "author": "Anthropic", - "tags": ["General", "Big Context Length"] - }, "engine": "anthropic" } ] diff --git a/extensions/inference-cohere-extension/resources/models.json b/extensions/engine-management-extension/models/cohere.json similarity index 58% rename from extensions/inference-cohere-extension/resources/models.json rename to extensions/engine-management-extension/models/cohere.json index 2b4cc3e8e..458e4278b 100644 --- a/extensions/inference-cohere-extension/resources/models.json +++ b/extensions/engine-management-extension/models/cohere.json @@ -1,56 +1,28 @@ [ { - "sources": [ - { - "url": "https://cohere.com" - } - ], - "id": "command-r-plus", + "model": "command-r-plus", "object": "model", "name": "Command R+", "version": "1.0", "description": "Command R+ is an instruction-following conversational model that performs language tasks at a higher quality, more reliably, and with a longer context than previous models. It is best suited for complex RAG workflows and multi-step tool use.", - "format": "api", - "settings": {}, - "parameters": { - "max_tokens": 128000, + "inference_params": { + "max_tokens": 4096, "temperature": 0.7, "stream": false }, - "metadata": { - "author": "Cohere", - "tags": [ - "General", - "Big Context Length" - ] - }, "engine": "cohere" }, { - "sources": [ - { - "url": "https://cohere.com" - } - ], - "id": "command-r", + "model": "command-r", "object": "model", "name": "Command R", "version": "1.0", "description": "Command R is an instruction-following conversational model that performs language tasks at a higher quality, more reliably, and with a longer context than previous models. 
It can be used for complex workflows like code generation, retrieval augmented generation (RAG), tool use, and agents.", - "format": "api", - "settings": {}, - "parameters": { - "max_tokens": 128000, + "inference_params": { + "max_tokens": 4096, "temperature": 0.7, "stream": false }, - "metadata": { - "author": "Cohere", - "tags": [ - "General", - "Big Context Length" - ] - }, "engine": "cohere" } ] diff --git a/extensions/inference-groq-extension/resources/models.json b/extensions/engine-management-extension/models/groq.json similarity index 53% rename from extensions/inference-groq-extension/resources/models.json rename to extensions/engine-management-extension/models/groq.json index b4b013dad..38a0f3835 100644 --- a/extensions/inference-groq-extension/resources/models.json +++ b/extensions/engine-management-extension/models/groq.json @@ -1,18 +1,11 @@ [ { - "sources": [ - { - "url": "https://groq.com" - } - ], - "id": "llama3-70b-8192", + "model": "llama3-70b-8192", "object": "model", "name": "Groq Llama 3 70b", "version": "1.1", "description": "Groq Llama 3 70b with supercharged speed!", - "format": "api", - "settings": {}, - "parameters": { + "inference_params": { "max_tokens": 8192, "temperature": 0.7, "top_p": 0.95, @@ -21,29 +14,15 @@ "frequency_penalty": 0, "presence_penalty": 0 }, - "metadata": { - "author": "Meta", - "tags": [ - "General", - "Big Context Length" - ] - }, "engine": "groq" }, { - "sources": [ - { - "url": "https://groq.com" - } - ], - "id": "llama3-8b-8192", + "model": "llama3-8b-8192", "object": "model", "name": "Groq Llama 3 8b", "version": "1.1", "description": "Groq Llama 3 8b with supercharged speed!", - "format": "api", - "settings": {}, - "parameters": { + "inference_params": { "max_tokens": 8192, "temperature": 0.7, "top_p": 0.95, @@ -52,29 +31,15 @@ "frequency_penalty": 0, "presence_penalty": 0 }, - "metadata": { - "author": "Meta", - "tags": [ - "General", - "Big Context Length" - ] - }, "engine": "groq" }, { - "sources": [ - { - "url": "https://groq.com" - } - ], - "id": "llama-3.1-8b-instant", + "model": "llama-3.1-8b-instant", "object": "model", "name": "Groq Llama 3.1 8b Instant", "version": "1.1", "description": "Groq Llama 3.1 8b with supercharged speed!", - "format": "api", - "settings": {}, - "parameters": { + "inference_params": { "max_tokens": 8000, "temperature": 0.7, "top_p": 0.95, @@ -83,29 +48,15 @@ "frequency_penalty": 0, "presence_penalty": 0 }, - "metadata": { - "author": "Meta", - "tags": [ - "General", - "Big Context Length" - ] - }, "engine": "groq" }, { - "sources": [ - { - "url": "https://groq.com" - } - ], - "id": "llama-3.2-11b-text-preview", + "model": "llama-3.2-11b-text-preview", "object": "model", "name": "Groq Llama 3.2 11b Text Preview", "version": "1.1", "description": "Groq Llama 3.2 11b Text Preview with supercharged speed!", - "format": "api", - "settings": {}, - "parameters": { + "inference_params": { "max_tokens": 8192, "temperature": 0.7, "top_p": 0.95, @@ -114,29 +65,15 @@ "frequency_penalty": 0, "presence_penalty": 0 }, - "metadata": { - "author": "Meta", - "tags": [ - "General", - "Big Context Length" - ] - }, "engine": "groq" }, { - "sources": [ - { - "url": "https://groq.com" - } - ], - "id": "llama-3.2-11b-vision-preview", + "model": "llama-3.2-11b-vision-preview", "object": "model", "name": "Groq Llama 3.2 11b Vision Preview", "version": "1.1", "description": "Groq Llama 3.2 11b Vision Preview with supercharged speed!", - "format": "api", - "settings": {}, - "parameters": { + "inference_params": { "max_tokens": 
8192, "temperature": 0.7, "top_p": 0.95, @@ -145,28 +82,14 @@ "frequency_penalty": 0, "presence_penalty": 0 }, - "metadata": { - "author": "Meta", - "tags": [ - "General", - "Big Context Length" - ] - }, "engine": "groq" }, { - "sources": [ - { - "url": "https://groq.com" - } - ], - "id": "llama-3.2-1b-preview", + "model": "llama-3.2-1b-preview", "object": "model", "name": "Groq Llama 3.2 1b Preview", "version": "1.1", "description": "Groq Llama 3.2 1b Preview with supercharged speed!", - "format": "api", - "settings": {}, "parameters": { "max_tokens": 8192, "temperature": 0.7, @@ -176,28 +99,14 @@ "frequency_penalty": 0, "presence_penalty": 0 }, - "metadata": { - "author": "Meta", - "tags": [ - "General", - "Big Context Length" - ] - }, "engine": "groq" }, { - "sources": [ - { - "url": "https://groq.com" - } - ], - "id": "llama-3.2-3b-preview", + "model": "llama-3.2-3b-preview", "object": "model", "name": "Groq Llama 3.2 3b Preview", "version": "1.1", "description": "Groq Llama 3.2 3b Preview with supercharged speed!", - "format": "api", - "settings": {}, "parameters": { "max_tokens": 8192, "temperature": 0.7, @@ -207,28 +116,14 @@ "frequency_penalty": 0, "presence_penalty": 0 }, - "metadata": { - "author": "Meta", - "tags": [ - "General", - "Big Context Length" - ] - }, "engine": "groq" }, { - "sources": [ - { - "url": "https://groq.com" - } - ], - "id": "llama-3.2-90b-text-preview", + "model": "llama-3.2-90b-text-preview", "object": "model", "name": "Groq Llama 3.2 90b Text Preview", "version": "1.1", "description": "Groq Llama 3.2 90b Text Preview with supercharged speed!", - "format": "api", - "settings": {}, "parameters": { "max_tokens": 8192, "temperature": 0.7, @@ -238,28 +133,14 @@ "frequency_penalty": 0, "presence_penalty": 0 }, - "metadata": { - "author": "Meta", - "tags": [ - "General", - "Big Context Length" - ] - }, "engine": "groq" }, { - "sources": [ - { - "url": "https://groq.com" - } - ], - "id": "llama-3.2-90b-vision-preview", + "model": "llama-3.2-90b-vision-preview", "object": "model", "name": "Groq Llama 3.2 90b Vision Preview", "version": "1.1", "description": "Groq Llama 3.2 90b Vision Preview with supercharged speed!", - "format": "api", - "settings": {}, "parameters": { "max_tokens": 8192, "temperature": 0.7, @@ -269,58 +150,14 @@ "frequency_penalty": 0, "presence_penalty": 0 }, - "metadata": { - "author": "Meta", - "tags": [ - "General", - "Big Context Length" - ] - }, "engine": "groq" }, { - "sources": [ - { - "url": "https://groq.com" - } - ], - "id": "gemma-7b-it", - "object": "model", - "name": "Groq Gemma 7B Instruct", - "version": "1.2", - "description": "Groq Gemma 7B Instruct with supercharged speed!", - "format": "api", - "settings": {}, - "parameters": { - "max_tokens": 8192, - "temperature": 0.7, - "top_p": 0.95, - "stream": true, - "stop": [], - "frequency_penalty": 0, - "presence_penalty": 0 - }, - "metadata": { - "author": "Google", - "tags": [ - "General" - ] - }, - "engine": "groq" - }, - { - "sources": [ - { - "url": "https://groq.com" - } - ], - "id": "gemma2-9b-it", + "model": "gemma2-9b-it", "object": "model", "name": "Groq Gemma 9B Instruct", "version": "1.2", "description": "Groq Gemma 9b Instruct with supercharged speed!", - "format": "api", - "settings": {}, "parameters": { "max_tokens": 8192, "temperature": 0.7, @@ -330,27 +167,14 @@ "frequency_penalty": 0, "presence_penalty": 0 }, - "metadata": { - "author": "Google", - "tags": [ - "General" - ] - }, "engine": "groq" }, { - "sources": [ - { - "url": "https://groq.com" - } - ], - "id": 
"mixtral-8x7b-32768", + "model": "mixtral-8x7b-32768", "object": "model", "name": "Groq Mixtral 8x7B Instruct", "version": "1.2", "description": "Groq Mixtral 8x7B Instruct is Mixtral with supercharged speed!", - "format": "api", - "settings": {}, "parameters": { "max_tokens": 32768, "temperature": 0.7, @@ -360,13 +184,6 @@ "frequency_penalty": 0, "presence_penalty": 0 }, - "metadata": { - "author": "Mistral", - "tags": [ - "General", - "Big Context Length" - ] - }, "engine": "groq" } -] \ No newline at end of file +] diff --git a/extensions/inference-martian-extension/resources/models.json b/extensions/engine-management-extension/models/martian.json similarity index 63% rename from extensions/inference-martian-extension/resources/models.json rename to extensions/engine-management-extension/models/martian.json index cf59e958e..b935587cc 100644 --- a/extensions/inference-martian-extension/resources/models.json +++ b/extensions/engine-management-extension/models/martian.json @@ -1,17 +1,10 @@ [ { - "sources": [ - { - "url": "https://withmartian.com/" - } - ], - "id": "router", + "model": "router", "object": "model", "name": "Martian Model Router", "version": "1.0", "description": "Martian Model Router dynamically routes requests to the best LLM in real-time", - "format": "api", - "settings": {}, "parameters": { "max_tokens": 4096, "temperature": 0.7, @@ -21,12 +14,6 @@ "frequency_penalty": 0, "presence_penalty": 0 }, - "metadata": { - "author": "Martian", - "tags": [ - "General" - ] - }, "engine": "martian" } -] \ No newline at end of file +] diff --git a/extensions/inference-mistral-extension/resources/models.json b/extensions/engine-management-extension/models/mistral.json similarity index 58% rename from extensions/inference-mistral-extension/resources/models.json rename to extensions/engine-management-extension/models/mistral.json index 23ecd6fdd..47833a31c 100644 --- a/extensions/inference-mistral-extension/resources/models.json +++ b/extensions/engine-management-extension/models/mistral.json @@ -1,83 +1,44 @@ [ { - "sources": [ - { - "url": "https://docs.mistral.ai/api/" - } - ], - "id": "mistral-small-latest", + "model": "mistral-small-latest", "object": "model", "name": "Mistral Small", "version": "1.1", "description": "Mistral Small is the ideal choice for simple tasks (Classification, Customer Support, or Text Generation) at an affordable price.", - "format": "api", - "settings": {}, "parameters": { "max_tokens": 32000, "temperature": 0.7, "top_p": 0.95, "stream": true }, - "metadata": { - "author": "Mistral", - "tags": [ - "General" - ] - }, "engine": "mistral" }, { - "sources": [ - { - "url": "https://docs.mistral.ai/api/" - } - ], - "id": "mistral-large-latest", + "model": "mistral-large-latest", "object": "model", "name": "Mistral Large", "version": "1.1", "description": "Mistral Large is ideal for complex tasks (Synthetic Text Generation, Code Generation, RAG, or Agents).", - "format": "api", - "settings": {}, "parameters": { "max_tokens": 32000, "temperature": 0.7, "top_p": 0.95, "stream": true }, - "metadata": { - "author": "Mistral", - "tags": [ - "General" - ] - }, "engine": "mistral" }, { - "sources": [ - { - "url": "https://docs.mistral.ai/api/" - } - ], - "id": "open-mixtral-8x22b", + "model": "open-mixtral-8x22b", "object": "model", "name": "Mixtral 8x22B", "version": "1.1", "description": "Mixtral 8x22B is a high-performance, cost-effective model designed for complex tasks.", - "format": "api", - "settings": {}, "parameters": { "max_tokens": 32000, "temperature": 0.7, 
"top_p": 0.95, "stream": true }, - "metadata": { - "author": "Mistral", - "tags": [ - "General" - ] - }, "engine": "mistral" } ] diff --git a/extensions/inference-nvidia-extension/resources/models.json b/extensions/engine-management-extension/models/nvidia.json similarity index 57% rename from extensions/inference-nvidia-extension/resources/models.json rename to extensions/engine-management-extension/models/nvidia.json index b97644fc9..f2adac779 100644 --- a/extensions/inference-nvidia-extension/resources/models.json +++ b/extensions/engine-management-extension/models/nvidia.json @@ -1,17 +1,10 @@ [ { - "sources": [ - { - "url": "https://integrate.api.nvidia.com/v1/chat/completions" - } - ], - "id": "mistralai/mistral-7b-instruct-v0.2", + "model": "mistralai/mistral-7b-instruct-v0.2", "object": "model", "name": "Mistral 7B", "version": "1.1", "description": "Mistral 7B with NVIDIA", - "format": "api", - "settings": {}, "parameters": { "max_tokens": 1024, "temperature": 0.3, @@ -22,10 +15,6 @@ "stop": null, "seed": null }, - "metadata": { - "author": "NVIDIA", - "tags": ["General"] - }, "engine": "nvidia" } ] diff --git a/extensions/inference-openai-extension/resources/models.json b/extensions/engine-management-extension/models/openai.json similarity index 62% rename from extensions/inference-openai-extension/resources/models.json rename to extensions/engine-management-extension/models/openai.json index 0c822fde2..8f59b42ea 100644 --- a/extensions/inference-openai-extension/resources/models.json +++ b/extensions/engine-management-extension/models/openai.json @@ -1,18 +1,12 @@ [ { - "sources": [ - { - "url": "https://openai.com" - } - ], - "id": "gpt-4-turbo", + "model": "gpt-4-turbo", "object": "model", "name": "OpenAI GPT 4 Turbo", "version": "1.2", "description": "OpenAI GPT 4 Turbo model is extremely good", "format": "api", - "settings": {}, - "parameters": { + "inference_params": { "max_tokens": 4096, "temperature": 0.7, "top_p": 0.95, @@ -21,26 +15,16 @@ "frequency_penalty": 0, "presence_penalty": 0 }, - "metadata": { - "author": "OpenAI", - "tags": ["General"] - }, "engine": "openai" }, { - "sources": [ - { - "url": "https://openai.com" - } - ], - "id": "gpt-3.5-turbo", + "model": "gpt-3.5-turbo", "object": "model", "name": "OpenAI GPT 3.5 Turbo", "version": "1.1", "description": "OpenAI GPT 3.5 Turbo model is extremely fast", "format": "api", - "settings": {}, - "parameters": { + "inference_params": { "max_tokens": 4096, "temperature": 0.7, "top_p": 0.95, @@ -49,28 +33,16 @@ "frequency_penalty": 0, "presence_penalty": 0 }, - "metadata": { - "author": "OpenAI", - "tags": ["General"] - }, "engine": "openai" }, { - "sources": [ - { - "url": "https://openai.com" - } - ], - "id": "gpt-4o", + "model": "gpt-4o", "object": "model", "name": "OpenAI GPT 4o", "version": "1.1", "description": "OpenAI GPT 4o is a new flagship model with fast speed and high quality", "format": "api", - "settings": { - "vision_model": true - }, - "parameters": { + "inference_params": { "max_tokens": 4096, "temperature": 0.7, "top_p": 0.95, @@ -79,28 +51,16 @@ "frequency_penalty": 0, "presence_penalty": 0 }, - "metadata": { - "author": "OpenAI", - "tags": ["General"] - }, "engine": "openai" }, { - "sources": [ - { - "url": "https://openai.com" - } - ], - "id": "gpt-4o-mini", + "model": "gpt-4o-mini", "object": "model", "name": "OpenAI GPT 4o-mini", "version": "1.1", "description": "GPT-4o mini (“o” for “omni”) is a fast, affordable small model for focused tasks.", "format": "api", - "settings": { - "vision_model": 
true - }, - "parameters": { + "inference_params": { "max_tokens": 16384, "temperature": 0.7, "top_p": 0.95, @@ -109,26 +69,16 @@ "frequency_penalty": 0, "presence_penalty": 0 }, - "metadata": { - "author": "OpenAI", - "tags": ["General"] - }, "engine": "openai" }, { - "sources": [ - { - "url": "https://openai.com" - } - ], - "id": "o1", + "model": "o1", "object": "model", "name": "OpenAI o1", "version": "1.0", "description": "OpenAI o1 is a new model with complex reasoning", "format": "api", - "settings": {}, - "parameters": { + "inference_params": { "max_tokens": 100000, "temperature": 1, "top_p": 1, @@ -136,26 +86,16 @@ "frequency_penalty": 0, "presence_penalty": 0 }, - "metadata": { - "author": "OpenAI", - "tags": ["General"] - }, "engine": "openai" }, { - "sources": [ - { - "url": "https://openai.com" - } - ], - "id": "o1-preview", + "model": "o1-preview", "object": "model", "name": "OpenAI o1-preview", "version": "1.0", "description": "OpenAI o1-preview is a new model with complex reasoning", "format": "api", - "settings": {}, - "parameters": { + "inference_params": { "max_tokens": 32768, "temperature": 1, "top_p": 1, @@ -163,26 +103,16 @@ "frequency_penalty": 0, "presence_penalty": 0 }, - "metadata": { - "author": "OpenAI", - "tags": ["General"] - }, "engine": "openai" }, { - "sources": [ - { - "url": "https://openai.com" - } - ], - "id": "o1-mini", + "model": "o1-mini", "object": "model", "name": "OpenAI o1-mini", "version": "1.0", "description": "OpenAI o1-mini is a lightweight reasoning model", "format": "api", - "settings": {}, - "parameters": { + "inference_params": { "max_tokens": 65536, "temperature": 1, "top_p": 1, @@ -190,10 +120,6 @@ "frequency_penalty": 0, "presence_penalty": 0 }, - "metadata": { - "author": "OpenAI", - "tags": ["General"] - }, "engine": "openai" } ] diff --git a/extensions/inference-openrouter-extension/resources/models.json b/extensions/engine-management-extension/models/openrouter.json similarity index 63% rename from extensions/inference-openrouter-extension/resources/models.json rename to extensions/engine-management-extension/models/openrouter.json index 31dea8734..5ac189a81 100644 --- a/extensions/inference-openrouter-extension/resources/models.json +++ b/extensions/engine-management-extension/models/openrouter.json @@ -1,17 +1,10 @@ [ { - "sources": [ - { - "url": "https://openrouter.ai" - } - ], - "id": "open-router-auto", + "model": "open-router-auto", "object": "model", "name": "OpenRouter", "version": "1.0", "description": " OpenRouter scouts for the lowest prices and best latencies/throughputs across dozens of providers, and lets you choose how to prioritize them.", - "format": "api", - "settings": {}, "parameters": { "max_tokens": 128000, "temperature": 0.7, @@ -19,10 +12,6 @@ "frequency_penalty": 0, "presence_penalty": 0 }, - "metadata": { - "author": "OpenRouter", - "tags": ["General", "Big Context Length"] - }, "engine": "openrouter" } ] diff --git a/extensions/engine-management-extension/resources/anthropic.json b/extensions/engine-management-extension/resources/anthropic.json new file mode 100644 index 000000000..a599d7ce3 --- /dev/null +++ b/extensions/engine-management-extension/resources/anthropic.json @@ -0,0 +1,22 @@ +{ + "id": "@janhq/inference-anthropic-extension", + "type": "remote", + "engine": "anthropic", + "url": "https://api.anthropic.com", + "api_key": "", + "metadata": { + "get_models_url": "https://api.anthropic.com/v1/models", + "header_template": "x-api-key: {{api_key}} anthropic-version: 2023-06-01", + "transform_req": 
{ + "chat_completions": { + "url": "https://api.anthropic.com/v1/messages", + "template": "{ {% for key, value in input_request %} {% if key == \"messages\" %} {% if input_request.messages.0.role == \"system\" %} \"system\": \"{{ input_request.messages.0.content }}\", \"messages\": [{% for message in input_request.messages %} {% if not loop.is_first %} {\"role\": \"{{ message.role }}\", \"content\": \"{{ message.content }}\" } {% if not loop.is_last %},{% endif %} {% endif %} {% endfor %}] {% else %} \"messages\": [{% for message in input_request.messages %} {\"role\": \"{{ message.role}}\", \"content\": \"{{ message.content }}\" } {% if not loop.is_last %},{% endif %} {% endfor %}] {% endif %} {% if not loop.is_last %},{% endif %} {% else if key == \"system\" or key == \"model\" or key == \"temperature\" or key == \"store\" or key == \"max_tokens\" or key == \"stream\" or key == \"presence_penalty\" or key == \"metadata\" or key == \"frequency_penalty\" or key == \"tools\" or key == \"tool_choice\" or key == \"logprobs\" or key == \"top_logprobs\" or key == \"logit_bias\" or key == \"n\" or key == \"modalities\" or key == \"prediction\" or key == \"response_format\" or key == \"service_tier\" or key == \"seed\" or key == \"stop\" or key == \"stream_options\" or key == \"top_p\" or key == \"parallel_tool_calls\" or key == \"user\" %}\"{{ key }}\": {{ tojson(value) }} {% if not loop.is_last %},{% endif %} {% endif %} {% endfor %} }" + } + }, + "transform_resp": { + "chat_completions": { + "template": "{% if input_request.stream %} {\"object\": \"chat.completion.chunk\", \"model\": \"{{ input_request.model }}\", \"choices\": [{\"index\": 0, \"delta\": { {% if input_request.type == \"message_start\" %} \"role\": \"assistant\", \"content\": null {% else if input_request.type == \"ping\" %} \"role\": \"assistant\", \"content\": null {% else if input_request.type == \"content_block_delta\" %} \"role\": \"assistant\", \"content\": \"{{ input_request.delta.text }}\" {% else if input_request.type == \"content_block_stop\" %} \"role\": \"assistant\", \"content\": null {% else if input_request.type == \"content_block_stop\" %} \"role\": \"assistant\", \"content\": null {% endif %} }, {% if input_request.type == \"content_block_stop\" %} \"finish_reason\": \"stop\" {% else %} \"finish_reason\": null {% endif %} }]} {% else %} {\"id\": \"{{ input_request.id }}\", \"created\": null, \"object\": \"chat.completion\", \"model\": \"{{ input_request.model }}\", \"choices\": [{ \"index\": 0, \"message\": { \"role\": \"{{ input_request.role }}\", \"content\": \"{% if input_request.content and input_request.content.0.type == \"text\" %} \"{{input_request.content.0.text}}\" {% endif %}\", \"refusal\": null }, \"logprobs\": null, \"finish_reason\": \"{{ input_request.stop_reason }}\" } ], \"usage\": { \"prompt_tokens\": {{ input_request.usage.input_tokens }}, \"completion_tokens\": {{ input_request.usage.output_tokens }}, \"total_tokens\": {{ input_request.usage.input_tokens + input_request.usage.output_tokens }}, \"prompt_tokens_details\": { \"cached_tokens\": 0 }, \"completion_tokens_details\": { \"reasoning_tokens\": 0, \"accepted_prediction_tokens\": 0, \"rejected_prediction_tokens\": 0 } }, \"system_fingerprint\": \"fp_6b68a8204b\"} {% endif %}" + } + } + } +} diff --git a/extensions/engine-management-extension/resources/cohere.json b/extensions/engine-management-extension/resources/cohere.json new file mode 100644 index 000000000..6cb51dc04 --- /dev/null +++ 
b/extensions/engine-management-extension/resources/cohere.json @@ -0,0 +1,22 @@ +{ + "id": "@janhq/inference-cohere-extension", + "type": "remote", + "engine": "cohere", + "url": "https://api.cohere.ai", + "api_key": "", + "metadata": { + "get_models_url": "https://api.cohere.ai/v1/models", + "header_template": "Authorization: Bearer {{api_key}}", + "transform_req": { + "chat_completions": { + "url": "https://api.cohere.ai/v1/chat", + "template": "{ {% for key, value in input_request %} {% if key == \"messages\" %} {% if input_request.messages.0.role == \"system\" %} \"preamble\": \"{{ input_request.messages.0.content }}\", {% if length(input_request.messages) > 2 %} \"chatHistory\": [{% for message in input_request.messages %} {% if not loop.is_first and not loop.is_last %} {\"role\": {% if message.role == \"user\" %} \"USER\" {% else %} \"CHATBOT\" {% endif %}, \"content\": \"{{ message.content }}\" } {% if loop.index < length(input_request.messages) - 2 %},{% endif %} {% endif %} {% endfor %}], {% endif %} \"message\": \"{{ last(input_request.messages).content }}\" {% else %} {% if length(input_request.messages) > 2 %} \"chatHistory\": [{% for message in input_request.messages %} {% if not loop.is_last %} { \"role\": {% if message.role == \"user\" %} \"USER\" {% else %} \"CHATBOT\" {% endif %}, \"content\": \"{{ message.content }}\" } {% if loop.index < length(input_request.messages) - 2 %},{% endif %} {% endif %} {% endfor %}],{% endif %}\"message\": \"{{ last(input_request.messages).content }}\" {% endif %}{% if not loop.is_last %},{% endif %} {% else if key == \"system\" or key == \"model\" or key == \"temperature\" or key == \"store\" or key == \"max_tokens\" or key == \"stream\" or key == \"presence_penalty\" or key == \"metadata\" or key == \"frequency_penalty\" or key == \"tools\" or key == \"tool_choice\" or key == \"logprobs\" or key == \"top_logprobs\" or key == \"logit_bias\" or key == \"n\" or key == \"modalities\" or key == \"prediction\" or key == \"response_format\" or key == \"service_tier\" or key == \"seed\" or key == \"stop\" or key == \"stream_options\" or key == \"top_p\" or key == \"parallel_tool_calls\" or key == \"user\" %} \"{{ key }}\": {{ tojson(value) }} {% if not loop.is_last %},{% endif %} {% endif %} {% endfor %} }" + } + }, + "transform_resp": { + "chat_completions": { + "template": "{% if input_request.stream %} {\"object\": \"chat.completion.chunk\", \"model\": \"{{ input_request.model }}\", \"choices\": [{\"index\": 0, \"delta\": { {% if input_request.event_type == \"text-generation\" %} \"role\": \"assistant\", \"content\": \"{{ input_request.text }}\" {% else %} \"role\": \"assistant\", \"content\": null {% endif %} }, {% if input_request.event_type == \"stream-end\" %} \"finish_reason\": \"{{ input_request.finish_reason }}\" {% else %} \"finish_reason\": null {% endif %} }]} {% else %} {\"id\": \"{{ input_request.generation_id }}\", \"created\": null, \"object\": \"chat.completion\", \"model\": {% if input_request.model %} \"{{ input_request.model }}\" {% else %} \"command-r-plus-08-2024\" {% endif %}, \"choices\": [{ \"index\": 0, \"message\": { \"role\": \"assistant\", \"content\": {% if not input_request.text %} null {% else %} \"{{ input_request.text }}\" {% endif %}, \"refusal\": null }, \"logprobs\": null, \"finish_reason\": \"{{ input_request.finish_reason }}\" } ], \"usage\": { \"prompt_tokens\": {{ input_request.meta.tokens.input_tokens }}, \"completion_tokens\": {{ input_request.meta.tokens.output_tokens }},\"total_tokens\": {{ 
input_request.meta.tokens.input_tokens + input_request.meta.tokens.output_tokens }}, \"prompt_tokens_details\": { \"cached_tokens\": 0 },\"completion_tokens_details\": { \"reasoning_tokens\": 0, \"accepted_prediction_tokens\": 0, \"rejected_prediction_tokens\": 0 } }, \"system_fingerprint\": \"fp_6b68a8204b\"} {% endif %}" + } + } + } +} diff --git a/extensions/engine-management-extension/resources/groq.json b/extensions/engine-management-extension/resources/groq.json new file mode 100644 index 000000000..6be1ce6ef --- /dev/null +++ b/extensions/engine-management-extension/resources/groq.json @@ -0,0 +1,22 @@ +{ + "id": "@janhq/inference-groq-extension", + "type": "remote", + "engine": "groq", + "url": "https://api.groq.com", + "api_key": "", + "metadata": { + "get_models_url": "https://api.groq.com/openai/v1/models", + "header_template": "Authorization: Bearer {{api_key}}", + "transform_req": { + "chat_completions": { + "url": "https://api.groq.com/openai/v1/chat/completions", + "template": "{ {% set first = true %} {% for key, value in input_request %} {% if key == \"messages\" or key == \"model\" or key == \"temperature\" or key == \"store\" or key == \"max_tokens\" or key == \"stream\" or key == \"presence_penalty\" or key == \"metadata\" or key == \"frequency_penalty\" or key == \"tools\" or key == \"tool_choice\" or key == \"logprobs\" or key == \"top_logprobs\" or key == \"logit_bias\" or key == \"n\" or key == \"modalities\" or key == \"prediction\" or key == \"response_format\" or key == \"service_tier\" or key == \"seed\" or key == \"stop\" or key == \"stream_options\" or key == \"top_p\" or key == \"parallel_tool_calls\" or key == \"user\" %} {% if not first %},{% endif %} \"{{ key }}\": {{ tojson(value) }} {% set first = false %} {% endif %} {% endfor %} }" + } + }, + "transform_resp": { + "chat_completions": { + "template": "{ {% set first = true %} {% for key, value in input_request %} {% if key == \"choices\" or key == \"created\" or key == \"model\" or key == \"service_tier\" or key == \"system_fingerprint\" or key == \"stream\" or key == \"object\" or key == \"usage\" %} {% if not first %},{% endif %} \"{{ key }}\": {{ tojson(value) }} {% set first = false %} {% endif %} {% endfor %} }" + } + } + } +} diff --git a/extensions/engine-management-extension/resources/martian.json b/extensions/engine-management-extension/resources/martian.json new file mode 100644 index 000000000..4523ab754 --- /dev/null +++ b/extensions/engine-management-extension/resources/martian.json @@ -0,0 +1,22 @@ +{ + "id": "@janhq/inference-martian-extension", + "type": "remote", + "engine": "martian", + "url": "https://withmartian.com", + "api_key": "", + "metadata": { + "get_models_url": "https://withmartian.com/api/openai/v1/models", + "header_template": "Authorization: Bearer {{api_key}}", + "transform_req": { + "chat_completions": { + "url": "https://withmartian.com/api/openai/v1/chat/completions", + "template": "{ {% set first = true %} {% for key, value in input_request %} {% if key == \"messages\" or key == \"model\" or key == \"temperature\" or key == \"store\" or key == \"max_tokens\" or key == \"stream\" or key == \"presence_penalty\" or key == \"metadata\" or key == \"frequency_penalty\" or key == \"tools\" or key == \"tool_choice\" or key == \"logprobs\" or key == \"top_logprobs\" or key == \"logit_bias\" or key == \"n\" or key == \"modalities\" or key == \"prediction\" or key == \"response_format\" or key == \"service_tier\" or key == \"seed\" or key == \"stop\" or key == 
\"stream_options\" or key == \"top_p\" or key == \"parallel_tool_calls\" or key == \"user\" %} {% if not first %},{% endif %} \"{{ key }}\": {{ tojson(value) }} {% set first = false %} {% endif %} {% endfor %} }" + } + }, + "transform_resp": { + "chat_completions": { + "template": "{ {% set first = true %} {% for key, value in input_request %} {% if key == \"choices\" or key == \"created\" or key == \"model\" or key == \"service_tier\" or key == \"system_fingerprint\" or key == \"stream\" or key == \"object\" or key == \"usage\" %} {% if not first %},{% endif %} \"{{ key }}\": {{ tojson(value) }} {% set first = false %} {% endif %} {% endfor %} }" + } + } + } +} diff --git a/extensions/engine-management-extension/resources/mistral.json b/extensions/engine-management-extension/resources/mistral.json new file mode 100644 index 000000000..4a032c4c8 --- /dev/null +++ b/extensions/engine-management-extension/resources/mistral.json @@ -0,0 +1,22 @@ +{ + "id": "@janhq/inference-mistral-extension", + "type": "remote", + "engine": "mistral", + "url": "https://api.mistral.ai", + "api_key": "", + "metadata": { + "get_models_url": "https://api.mistral.ai/v1/models", + "header_template": "Authorization: Bearer {{api_key}}", + "transform_req": { + "chat_completions": { + "url": "https://api.mistral.ai/v1/chat/completions", + "template": "{ {% set first = true %} {% for key, value in input_request %} {% if key == \"messages\" or key == \"model\" or key == \"temperature\" or key == \"store\" or key == \"max_tokens\" or key == \"stream\" or key == \"presence_penalty\" or key == \"metadata\" or key == \"frequency_penalty\" or key == \"tools\" or key == \"tool_choice\" or key == \"logprobs\" or key == \"top_logprobs\" or key == \"logit_bias\" or key == \"n\" or key == \"modalities\" or key == \"prediction\" or key == \"response_format\" or key == \"service_tier\" or key == \"seed\" or key == \"stop\" or key == \"stream_options\" or key == \"top_p\" or key == \"parallel_tool_calls\" or key == \"user\" %} {% if not first %},{% endif %} \"{{ key }}\": {{ tojson(value) }} {% set first = false %} {% endif %} {% endfor %} }" + } + }, + "transform_resp": { + "chat_completions": { + "template": "{ {% set first = true %} {% for key, value in input_request %} {% if key == \"choices\" or key == \"created\" or key == \"model\" or key == \"service_tier\" or key == \"system_fingerprint\" or key == \"stream\" or key == \"object\" or key == \"usage\" %} {% if not first %},{% endif %} \"{{ key }}\": {{ tojson(value) }} {% set first = false %} {% endif %} {% endfor %} }" + } + } + } +} diff --git a/extensions/engine-management-extension/resources/nvidia.json b/extensions/engine-management-extension/resources/nvidia.json new file mode 100644 index 000000000..fa224c32c --- /dev/null +++ b/extensions/engine-management-extension/resources/nvidia.json @@ -0,0 +1,22 @@ +{ + "id": "@janhq/inference-nvidia-extension", + "type": "remote", + "engine": "nvidia", + "url": "https://integrate.api.nvidia.com", + "api_key": "", + "metadata": { + "get_models_url": "https://integrate.api.nvidia.com/v1/models", + "header_template": "Authorization: Bearer {{api_key}}", + "transform_req": { + "chat_completions": { + "url": "https://integrate.api.nvidia.com/v1/chat/completions", + "template": "{ {% set first = true %} {% for key, value in input_request %} {% if key == \"messages\" or key == \"model\" or key == \"temperature\" or key == \"store\" or key == \"max_tokens\" or key == \"stream\" or key == \"presence_penalty\" or key == \"metadata\" or 
key == \"frequency_penalty\" or key == \"tools\" or key == \"tool_choice\" or key == \"logprobs\" or key == \"top_logprobs\" or key == \"logit_bias\" or key == \"n\" or key == \"modalities\" or key == \"prediction\" or key == \"response_format\" or key == \"service_tier\" or key == \"seed\" or key == \"stop\" or key == \"stream_options\" or key == \"top_p\" or key == \"parallel_tool_calls\" or key == \"user\" %} {% if not first %},{% endif %} \"{{ key }}\": {{ tojson(value) }} {% set first = false %} {% endif %} {% endfor %} }" + } + }, + "transform_resp": { + "chat_completions": { + "template": "{ {% set first = true %} {% for key, value in input_request %} {% if key == \"choices\" or key == \"created\" or key == \"model\" or key == \"service_tier\" or key == \"system_fingerprint\" or key == \"stream\" or key == \"object\" or key == \"usage\" %} {% if not first %},{% endif %} \"{{ key }}\": {{ tojson(value) }} {% set first = false %} {% endif %} {% endfor %} }" + } + } + } +} diff --git a/extensions/engine-management-extension/resources/openai.json b/extensions/engine-management-extension/resources/openai.json new file mode 100644 index 000000000..8f86a1785 --- /dev/null +++ b/extensions/engine-management-extension/resources/openai.json @@ -0,0 +1,22 @@ +{ + "id": "@janhq/inference-openai-extension", + "type": "remote", + "engine": "openai", + "url": "https://api.openai.com", + "api_key": "", + "metadata": { + "get_models_url": "https://api.openai.com/v1/models", + "header_template": "Authorization: Bearer {{api_key}}", + "transform_req": { + "chat_completions": { + "url": "https://api.openai.com/v1/chat/completions", + "template": "{ {% set first = true %}{% for key, value in input_request %}{% if key == \"model\" or key == \"temperature\" or key == \"store\" or key == \"messages\" or key == \"stream\" or key == \"presence_penalty\" or key == \"metadata\" or key == \"frequency_penalty\" or key == \"tools\" or key == \"tool_choice\" or key == \"logprobs\" or key == \"top_logprobs\" or key == \"logit_bias\" or key == \"n\" or key == \"modalities\" or key == \"prediction\" or key == \"response_format\" or key == \"service_tier\" or key == \"seed\" or key == \"stream_options\" or key == \"top_p\" or key == \"parallel_tool_calls\" or key == \"user\" or (not \"o1\" in input_request.model and (key == \"max_tokens\" or key == \"stop\")) %} {% if key == \"max_tokens\" and \"o1\" in input_request.model %} \"max_completion_tokens\": {{ tojson(value) }} {% else %} {% if not first %},{% endif %} \"{{ key }}\": {{ tojson(value) }} {% set first = false %} {% endif %} {% endif %} {% endfor %} }" + } + }, + "transform_resp": { + "chat_completions": { + "template": "{ {% set first = true %} {% for key, value in input_request %} {% if key == \"choices\" or key == \"created\" or key == \"model\" or key == \"service_tier\" or key == \"stream\" or key == \"object\" or key == \"usage\" %} {% if not first %},{% endif %} \"{{ key }}\": {{ tojson(value) }} {% set first = false %} {% endif %} {% endfor %} }" + } + } + } +} diff --git a/extensions/engine-management-extension/resources/openrouter.json b/extensions/engine-management-extension/resources/openrouter.json new file mode 100644 index 000000000..631b211fa --- /dev/null +++ b/extensions/engine-management-extension/resources/openrouter.json @@ -0,0 +1,22 @@ +{ + "id": "@janhq/inference-openrouter-extension", + "type": "remote", + "engine": "openrouter", + "url": "https://openrouter.ai", + "api_key": "", + "metadata": { + "get_models_url": 
"https://openrouter.ai/api/v1/models", + "header_template": "Authorization: Bearer {{api_key}}", + "transform_req": { + "chat_completions": { + "url": "https://openrouter.ai/api/v1/chat/completions", + "template": "{ {% set first = true %} {% for key, value in input_request %} {% if key == \"messages\" or key == \"temperature\" or key == \"store\" or key == \"max_tokens\" or key == \"stream\" or key == \"presence_penalty\" or key == \"metadata\" or key == \"frequency_penalty\" or key == \"tools\" or key == \"tool_choice\" or key == \"logprobs\" or key == \"top_logprobs\" or key == \"logit_bias\" or key == \"n\" or key == \"modalities\" or key == \"prediction\" or key == \"response_format\" or key == \"service_tier\" or key == \"seed\" or key == \"stop\" or key == \"stream_options\" or key == \"top_p\" or key == \"parallel_tool_calls\" or key == \"user\" %} {% if not first %},{% endif %} \"{{ key }}\": {{ tojson(value) }} {% set first = false %} {% endif %} {% endfor %} }" + } + }, + "transform_resp": { + "chat_completions": { + "template": "{ {% set first = true %} {% for key, value in input_request %} {% if key == \"choices\" or key == \"created\" or key == \"model\" or key == \"service_tier\" or key == \"system_fingerprint\" or key == \"stream\" or key == \"object\" or key == \"usage\" %} {% if not first %},{% endif %} \"{{ key }}\": {{ tojson(value) }} {% set first = false %} {% endif %} {% endfor %} }" + } + } + } +} diff --git a/extensions/engine-management-extension/rolldown.config.mjs b/extensions/engine-management-extension/rolldown.config.mjs index 038f23cc3..b59d395d1 100644 --- a/extensions/engine-management-extension/rolldown.config.mjs +++ b/extensions/engine-management-extension/rolldown.config.mjs @@ -1,4 +1,5 @@ import { defineConfig } from 'rolldown' +import { engines, models } from './engines.mjs' import pkgJson from './package.json' with { type: 'json' } export default defineConfig([ @@ -13,6 +14,8 @@ export default defineConfig([ API_URL: JSON.stringify('http://127.0.0.1:39291'), SOCKET_URL: JSON.stringify('ws://127.0.0.1:39291'), CORTEX_ENGINE_VERSION: JSON.stringify('v0.1.43'), + DEFAULT_REMOTE_ENGINES: JSON.stringify(engines), + DEFAULT_REMOTE_MODELS: JSON.stringify(models), }, }, { diff --git a/extensions/engine-management-extension/src/@types/global.d.ts b/extensions/engine-management-extension/src/@types/global.d.ts index 8d0a94fef..2d520d5f9 100644 --- a/extensions/engine-management-extension/src/@types/global.d.ts +++ b/extensions/engine-management-extension/src/@types/global.d.ts @@ -3,6 +3,12 @@ declare const CORTEX_ENGINE_VERSION: string declare const SOCKET_URL: string declare const NODE: string +declare const DEFAULT_REMOTE_ENGINES: ({ + id: string + engine: string +} & EngineConfig)[] +declare const DEFAULT_REMOTE_MODELS: Model[] + interface Core { api: APIFunctions events: EventEmitter diff --git a/extensions/engine-management-extension/src/index.ts b/extensions/engine-management-extension/src/index.ts index 215ae3bc2..0d30bf4ea 100644 --- a/extensions/engine-management-extension/src/index.ts +++ b/extensions/engine-management-extension/src/index.ts @@ -3,14 +3,22 @@ import { InferenceEngine, DefaultEngineVariant, Engines, + EngineConfig, EngineVariant, EngineReleased, executeOnMain, systemInformation, + Model, + fs, + joinPath, + events, + ModelEvent, + EngineEvent, } from '@janhq/core' import ky, { HTTPError } from 'ky' import PQueue from 'p-queue' import { EngineError } from './error' +import { getJanDataFolderPath } from '@janhq/core' /** * 
JSONEngineManagementExtension is an EngineManagementExtension implementation that provides @@ -27,41 +35,11 @@ export default class JSONEngineManagementExtension extends EngineManagementExten await executeOnMain(NODE, 'symlinkEngines') // Run Healthcheck this.queue.add(() => this.healthz()) - try { - const variant = await this.getDefaultEngineVariant( - InferenceEngine.cortex_llamacpp - ) - const installedEngines = await this.getInstalledEngines( - InferenceEngine.cortex_llamacpp - ) - if ( - !installedEngines.some( - (e) => e.name === variant.variant && e.version === variant.version - ) - ) { - throw new EngineError( - 'Default engine is not available, use bundled version.' - ) - } - } catch (error) { - if ( - (error instanceof HTTPError && error.response.status === 400) || - error instanceof EngineError - ) { - const systemInfo = await systemInformation() - const variant = await executeOnMain( - NODE, - 'engineVariant', - systemInfo.gpuSetting - ) - await this.setDefaultEngineVariant(InferenceEngine.cortex_llamacpp, { - variant: variant, - version: `${CORTEX_ENGINE_VERSION}`, - }) - } else { - console.error('An unexpected error occurred:', error) - } - } + // Update default local engine + this.updateDefaultEngine() + + // Populate default remote engines + this.populateDefaultRemoteEngines() } /** @@ -81,6 +59,19 @@ export default class JSONEngineManagementExtension extends EngineManagementExten ) as Promise } + /** + * @returns A Promise that resolves to the list of remote models for the given engine. + */ + async getRemoteModels(name: string): Promise { + return this.queue.add(() => + ky + .get(`${API_URL}/v1/models/remote/${name}`) + .json() + .then((e) => e) + .catch(() => []) + ) as Promise + } + /** * @param name - Inference engine name. * @returns A Promise that resolves to an array of installed engines. @@ -135,10 +126,7 @@ export default class JSONEngineManagementExtension extends EngineManagementExten * @param name - Inference engine name. * @returns A Promise that resolves when the engine is installed. */ - async installEngine( - name: InferenceEngine, - engineConfig: { variant: string; version?: string } - ) { + async installEngine(name: string, engineConfig: EngineConfig) { return this.queue.add(() => ky .post(`${API_URL}/v1/engines/${name}/install`, { json: engineConfig }) @@ -146,14 +134,21 @@ export default class JSONEngineManagementExtension extends EngineManagementExten ) as Promise<{ messages: string }> } + /** + * Add a new remote engine + * @returns A Promise that resolves when the remote engine is added. + */ + async addRemoteEngine(engineConfig: EngineConfig) { + return this.queue.add(() => + ky.post(`${API_URL}/v1/engines`, { json: engineConfig }).then((e) => e) + ) as Promise<{ messages: string }> + } + /** * @param name - Inference engine name. * @returns A Promise that resolves when the engine is uninstalled. */ - async uninstallEngine( - name: InferenceEngine, - engineConfig: { variant: string; version: string } - ) { + async uninstallEngine(name: InferenceEngine, engineConfig: EngineConfig) { return this.queue.add(() => ky .delete(`${API_URL}/v1/engines/${name}/install`, { json: engineConfig }) @@ -161,6 +156,16 @@ export default class JSONEngineManagementExtension extends EngineManagementExten ) as Promise<{ messages: string }> } + /** + * Add a new remote model + * @param model - Remote model object. + */ + async addRemoteModel(model: Model) { + return this.queue.add(() => + ky.post(`${API_URL}/v1/models/add`, { json: model }).then((e) => e) + ) + } + /** * @param name - Inference engine name. 
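The new methods are thin ky wrappers over the backend's REST API: POST /v1/engines registers a remote engine, GET /v1/models/remote/{name} lists the models it serves, and POST /v1/models/add persists a model entry. A usage sketch, assuming EngineConfig carries the fields seen in the resource JSONs (the import path and API key are placeholders, and metadata with the request/response templates is omitted for brevity):

```typescript
// Usage sketch: register a remote engine, then pull its model list.
import type JSONEngineManagementExtension from './index' // illustrative path

async function setUpOpenAI(ext: JSONEngineManagementExtension) {
  await ext.addRemoteEngine({
    engine: 'openai',
    type: 'remote',
    url: 'https://api.openai.com',
    api_key: 'sk-...', // placeholder key
  })
  const models = await ext.getRemoteModels('openai')
  console.log(models)
}
```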
* @returns A Promise that resolves to the default engine variant. @@ -181,7 +186,7 @@ export default class JSONEngineManagementExtension extends EngineManagementExten */ async setDefaultEngineVariant( name: InferenceEngine, - engineConfig: { variant: string; version: string } + engineConfig: EngineConfig ) { return this.queue.add(() => ky @@ -193,9 +198,11 @@ export default class JSONEngineManagementExtension extends EngineManagementExten /** * @returns A Promise that resolves when the engine is updated. */ - async updateEngine(name: InferenceEngine) { + async updateEngine(name: InferenceEngine, engineConfig?: EngineConfig) { return this.queue.add(() => - ky.post(`${API_URL}/v1/engines/${name}/update`).then((e) => e) + ky + .post(`${API_URL}/v1/engines/${name}/update`, { json: engineConfig }) + .then((e) => e) ) as Promise<{ messages: string }> } @@ -210,4 +217,90 @@ export default class JSONEngineManagementExtension extends EngineManagementExten }) .then(() => {}) } + + /** + * Update the default local engine. + * Falls back to the bundled engine variant when no default engine is set. + */ + async updateDefaultEngine() { + try { + const variant = await this.getDefaultEngineVariant( + InferenceEngine.cortex_llamacpp + ) + const installedEngines = await this.getInstalledEngines( + InferenceEngine.cortex_llamacpp + ) + if ( + !installedEngines.some( + (e) => e.name === variant.variant && e.version === variant.version + ) + ) { + throw new EngineError( + 'Default engine is not available, use bundled version.' + ) + } + } catch (error) { + if ( + (error instanceof HTTPError && error.response.status === 400) || + error instanceof EngineError + ) { + const systemInfo = await systemInformation() + const variant = await executeOnMain( + NODE, + 'engineVariant', + systemInfo.gpuSetting + ) + await this.setDefaultEngineVariant(InferenceEngine.cortex_llamacpp, { + variant: variant, + version: `${CORTEX_ENGINE_VERSION}`, + }) + } else { + console.error('An unexpected error occurred:', error) + } + } + } + + /** + * Populate the default remote engines when no customized remote engine settings exist. + */ + async populateDefaultRemoteEngines() { + const engines = await this.getEngines() + if ( + !Object.values(engines) + .flat() + .some((e) => e.type === 'remote') + ) { + await Promise.all( + DEFAULT_REMOTE_ENGINES.map(async (engine) => { + const { id, ...data } = engine + + /// BEGIN - Migrate legacy api key settings + let api_key = undefined + if (id) { + const apiKeyPath = await joinPath([ + await getJanDataFolderPath(), + 'settings', + id, + 'settings.json', + ]) + if (await fs.existsSync(apiKeyPath)) { + const settings = await fs.readFileSync(apiKeyPath, 'utf-8') + api_key = JSON.parse(settings).find( + (e) => e.key === `${data.engine}-api-key` + )?.controllerProps?.value + } + } + data.api_key = api_key + /// END - Migrate legacy api key settings + + await this.addRemoteEngine(data).catch(console.error) + }) + ) + events.emit(EngineEvent.OnEngineUpdate, {}) + DEFAULT_REMOTE_MODELS.forEach(async (data: Model) => { + await this.addRemoteModel(data).catch(() => {}) + }) + events.emit(ModelEvent.OnModelsUpdate, { fetch: true }) + } + } } diff --git a/extensions/engine-management-extension/tsconfig.json b/extensions/engine-management-extension/tsconfig.json index 891d28a60..72e1e1895 100644 --- a/extensions/engine-management-extension/tsconfig.json +++ b/extensions/engine-management-extension/tsconfig.json @@ -8,7 +8,8 @@ "forceConsistentCasingInFileNames": true, "strict": false, "skipLibCheck": 
true, - "rootDir": "./src" + "rootDir": "./src", + "resolveJsonModule": true }, "include": ["./src"], "exclude": ["src/**/*.test.ts", "rolldown.config.mjs"] diff --git a/extensions/inference-anthropic-extension/README.md b/extensions/inference-anthropic-extension/README.md deleted file mode 100644 index 1c0dcbd3d..000000000 --- a/extensions/inference-anthropic-extension/README.md +++ /dev/null @@ -1,79 +0,0 @@ -# Anthropic Engine Extension - -Created using Jan extension example - -# Create a Jan Extension using Typescript - -Use this template to bootstrap the creation of a TypeScript Jan extension. 🚀 - -## Create Your Own Extension - -To create your own extension, you can use this repository as a template! Just follow the below instructions: - -1. Click the Use this template button at the top of the repository -2. Select Create a new repository -3. Select an owner and name for your new repository -4. Click Create repository -5. Clone your new repository - -## Initial Setup - -After you've cloned the repository to your local machine or codespace, you'll need to perform some initial setup steps before you can develop your extension. - -> [!NOTE] -> -> You'll need to have a reasonably modern version of -> [Node.js](https://nodejs.org) handy. If you are using a version manager like -> [`nodenv`](https://github.com/nodenv/nodenv) or -> [`nvm`](https://github.com/nvm-sh/nvm), you can run `nodenv install` in the -> root of your repository to install the version specified in -> [`package.json`](./package.json). Otherwise, 20.x or later should work! - -1. :hammer_and_wrench: Install the dependencies - - ```bash - npm install - ``` - -1. :building_construction: Package the TypeScript for distribution - - ```bash - npm run bundle - ``` - -1. :white_check_mark: Check your artifact - - There will be a tgz file in your extension directory now - -## Update the Extension Metadata - -The [`package.json`](package.json) file defines metadata about your extension, such as -extension name, main entry, description and version. - -When you copy this repository, update `package.json` with the name, description for your extension. - -## Update the Extension Code - -The [`src/`](./src/) directory is the heart of your extension! This contains the -source code that will be run when your extension functions are invoked. You can replace the -contents of this directory with your own code. - -There are a few things to keep in mind when writing your extension code: - -- Most Jan Extension functions are processed asynchronously. - In `index.ts`, you will see that the extension function will return a `Promise`. - - ```typescript - import { events, MessageEvent, MessageRequest } from '@janhq/core' - - function onStart(): Promise { - return events.on(MessageEvent.OnMessageSent, (data: MessageRequest) => - this.inference(data) - ) - } - ``` - - For more information about the Jan Extension Core module, see the - [documentation](https://github.com/janhq/jan/blob/main/core/README.md). - -So, what are you waiting for? Go ahead and start customizing your extension! 
diff --git a/extensions/inference-anthropic-extension/jest.config.js b/extensions/inference-anthropic-extension/jest.config.js deleted file mode 100644 index 3e32adceb..000000000 --- a/extensions/inference-anthropic-extension/jest.config.js +++ /dev/null @@ -1,9 +0,0 @@ -/** @type {import('ts-jest').JestConfigWithTsJest} */ -module.exports = { - preset: 'ts-jest', - testEnvironment: 'node', - transform: { - 'node_modules/@janhq/core/.+\\.(j|t)s?$': 'ts-jest', - }, - transformIgnorePatterns: ['node_modules/(?!@janhq/core/.*)'], -} diff --git a/extensions/inference-anthropic-extension/package.json b/extensions/inference-anthropic-extension/package.json deleted file mode 100644 index cb064d2aa..000000000 --- a/extensions/inference-anthropic-extension/package.json +++ /dev/null @@ -1,42 +0,0 @@ -{ - "name": "@janhq/inference-anthropic-extension", - "productName": "Anthropic Inference Engine", - "version": "1.0.3", - "description": "This extension enables Anthropic chat completion API calls", - "main": "dist/index.js", - "engine": "anthropic", - "author": "Jan ", - "license": "AGPL-3.0", - "scripts": { - "test": "jest test", - "build": "rolldown -c rolldown.config.mjs", - "build:publish": "rimraf *.tgz --glob || true && yarn build && npm pack && cpx *.tgz ../../pre-install" - }, - "devDependencies": { - "cpx": "^1.5.0", - "rimraf": "^3.0.2", - "rolldown": "1.0.0-beta.1", - "ts-loader": "^9.5.0", - "typescript": "^5.7.2" - }, - "dependencies": { - "@janhq/core": "../../core/package.tgz", - "fetch-retry": "^5.0.6", - "ulidx": "^2.3.0" - }, - "engines": { - "node": ">=18.0.0" - }, - "files": [ - "dist/*", - "package.json", - "README.md" - ], - "bundleDependencies": [ - "fetch-retry" - ], - "installConfig": { - "hoistingLimits": "workspaces" - }, - "packageManager": "yarn@4.5.3" -} diff --git a/extensions/inference-anthropic-extension/resources/settings.json b/extensions/inference-anthropic-extension/resources/settings.json deleted file mode 100644 index 9ca4405ac..000000000 --- a/extensions/inference-anthropic-extension/resources/settings.json +++ /dev/null @@ -1,24 +0,0 @@ -[ - { - "key": "anthropic-api-key", - "title": "API Key", - "description": "The Anthropic API uses API keys for authentication. Visit your [API Keys](https://console.anthropic.com/settings/keys) page to retrieve the API key you'll use in your requests.", - "controllerType": "input", - "controllerProps": { - "placeholder": "Insert API Key", - "value": "", - "type": "password", - "inputActions": ["unobscure", "copy"] - } - }, - { - "key": "chat-completions-endpoint", - "title": "Chat Completions Endpoint", - "description": "The endpoint to use for chat completions. 
See the [Anthropic API documentation](https://docs.anthropic.com/claude/docs/intro-to-claude) for more information.", - "controllerType": "input", - "controllerProps": { - "placeholder": "https://api.anthropic.com/v1/messages", - "value": "https://api.anthropic.com/v1/messages" - } - } -] diff --git a/extensions/inference-anthropic-extension/rolldown.config.mjs b/extensions/inference-anthropic-extension/rolldown.config.mjs deleted file mode 100644 index 9ebaace2e..000000000 --- a/extensions/inference-anthropic-extension/rolldown.config.mjs +++ /dev/null @@ -1,18 +0,0 @@ -import { defineConfig } from 'rolldown' -import pkgJson from './package.json' with { type: 'json' } -import settingJson from './resources/settings.json' with { type: 'json' } -import modelsJson from './resources/models.json' with { type: 'json' } - -export default defineConfig({ - input: 'src/index.ts', - output: { - format: 'esm', - file: 'dist/index.js', - }, - platform: 'browser', - define: { - MODELS: JSON.stringify(modelsJson), - SETTINGS: JSON.stringify(settingJson), - ENGINE: JSON.stringify(pkgJson.engine), - }, -}) diff --git a/extensions/inference-anthropic-extension/src/anthropic.test.ts b/extensions/inference-anthropic-extension/src/anthropic.test.ts deleted file mode 100644 index 703ead0fb..000000000 --- a/extensions/inference-anthropic-extension/src/anthropic.test.ts +++ /dev/null @@ -1,77 +0,0 @@ -// Import necessary modules -import JanInferenceAnthropicExtension, { Settings } from '.' -import { PayloadType, ChatCompletionRole } from '@janhq/core' - -// Mocks -jest.mock('@janhq/core', () => ({ - RemoteOAIEngine: jest.fn().mockImplementation(() => ({ - registerSettings: jest.fn(), - registerModels: jest.fn(), - getSetting: jest.fn(), - onChange: jest.fn(), - onSettingUpdate: jest.fn(), - onLoad: jest.fn(), - headers: jest.fn(), - })), - PayloadType: jest.fn(), - ChatCompletionRole: { - User: 'user' as const, - Assistant: 'assistant' as const, - System: 'system' as const, - }, -})) - -// Helper functions -const createMockPayload = (): PayloadType => ({ - messages: [ - { role: ChatCompletionRole.System, content: 'Meow' }, - { role: ChatCompletionRole.User, content: 'Hello' }, - { role: ChatCompletionRole.Assistant, content: 'Hi there' }, - ], - model: 'claude-v1', - stream: false, -}) - -describe('JanInferenceAnthropicExtension', () => { - let extension: JanInferenceAnthropicExtension - - beforeEach(() => { - extension = new JanInferenceAnthropicExtension('', '') - extension.apiKey = 'mock-api-key' - extension.inferenceUrl = 'mock-endpoint' - jest.clearAllMocks() - }) - - it('should initialize with correct settings', async () => { - await extension.onLoad() - expect(extension.apiKey).toBe('mock-api-key') - expect(extension.inferenceUrl).toBe('mock-endpoint') - }) - - it('should transform payload correctly', () => { - const payload = createMockPayload() - const transformedPayload = extension.transformPayload(payload) - - expect(transformedPayload).toEqual({ - max_tokens: 4096, - model: 'claude-v1', - stream: false, - system: 'Meow', - messages: [ - { role: 'user', content: 'Hello' }, - { role: 'assistant', content: 'Hi there' }, - ], - }) - }) - - it('should transform response correctly', () => { - const nonStreamResponse = { content: [{ text: 'Test response' }] } - const streamResponse = - 'data: {"type":"content_block_delta","delta":{"text":"Hello"}}' - - expect(extension.transformResponse(nonStreamResponse)).toBe('Test response') - expect(extension.transformResponse(streamResponse)).toBe('Hello') - 
expect(extension.transformResponse('')).toBe('') - expect(extension.transformResponse('event: something')).toBe('') - }) -}) diff --git a/extensions/inference-anthropic-extension/src/env.d.ts b/extensions/inference-anthropic-extension/src/env.d.ts deleted file mode 100644 index 40ca58094..000000000 --- a/extensions/inference-anthropic-extension/src/env.d.ts +++ /dev/null @@ -1,2 +0,0 @@ -declare const SETTINGS: SettingComponentProps[] -declare const MODELS: Model[] diff --git a/extensions/inference-anthropic-extension/src/index.ts b/extensions/inference-anthropic-extension/src/index.ts deleted file mode 100644 index 8c286d7a5..000000000 --- a/extensions/inference-anthropic-extension/src/index.ts +++ /dev/null @@ -1,150 +0,0 @@ -/** - * @file This file exports a class that implements the InferenceExtension interface from the @janhq/core package. - * The class provides methods for initializing and stopping a model, and for making inference requests. - * It also subscribes to events emitted by the @janhq/core package and handles new message requests. - * @version 1.0.0 - * @module inference-anthropic-extension/src/index - */ - -import { RemoteOAIEngine } from '@janhq/core' -import { PayloadType } from '@janhq/core' -import { ChatCompletionRole } from '@janhq/core' - -export enum Settings { - apiKey = 'anthropic-api-key', - chatCompletionsEndPoint = 'chat-completions-endpoint', -} - -type AnthropicPayloadType = { - stream: boolean - model?: string - max_tokens?: number - messages?: Array<{ role: string; content: string }> - system?: string -} - -/** - * A class that implements the InferenceExtension interface from the @janhq/core package. - * The class provides methods for initializing and stopping a model, and for making inference requests. - * It also subscribes to events emitted by the @janhq/core package and handles new message requests. 
- */ -export default class JanInferenceAnthropicExtension extends RemoteOAIEngine { - inferenceUrl: string = '' - provider: string = 'anthropic' - maxTokens: number = 4096 - - override async onLoad(): Promise { - super.onLoad() - - // Register Settings - this.registerSettings(SETTINGS) - this.registerModels(MODELS) - - this.apiKey = await this.getSetting(Settings.apiKey, '') - this.inferenceUrl = await this.getSetting( - Settings.chatCompletionsEndPoint, - '' - ) - - if (this.inferenceUrl.length === 0) { - SETTINGS.forEach((setting) => { - if (setting.key === Settings.chatCompletionsEndPoint) { - this.inferenceUrl = setting.controllerProps.value as string - } - }) - } - } - - // Override the headers method to include the x-API-key in the request headers - override async headers(): Promise { - return { - 'Content-Type': 'application/json', - 'x-api-key': this.apiKey, - 'anthropic-version': '2023-06-01', - } - } - - onSettingUpdate(key: string, value: T): void { - if (key === Settings.apiKey) { - this.apiKey = value as string - } else if (key === Settings.chatCompletionsEndPoint) { - if (typeof value !== 'string') return - - if (value.trim().length === 0) { - SETTINGS.forEach((setting) => { - if (setting.key === Settings.chatCompletionsEndPoint) { - this.inferenceUrl = setting.controllerProps.value as string - } - }) - } else { - this.inferenceUrl = value - } - } - } - - // Override the transformPayload method to convert the payload to the required format - transformPayload = (payload: PayloadType): AnthropicPayloadType => { - if (!payload.messages || payload.messages.length === 0) { - return { - max_tokens: this.maxTokens, - messages: [], - model: payload.model, - stream: payload.stream, - } - } - - const convertedData: AnthropicPayloadType = { - max_tokens: this.maxTokens, - messages: [], - model: payload.model, - stream: payload.stream, - } - - payload.messages.forEach((item) => { - if (item.role === ChatCompletionRole.User) { - convertedData.messages.push({ - role: 'user', - content: item.content as string, - }) - } else if (item.role === ChatCompletionRole.Assistant) { - convertedData.messages.push({ - role: 'assistant', - content: item.content as string, - }) - } else if (item.role === ChatCompletionRole.System) { - // When using Claude, you can dramatically improve its performance by using the system parameter to give it a role. - // This technique, known as role prompting, is the most powerful way to use system prompts with Claude. - convertedData.system = item.content as string - } - }) - - return convertedData - } - - // Sample returned stream data from anthropic - // {"type":"content_block_start","index":0,"content_block":{"type":"text","text":""} } - // {"type":"content_block_delta","index":0,"delta":{"type":"text_delta","text":"Hello"} } - // {"type":"content_block_stop","index":0 } - // {"type":"message_delta","delta":{"stop_reason":"end_turn","stop_sequence":null},"usage":{"output_tokens":12} } - - // Override the transformResponse method to convert the response to the required format - transformResponse = (data: any): string => { - // handling stream response - if (typeof data === 'string' && data.trim().length === 0) return '' - if (typeof data === 'string' && data.startsWith('event: ')) return '' - if (typeof data === 'string' && data.startsWith('data: ')) { - data = data.replace('data: ', '') - const parsedData = JSON.parse(data) - if (parsedData.type !== 'content_block_delta') return '' - return parsedData.delta?.text ?? 
'' - } - - // non stream response - if (data.content && data.content.length > 0 && data.content[0].text) { - return data.content[0].text - } - - console.error('Invalid response format:', data) - return '' - } -} diff --git a/extensions/inference-anthropic-extension/tsconfig.json b/extensions/inference-anthropic-extension/tsconfig.json deleted file mode 100644 index 6db951c9e..000000000 --- a/extensions/inference-anthropic-extension/tsconfig.json +++ /dev/null @@ -1,15 +0,0 @@ -{ - "compilerOptions": { - "target": "es2016", - "module": "ES6", - "moduleResolution": "node", - "outDir": "./dist", - "esModuleInterop": true, - "forceConsistentCasingInFileNames": true, - "strict": false, - "skipLibCheck": true, - "rootDir": "./src" - }, - "include": ["./src"], - "exclude": ["**/*.test.ts"] -} diff --git a/extensions/inference-cohere-extension/README.md b/extensions/inference-cohere-extension/README.md deleted file mode 100644 index 089a096e8..000000000 --- a/extensions/inference-cohere-extension/README.md +++ /dev/null @@ -1,79 +0,0 @@ -# Cohere Engine Extension - -Created using Jan extension example - -# Create a Jan Extension using Typescript - -Use this template to bootstrap the creation of a TypeScript Jan extension. 🚀 - -## Create Your Own Extension - -To create your own extension, you can use this repository as a template! Just follow the below instructions: - -1. Click the Use this template button at the top of the repository -2. Select Create a new repository -3. Select an owner and name for your new repository -4. Click Create repository -5. Clone your new repository - -## Initial Setup - -After you've cloned the repository to your local machine or codespace, you'll need to perform some initial setup steps before you can develop your extension. - -> [!NOTE] -> -> You'll need to have a reasonably modern version of -> [Node.js](https://nodejs.org) handy. If you are using a version manager like -> [`nodenv`](https://github.com/nodenv/nodenv) or -> [`nvm`](https://github.com/nvm-sh/nvm), you can run `nodenv install` in the -> root of your repository to install the version specified in -> [`package.json`](./package.json). Otherwise, 20.x or later should work! - -1. :hammer_and_wrench: Install the dependencies - - ```bash - npm install - ``` - -1. :building_construction: Package the TypeScript for distribution - - ```bash - npm run bundle - ``` - -1. :white_check_mark: Check your artifact - - There will be a tgz file in your extension directory now - -## Update the Extension Metadata - -The [`package.json`](package.json) file defines metadata about your extension, such as -extension name, main entry, description and version. - -When you copy this repository, update `package.json` with the name, description for your extension. - -## Update the Extension Code - -The [`src/`](./src/) directory is the heart of your extension! This contains the -source code that will be run when your extension functions are invoked. You can replace the -contents of this directory with your own code. - -There are a few things to keep in mind when writing your extension code: - -- Most Jan Extension functions are processed asynchronously. - In `index.ts`, you will see that the extension function will return a `Promise`. 
- - ```typescript - import { events, MessageEvent, MessageRequest } from '@janhq/core' - - function onStart(): Promise { - return events.on(MessageEvent.OnMessageSent, (data: MessageRequest) => - this.inference(data) - ) - } - ``` - - For more information about the Jan Extension Core module, see the - [documentation](https://github.com/janhq/jan/blob/main/core/README.md). - -So, what are you waiting for? Go ahead and start customizing your extension! diff --git a/extensions/inference-cohere-extension/package.json b/extensions/inference-cohere-extension/package.json deleted file mode 100644 index 7058c0e53..000000000 --- a/extensions/inference-cohere-extension/package.json +++ /dev/null @@ -1,46 +0,0 @@ -{ - "name": "@janhq/inference-cohere-extension", - "productName": "Cohere Inference Engine", - "version": "1.0.0", - "description": "This extension enables Cohere chat completion API calls", - "main": "dist/index.js", - "module": "dist/module.js", - "engine": "cohere", - "author": "Jan ", - "license": "AGPL-3.0", - "scripts": { - "build": "rolldown -c rolldown.config.mjs", - "build:publish": "rimraf *.tgz --glob || true && yarn build && npm pack && cpx *.tgz ../../pre-install" - }, - "exports": { - ".": "./dist/index.js", - "./main": "./dist/module.js" - }, - "devDependencies": { - "cpx": "^1.5.0", - "rimraf": "^3.0.2", - "rolldown": "1.0.0-beta.1", - "ts-loader": "^9.5.0", - "typescript": "^5.7.2" - }, - "dependencies": { - "@janhq/core": "../../core/package.tgz", - "fetch-retry": "^5.0.6", - "ulidx": "^2.3.0" - }, - "engines": { - "node": ">=18.0.0" - }, - "files": [ - "dist/*", - "package.json", - "README.md" - ], - "bundleDependencies": [ - "fetch-retry" - ], - "installConfig": { - "hoistingLimits": "workspaces" - }, - "packageManager": "yarn@4.5.3" -} diff --git a/extensions/inference-cohere-extension/resources/settings.json b/extensions/inference-cohere-extension/resources/settings.json deleted file mode 100644 index 79150d7e5..000000000 --- a/extensions/inference-cohere-extension/resources/settings.json +++ /dev/null @@ -1,24 +0,0 @@ -[ - { - "key": "cohere-api-key", - "title": "API Key", - "description": "The Cohere API uses API keys for authentication. Visit your [API Keys](https://dashboard.cohere.com/api-keys) page to retrieve the API key you'll use in your requests.", - "controllerType": "input", - "controllerProps": { - "placeholder": "Insert API Key", - "value": "", - "type": "password", - "inputActions": ["unobscure", "copy"] - } - }, - { - "key": "chat-completions-endpoint", - "title": "Chat Completions Endpoint", - "description": "The endpoint to use for chat completions. 
See the [Cohere API documentation](https://docs.cohere.com/reference/chat) for more information.", - "controllerType": "input", - "controllerProps": { - "placeholder": "https://api.cohere.ai/v1/chat", - "value": "https://api.cohere.ai/v1/chat" - } - } -] diff --git a/extensions/inference-cohere-extension/rolldown.config.mjs b/extensions/inference-cohere-extension/rolldown.config.mjs deleted file mode 100644 index 9ebaace2e..000000000 --- a/extensions/inference-cohere-extension/rolldown.config.mjs +++ /dev/null @@ -1,18 +0,0 @@ -import { defineConfig } from 'rolldown' -import pkgJson from './package.json' with { type: 'json' } -import settingJson from './resources/settings.json' with { type: 'json' } -import modelsJson from './resources/models.json' with { type: 'json' } - -export default defineConfig({ - input: 'src/index.ts', - output: { - format: 'esm', - file: 'dist/index.js', - }, - platform: 'browser', - define: { - MODELS: JSON.stringify(modelsJson), - SETTINGS: JSON.stringify(settingJson), - ENGINE: JSON.stringify(pkgJson.engine), - }, -}) diff --git a/extensions/inference-cohere-extension/src/env.d.ts b/extensions/inference-cohere-extension/src/env.d.ts deleted file mode 100644 index 40ca58094..000000000 --- a/extensions/inference-cohere-extension/src/env.d.ts +++ /dev/null @@ -1,2 +0,0 @@ -declare const SETTINGS: SettingComponentProps[] -declare const MODELS: Model[] diff --git a/extensions/inference-cohere-extension/src/index.ts b/extensions/inference-cohere-extension/src/index.ts deleted file mode 100644 index 018df60f9..000000000 --- a/extensions/inference-cohere-extension/src/index.ts +++ /dev/null @@ -1,117 +0,0 @@ -/** - * @file This file exports a class that implements the InferenceExtension interface from the @janhq/core package. - * The class provides methods for initializing and stopping a model, and for making inference requests. - * It also subscribes to events emitted by the @janhq/core package and handles new message requests. - * @version 1.0.0 - * @module inference-cohere-extension/src/index - */ - -import { RemoteOAIEngine } from '@janhq/core' -import { PayloadType } from '@janhq/core' -import { ChatCompletionRole } from '@janhq/core' - -enum Settings { - apiKey = 'cohere-api-key', - chatCompletionsEndPoint = 'chat-completions-endpoint', -} - -enum RoleType { - user = 'USER', - chatbot = 'CHATBOT', - system = 'SYSTEM', -} - -type CoherePayloadType = { - chat_history?: Array<{ role: RoleType; message: string }> - message?: string - preamble?: string -} - -/** - * A class that implements the InferenceExtension interface from the @janhq/core package. - * The class provides methods for initializing and stopping a model, and for making inference requests. - * It also subscribes to events emitted by the @janhq/core package and handles new message requests. 
- */ -export default class JanInferenceCohereExtension extends RemoteOAIEngine { - inferenceUrl: string = '' - provider: string = 'cohere' - - override async onLoad(): Promise { - super.onLoad() - - // Register Settings - this.registerSettings(SETTINGS) - this.registerModels(MODELS) - - this.apiKey = await this.getSetting(Settings.apiKey, '') - this.inferenceUrl = await this.getSetting( - Settings.chatCompletionsEndPoint, - '' - ) - if (this.inferenceUrl.length === 0) { - SETTINGS.forEach((setting) => { - if (setting.key === Settings.chatCompletionsEndPoint) { - this.inferenceUrl = setting.controllerProps.value as string - } - }) - } - } - - onSettingUpdate(key: string, value: T): void { - if (key === Settings.apiKey) { - this.apiKey = value as string - } else if (key === Settings.chatCompletionsEndPoint) { - if (typeof value !== 'string') return - - if (value.trim().length === 0) { - SETTINGS.forEach((setting) => { - if (setting.key === Settings.chatCompletionsEndPoint) { - this.inferenceUrl = setting.controllerProps.value as string - } - }) - } else { - this.inferenceUrl = value - } - } - } - - transformPayload = (payload: PayloadType): CoherePayloadType => { - if (payload.messages.length === 0) { - return {} - } - - const { messages, ...params } = payload - const convertedData: CoherePayloadType = { - ...params, - chat_history: [], - message: '', - } - messages.forEach((item, index) => { - // Assign the message of the last item to the `message` property - if (index === messages.length - 1) { - convertedData.message = item.content as string - return - } - if (item.role === ChatCompletionRole.User) { - convertedData.chat_history.push({ - role: RoleType.user, - message: item.content as string, - }) - } else if (item.role === ChatCompletionRole.Assistant) { - convertedData.chat_history.push({ - role: RoleType.chatbot, - message: item.content as string, - }) - } else if (item.role === ChatCompletionRole.System) { - convertedData.preamble = item.content as string - } - }) - return convertedData - } - - transformResponse = (data: any) => { - return typeof data === 'object' - ? data.text - : (JSON.parse(data.replace('data: ', '').trim()).text ?? 
'') - } -} diff --git a/extensions/inference-cohere-extension/tsconfig.json b/extensions/inference-cohere-extension/tsconfig.json deleted file mode 100644 index 2477d58ce..000000000 --- a/extensions/inference-cohere-extension/tsconfig.json +++ /dev/null @@ -1,14 +0,0 @@ -{ - "compilerOptions": { - "target": "es2016", - "module": "ES6", - "moduleResolution": "node", - "outDir": "./dist", - "esModuleInterop": true, - "forceConsistentCasingInFileNames": true, - "strict": false, - "skipLibCheck": true, - "rootDir": "./src" - }, - "include": ["./src"] -} diff --git a/extensions/inference-cortex-extension/bin/version.txt b/extensions/inference-cortex-extension/bin/version.txt index b0f3d96f8..9b3178149 100644 --- a/extensions/inference-cortex-extension/bin/version.txt +++ b/extensions/inference-cortex-extension/bin/version.txt @@ -1 +1 @@ -1.0.8 +1.0.9-rc1 diff --git a/extensions/inference-cortex-extension/src/@types/global.d.ts b/extensions/inference-cortex-extension/src/@types/global.d.ts index 907db0df1..2de432c29 100644 --- a/extensions/inference-cortex-extension/src/@types/global.d.ts +++ b/extensions/inference-cortex-extension/src/@types/global.d.ts @@ -2,5 +2,5 @@ declare const NODE: string declare const CORTEX_API_URL: string declare const CORTEX_SOCKET_URL: string declare const CORTEX_ENGINE_VERSION: string -declare const SETTINGS: object[] -declare const MODELS: object[] +declare const SETTINGS: any +declare const MODELS: any diff --git a/extensions/inference-cortex-extension/src/index.ts b/extensions/inference-cortex-extension/src/index.ts index 03c094ec1..84cc49b94 100644 --- a/extensions/inference-cortex-extension/src/index.ts +++ b/extensions/inference-cortex-extension/src/index.ts @@ -111,8 +111,6 @@ export default class JanInferenceCortexExtension extends LocalOAIEngine { ) if (!Number.isNaN(threads_number)) this.cpu_threads = threads_number - this.queue.add(() => this.clean()) - // Run the process watchdog const systemInfo = await systemInformation() this.queue.add(() => executeOnMain(NODE, 'run', systemInfo)) diff --git a/extensions/inference-groq-extension/README.md b/extensions/inference-groq-extension/README.md deleted file mode 100644 index f9690da09..000000000 --- a/extensions/inference-groq-extension/README.md +++ /dev/null @@ -1,75 +0,0 @@ -# Create a Jan Extension using Typescript - -Use this template to bootstrap the creation of a TypeScript Jan extension. 🚀 - -## Create Your Own Extension - -To create your own extension, you can use this repository as a template! Just follow the below instructions: - -1. Click the Use this template button at the top of the repository -2. Select Create a new repository -3. Select an owner and name for your new repository -4. Click Create repository -5. Clone your new repository - -## Initial Setup - -After you've cloned the repository to your local machine or codespace, you'll need to perform some initial setup steps before you can develop your extension. - -> [!NOTE] -> -> You'll need to have a reasonably modern version of -> [Node.js](https://nodejs.org) handy. If you are using a version manager like -> [`nodenv`](https://github.com/nodenv/nodenv) or -> [`nvm`](https://github.com/nvm-sh/nvm), you can run `nodenv install` in the -> root of your repository to install the version specified in -> [`package.json`](./package.json). Otherwise, 20.x or later should work! - -1. :hammer_and_wrench: Install the dependencies - - ```bash - npm install - ``` - -1. 
:building_construction: Package the TypeScript for distribution - - ```bash - npm run bundle - ``` - -1. :white_check_mark: Check your artifact - - There will be a tgz file in your extension directory now - -## Update the Extension Metadata - -The [`package.json`](package.json) file defines metadata about your extension, such as -extension name, main entry, description and version. - -When you copy this repository, update `package.json` with the name, description for your extension. - -## Update the Extension Code - -The [`src/`](./src/) directory is the heart of your extension! This contains the -source code that will be run when your extension functions are invoked. You can replace the -contents of this directory with your own code. - -There are a few things to keep in mind when writing your extension code: - -- Most Jan Extension functions are processed asynchronously. - In `index.ts`, you will see that the extension function will return a `Promise`. - - ```typescript - import { events, MessageEvent, MessageRequest } from '@janhq/core' - - function onStart(): Promise { - return events.on(MessageEvent.OnMessageSent, (data: MessageRequest) => - this.inference(data) - ) - } - ``` - - For more information about the Jan Extension Core module, see the - [documentation](https://github.com/janhq/jan/blob/main/core/README.md). - -So, what are you waiting for? Go ahead and start customizing your extension! diff --git a/extensions/inference-groq-extension/package.json b/extensions/inference-groq-extension/package.json deleted file mode 100644 index e400c517b..000000000 --- a/extensions/inference-groq-extension/package.json +++ /dev/null @@ -1,42 +0,0 @@ -{ - "name": "@janhq/inference-groq-extension", - "productName": "Groq Inference Engine", - "version": "1.0.1", - "description": "This extension enables fast Groq chat completion API calls", - "main": "dist/index.js", - "engine": "groq", - "module": "dist/module.js", - "author": "Carsen Klock & Jan", - "license": "AGPL-3.0", - "scripts": { - "build": "rolldown -c rolldown.config.mjs", - "build:publish": "rimraf *.tgz --glob || true && yarn build && npm pack && cpx *.tgz ../../pre-install" - }, - "devDependencies": { - "cpx": "^1.5.0", - "rimraf": "^3.0.2", - "rolldown": "1.0.0-beta.1", - "ts-loader": "^9.5.0", - "typescript": "^5.7.2" - }, - "dependencies": { - "@janhq/core": "../../core/package.tgz", - "fetch-retry": "^5.0.6", - "ulidx": "^2.3.0" - }, - "engines": { - "node": ">=18.0.0" - }, - "files": [ - "dist/*", - "package.json", - "README.md" - ], - "bundleDependencies": [ - "fetch-retry" - ], - "installConfig": { - "hoistingLimits": "workspaces" - }, - "packageManager": "yarn@4.5.3" -} diff --git a/extensions/inference-groq-extension/resources/settings.json b/extensions/inference-groq-extension/resources/settings.json deleted file mode 100644 index 767fec0ba..000000000 --- a/extensions/inference-groq-extension/resources/settings.json +++ /dev/null @@ -1,24 +0,0 @@ -[ - { - "key": "groq-api-key", - "title": "API Key", - "description": "The Groq API uses API keys for authentication. Visit your [API Keys](https://console.groq.com/keys) page to retrieve the API key you'll use in your requests.", - "controllerType": "input", - "controllerProps": { - "placeholder": "Insert API Key", - "value": "", - "type": "password", - "inputActions": ["unobscure", "copy"] - } - }, - { - "key": "chat-completions-endpoint", - "title": "Chat Completions Endpoint", - "description": "The endpoint to use for chat completions. 
See the [Groq documentation](https://console.groq.com/docs/openai) for more information.", - "controllerType": "input", - "controllerProps": { - "placeholder": "https://api.groq.com/openai/v1/chat/completions", - "value": "https://api.groq.com/openai/v1/chat/completions" - } - } -] diff --git a/extensions/inference-groq-extension/rolldown.config.mjs b/extensions/inference-groq-extension/rolldown.config.mjs deleted file mode 100644 index 9ebaace2e..000000000 --- a/extensions/inference-groq-extension/rolldown.config.mjs +++ /dev/null @@ -1,18 +0,0 @@ -import { defineConfig } from 'rolldown' -import pkgJson from './package.json' with { type: 'json' } -import settingJson from './resources/settings.json' with { type: 'json' } -import modelsJson from './resources/models.json' with { type: 'json' } - -export default defineConfig({ - input: 'src/index.ts', - output: { - format: 'esm', - file: 'dist/index.js', - }, - platform: 'browser', - define: { - MODELS: JSON.stringify(modelsJson), - SETTINGS: JSON.stringify(settingJson), - ENGINE: JSON.stringify(pkgJson.engine), - }, -}) diff --git a/extensions/inference-groq-extension/src/env.d.ts b/extensions/inference-groq-extension/src/env.d.ts deleted file mode 100644 index 40ca58094..000000000 --- a/extensions/inference-groq-extension/src/env.d.ts +++ /dev/null @@ -1,2 +0,0 @@ -declare const SETTINGS: SettingComponentProps[] -declare const MODELS: Model[] diff --git a/extensions/inference-groq-extension/src/index.ts b/extensions/inference-groq-extension/src/index.ts deleted file mode 100644 index d6969b48f..000000000 --- a/extensions/inference-groq-extension/src/index.ts +++ /dev/null @@ -1,64 +0,0 @@ -/** - * @file This file exports a class that implements the InferenceExtension interface from the @janhq/core package. - * The class provides methods for initializing and stopping a model, and for making inference requests. - * It also subscribes to events emitted by the @janhq/core package and handles new message requests. - * @version 1.0.0 - * @module inference-groq-extension/src/index - */ - -import { RemoteOAIEngine } from '@janhq/core' - -enum Settings { - apiKey = 'groq-api-key', - chatCompletionsEndPoint = 'chat-completions-endpoint', -} -/** - * A class that implements the InferenceExtension interface from the @janhq/core package. - * The class provides methods for initializing and stopping a model, and for making inference requests. - * It also subscribes to events emitted by the @janhq/core package and handles new message requests. 
- */ -export default class JanInferenceGroqExtension extends RemoteOAIEngine { - inferenceUrl: string = '' - provider = 'groq' - - override async onLoad(): Promise { - super.onLoad() - - // Register Settings - this.registerSettings(SETTINGS) - this.registerModels(MODELS) - - // Retrieve API Key Setting - this.apiKey = await this.getSetting(Settings.apiKey, '') - this.inferenceUrl = await this.getSetting( - Settings.chatCompletionsEndPoint, - '' - ) - - if (this.inferenceUrl.length === 0) { - SETTINGS.forEach((setting) => { - if (setting.key === Settings.chatCompletionsEndPoint) { - this.inferenceUrl = setting.controllerProps.value as string - } - }) - } - } - - onSettingUpdate(key: string, value: T): void { - if (key === Settings.apiKey) { - this.apiKey = value as string - } else if (key === Settings.chatCompletionsEndPoint) { - if (typeof value !== 'string') return - - if (value.trim().length === 0) { - SETTINGS.forEach((setting) => { - if (setting.key === Settings.chatCompletionsEndPoint) { - this.inferenceUrl = setting.controllerProps.value as string - } - }) - } else { - this.inferenceUrl = value - } - } - } -} diff --git a/extensions/inference-groq-extension/tsconfig.json b/extensions/inference-groq-extension/tsconfig.json deleted file mode 100644 index 2477d58ce..000000000 --- a/extensions/inference-groq-extension/tsconfig.json +++ /dev/null @@ -1,14 +0,0 @@ -{ - "compilerOptions": { - "target": "es2016", - "module": "ES6", - "moduleResolution": "node", - "outDir": "./dist", - "esModuleInterop": true, - "forceConsistentCasingInFileNames": true, - "strict": false, - "skipLibCheck": true, - "rootDir": "./src" - }, - "include": ["./src"] -} diff --git a/extensions/inference-martian-extension/README.md b/extensions/inference-martian-extension/README.md deleted file mode 100644 index 5b8e898d7..000000000 --- a/extensions/inference-martian-extension/README.md +++ /dev/null @@ -1,79 +0,0 @@ -# Martian Engine Extension - -Created using Jan extension example - -# Create a Jan Extension using Typescript - -Use this template to bootstrap the creation of a TypeScript Jan extension. 🚀 - -## Create Your Own Extension - -To create your own extension, you can use this repository as a template! Just follow the below instructions: - -1. Click the Use this template button at the top of the repository -2. Select Create a new repository -3. Select an owner and name for your new repository -4. Click Create repository -5. Clone your new repository - -## Initial Setup - -After you've cloned the repository to your local machine or codespace, you'll need to perform some initial setup steps before you can develop your extension. - -> [!NOTE] -> -> You'll need to have a reasonably modern version of -> [Node.js](https://nodejs.org) handy. If you are using a version manager like -> [`nodenv`](https://github.com/nodenv/nodenv) or -> [`nvm`](https://github.com/nvm-sh/nvm), you can run `nodenv install` in the -> root of your repository to install the version specified in -> [`package.json`](./package.json). Otherwise, 20.x or later should work! - -1. :hammer_and_wrench: Install the dependencies - - ```bash - npm install - ``` - -1. :building_construction: Package the TypeScript for distribution - - ```bash - npm run bundle - ``` - -1. :white_check_mark: Check your artifact - - There will be a tgz file in your extension directory now - -## Update the Extension Metadata - -The [`package.json`](package.json) file defines metadata about your extension, such as -extension name, main entry, description and version. 
- -When you copy this repository, update `package.json` with the name, description for your extension. - -## Update the Extension Code - -The [`src/`](./src/) directory is the heart of your extension! This contains the -source code that will be run when your extension functions are invoked. You can replace the -contents of this directory with your own code. - -There are a few things to keep in mind when writing your extension code: - -- Most Jan Extension functions are processed asynchronously. - In `index.ts`, you will see that the extension function will return a `Promise`. - - ```typescript - import { events, MessageEvent, MessageRequest } from '@janhq/core' - - function onStart(): Promise { - return events.on(MessageEvent.OnMessageSent, (data: MessageRequest) => - this.inference(data) - ) - } - ``` - - For more information about the Jan Extension Core module, see the - [documentation](https://github.com/janhq/jan/blob/main/core/README.md). - -So, what are you waiting for? Go ahead and start customizing your extension! diff --git a/extensions/inference-martian-extension/package.json b/extensions/inference-martian-extension/package.json deleted file mode 100644 index c1371917c..000000000 --- a/extensions/inference-martian-extension/package.json +++ /dev/null @@ -1,42 +0,0 @@ -{ - "name": "@janhq/inference-martian-extension", - "productName": "Martian Inference Engine", - "version": "1.0.1", - "description": "This extension enables Martian chat completion API calls", - "main": "dist/index.js", - "module": "dist/module.js", - "engine": "martian", - "author": "Jan ", - "license": "AGPL-3.0", - "scripts": { - "build": "rolldown -c rolldown.config.mjs", - "build:publish": "rimraf *.tgz --glob || true && yarn build && npm pack && cpx *.tgz ../../pre-install" - }, - "devDependencies": { - "cpx": "^1.5.0", - "rimraf": "^3.0.2", - "rolldown": "1.0.0-beta.1", - "ts-loader": "^9.5.0", - "typescript": "^5.7.2" - }, - "dependencies": { - "@janhq/core": "../../core/package.tgz", - "fetch-retry": "^5.0.6", - "ulidx": "^2.3.0" - }, - "engines": { - "node": ">=18.0.0" - }, - "files": [ - "dist/*", - "package.json", - "README.md" - ], - "bundleDependencies": [ - "fetch-retry" - ], - "installConfig": { - "hoistingLimits": "workspaces" - }, - "packageManager": "yarn@4.5.3" -} diff --git a/extensions/inference-martian-extension/resources/settings.json b/extensions/inference-martian-extension/resources/settings.json deleted file mode 100644 index 6825099f5..000000000 --- a/extensions/inference-martian-extension/resources/settings.json +++ /dev/null @@ -1,24 +0,0 @@ -[ - { - "key": "martian-api-key", - "title": "API Key", - "description": "The Martian API uses API keys for authentication. Visit your [API Keys](https://withmartian.com/dashboard) page to retrieve the API key you'll use in your requests.", - "controllerType": "input", - "controllerProps": { - "placeholder": "Insert API Key", - "value": "", - "type": "password", - "inputActions": ["unobscure", "copy"] - } - }, - { - "key": "chat-completions-endpoint", - "title": "Chat Completions Endpoint", - "description": "The endpoint to use for chat completions. 
See the [Martian API documentation](https://docs.withmartian.com/martian-model-router/getting-started/quickstart-integrating-martian-into-your-codebase) for more information.", - "controllerType": "input", - "controllerProps": { - "placeholder": "https://withmartian.com/api/openai/v1/chat/completions", - "value": "https://withmartian.com/api/openai/v1/chat/completions" - } - } -] diff --git a/extensions/inference-martian-extension/rolldown.config.mjs b/extensions/inference-martian-extension/rolldown.config.mjs deleted file mode 100644 index 9ebaace2e..000000000 --- a/extensions/inference-martian-extension/rolldown.config.mjs +++ /dev/null @@ -1,18 +0,0 @@ -import { defineConfig } from 'rolldown' -import pkgJson from './package.json' with { type: 'json' } -import settingJson from './resources/settings.json' with { type: 'json' } -import modelsJson from './resources/models.json' with { type: 'json' } - -export default defineConfig({ - input: 'src/index.ts', - output: { - format: 'esm', - file: 'dist/index.js', - }, - platform: 'browser', - define: { - MODELS: JSON.stringify(modelsJson), - SETTINGS: JSON.stringify(settingJson), - ENGINE: JSON.stringify(pkgJson.engine), - }, -}) diff --git a/extensions/inference-martian-extension/src/env.d.ts b/extensions/inference-martian-extension/src/env.d.ts deleted file mode 100644 index 40ca58094..000000000 --- a/extensions/inference-martian-extension/src/env.d.ts +++ /dev/null @@ -1,2 +0,0 @@ -declare const SETTINGS: SettingComponentProps[] -declare const MODELS: Model[] diff --git a/extensions/inference-martian-extension/src/index.ts b/extensions/inference-martian-extension/src/index.ts deleted file mode 100644 index 8cbe4e52d..000000000 --- a/extensions/inference-martian-extension/src/index.ts +++ /dev/null @@ -1,63 +0,0 @@ -/** - * @file This file exports a class that implements the InferenceExtension interface from the @janhq/core package. - * The class provides methods for initializing and stopping a model, and for making inference requests. - * It also subscribes to events emitted by the @janhq/core package and handles new message requests. - * @version 1.0.0 - * @module inference-martian-extension/src/index - */ - -import { RemoteOAIEngine } from '@janhq/core' - -enum Settings { - apiKey = 'martian-api-key', - chatCompletionsEndPoint = 'chat-completions-endpoint', -} - -/** - * A class that implements the InferenceExtension interface from the @janhq/core package. - * The class provides methods for initializing and stopping a model, and for making inference requests. - * It also subscribes to events emitted by the @janhq/core package and handles new message requests. 
- */ -export default class JanInferenceMartianExtension extends RemoteOAIEngine { - inferenceUrl: string = '' - provider: string = 'martian' - - override async onLoad(): Promise { - super.onLoad() - - // Register Settings - this.registerSettings(SETTINGS) - this.registerModels(MODELS) - - this.apiKey = await this.getSetting(Settings.apiKey, '') - this.inferenceUrl = await this.getSetting( - Settings.chatCompletionsEndPoint, - '' - ) - if (this.inferenceUrl.length === 0) { - SETTINGS.forEach((setting) => { - if (setting.key === Settings.chatCompletionsEndPoint) { - this.inferenceUrl = setting.controllerProps.value as string - } - }) - } - } - - onSettingUpdate(key: string, value: T): void { - if (key === Settings.apiKey) { - this.apiKey = value as string - } else if (key === Settings.chatCompletionsEndPoint) { - if (typeof value !== 'string') return - - if (value.trim().length === 0) { - SETTINGS.forEach((setting) => { - if (setting.key === Settings.chatCompletionsEndPoint) { - this.inferenceUrl = setting.controllerProps.value as string - } - }) - } else { - this.inferenceUrl = value - } - } - } -} diff --git a/extensions/inference-martian-extension/tsconfig.json b/extensions/inference-martian-extension/tsconfig.json deleted file mode 100644 index 2477d58ce..000000000 --- a/extensions/inference-martian-extension/tsconfig.json +++ /dev/null @@ -1,14 +0,0 @@ -{ - "compilerOptions": { - "target": "es2016", - "module": "ES6", - "moduleResolution": "node", - "outDir": "./dist", - "esModuleInterop": true, - "forceConsistentCasingInFileNames": true, - "strict": false, - "skipLibCheck": true, - "rootDir": "./src" - }, - "include": ["./src"] -} diff --git a/extensions/inference-mistral-extension/README.md b/extensions/inference-mistral-extension/README.md deleted file mode 100644 index adb36558c..000000000 --- a/extensions/inference-mistral-extension/README.md +++ /dev/null @@ -1,79 +0,0 @@ -# Mistral Engine Extension - -Created using Jan extension example - -# Create a Jan Extension using Typescript - -Use this template to bootstrap the creation of a TypeScript Jan extension. 🚀 - -## Create Your Own Extension - -To create your own extension, you can use this repository as a template! Just follow the below instructions: - -1. Click the Use this template button at the top of the repository -2. Select Create a new repository -3. Select an owner and name for your new repository -4. Click Create repository -5. Clone your new repository - -## Initial Setup - -After you've cloned the repository to your local machine or codespace, you'll need to perform some initial setup steps before you can develop your extension. - -> [!NOTE] -> -> You'll need to have a reasonably modern version of -> [Node.js](https://nodejs.org) handy. If you are using a version manager like -> [`nodenv`](https://github.com/nodenv/nodenv) or -> [`nvm`](https://github.com/nvm-sh/nvm), you can run `nodenv install` in the -> root of your repository to install the version specified in -> [`package.json`](./package.json). Otherwise, 20.x or later should work! - -1. :hammer_and_wrench: Install the dependencies - - ```bash - npm install - ``` - -1. :building_construction: Package the TypeScript for distribution - - ```bash - npm run bundle - ``` - -1. :white_check_mark: Check your artifact - - There will be a tgz file in your extension directory now - -## Update the Extension Metadata - -The [`package.json`](package.json) file defines metadata about your extension, such as -extension name, main entry, description and version. 
-
-When you copy this repository, update `package.json` with the name, description for your extension.
-
-## Update the Extension Code
-
-The [`src/`](./src/) directory is the heart of your extension! This contains the
-source code that will be run when your extension functions are invoked. You can replace the
-contents of this directory with your own code.
-
-There are a few things to keep in mind when writing your extension code:
-
-- Most Jan Extension functions are processed asynchronously.
-  In `index.ts`, you will see that the extension function will return a `Promise`.
-
-  ```typescript
-  import { events, MessageEvent, MessageRequest } from '@janhq/core'
-
-  function onStart(): Promise<void> {
-    return events.on(MessageEvent.OnMessageSent, (data: MessageRequest) =>
-      this.inference(data)
-    )
-  }
-  ```
-
-  For more information about the Jan Extension Core module, see the
-  [documentation](https://github.com/janhq/jan/blob/main/core/README.md).
-
-So, what are you waiting for? Go ahead and start customizing your extension!
diff --git a/extensions/inference-mistral-extension/package.json b/extensions/inference-mistral-extension/package.json
deleted file mode 100644
index 504a3d613..000000000
--- a/extensions/inference-mistral-extension/package.json
+++ /dev/null
@@ -1,42 +0,0 @@
-{
-  "name": "@janhq/inference-mistral-extension",
-  "productName": "MistralAI Inference Engine",
-  "version": "1.0.1",
-  "description": "This extension enables Mistral chat completion API calls",
-  "main": "dist/index.js",
-  "module": "dist/module.js",
-  "engine": "mistral",
-  "author": "Jan ",
-  "license": "AGPL-3.0",
-  "scripts": {
-    "build": "rolldown -c rolldown.config.mjs",
-    "build:publish": "rimraf *.tgz --glob || true && yarn build && npm pack && cpx *.tgz ../../pre-install"
-  },
-  "devDependencies": {
-    "cpx": "^1.5.0",
-    "rimraf": "^3.0.2",
-    "rolldown": "1.0.0-beta.1",
-    "ts-loader": "^9.5.0",
-    "typescript": "^5.7.2"
-  },
-  "dependencies": {
-    "@janhq/core": "../../core/package.tgz",
-    "fetch-retry": "^5.0.6",
-    "ulidx": "^2.3.0"
-  },
-  "engines": {
-    "node": ">=18.0.0"
-  },
-  "files": [
-    "dist/*",
-    "package.json",
-    "README.md"
-  ],
-  "bundleDependencies": [
-    "fetch-retry"
-  ],
-  "installConfig": {
-    "hoistingLimits": "workspaces"
-  },
-  "packageManager": "yarn@4.5.3"
-}
diff --git a/extensions/inference-mistral-extension/resources/settings.json b/extensions/inference-mistral-extension/resources/settings.json
deleted file mode 100644
index 963674b02..000000000
--- a/extensions/inference-mistral-extension/resources/settings.json
+++ /dev/null
@@ -1,24 +0,0 @@
-[
-  {
-    "key": "mistral-api-key",
-    "title": "API Key",
-    "description": "The Mistral API uses API keys for authentication. Visit your [API Keys](https://console.mistral.ai/api-keys/) page to retrieve the API key you'll use in your requests.",
-    "controllerType": "input",
-    "controllerProps": {
-      "placeholder": "Insert API Key",
-      "value": "",
-      "type": "password",
-      "inputActions": ["unobscure", "copy"]
-    }
-  },
-  {
-    "key": "chat-completions-endpoint",
-    "title": "Chat Completions Endpoint",
-    "description": "The endpoint to use for chat completions. See the [Mistral API documentation](https://docs.mistral.ai/api/#operation/createChatCompletion) for more information.",
-    "controllerType": "input",
-    "controllerProps": {
-      "placeholder": "https://api.mistral.ai/v1/chat/completions",
-      "value": "https://api.mistral.ai/v1/chat/completions"
-    }
-  }
-]
diff --git a/extensions/inference-mistral-extension/rolldown.config.mjs b/extensions/inference-mistral-extension/rolldown.config.mjs
deleted file mode 100644
index 9ebaace2e..000000000
--- a/extensions/inference-mistral-extension/rolldown.config.mjs
+++ /dev/null
@@ -1,18 +0,0 @@
-import { defineConfig } from 'rolldown'
-import pkgJson from './package.json' with { type: 'json' }
-import settingJson from './resources/settings.json' with { type: 'json' }
-import modelsJson from './resources/models.json' with { type: 'json' }
-
-export default defineConfig({
-  input: 'src/index.ts',
-  output: {
-    format: 'esm',
-    file: 'dist/index.js',
-  },
-  platform: 'browser',
-  define: {
-    MODELS: JSON.stringify(modelsJson),
-    SETTINGS: JSON.stringify(settingJson),
-    ENGINE: JSON.stringify(pkgJson.engine),
-  },
-})
diff --git a/extensions/inference-mistral-extension/src/env.d.ts b/extensions/inference-mistral-extension/src/env.d.ts
deleted file mode 100644
index 40ca58094..000000000
--- a/extensions/inference-mistral-extension/src/env.d.ts
+++ /dev/null
@@ -1,2 +0,0 @@
-declare const SETTINGS: SettingComponentProps[]
-declare const MODELS: Model[]
diff --git a/extensions/inference-mistral-extension/src/index.ts b/extensions/inference-mistral-extension/src/index.ts
deleted file mode 100644
index 22b977c5a..000000000
--- a/extensions/inference-mistral-extension/src/index.ts
+++ /dev/null
@@ -1,63 +0,0 @@
-/**
- * @file This file exports a class that implements the InferenceExtension interface from the @janhq/core package.
- * The class provides methods for initializing and stopping a model, and for making inference requests.
- * It also subscribes to events emitted by the @janhq/core package and handles new message requests.
- * @version 1.0.0
- * @module inference-mistral-extension/src/index
- */
-
-import { RemoteOAIEngine } from '@janhq/core'
-
-enum Settings {
-  apiKey = 'mistral-api-key',
-  chatCompletionsEndPoint = 'chat-completions-endpoint',
-}
-/**
- * A class that implements the InferenceExtension interface from the @janhq/core package.
- * The class provides methods for initializing and stopping a model, and for making inference requests.
- * It also subscribes to events emitted by the @janhq/core package and handles new message requests.
- */
-export default class JanInferenceMistralExtension extends RemoteOAIEngine {
-  inferenceUrl: string = ''
-  provider: string = 'mistral'
-
-  override async onLoad(): Promise<void> {
-    super.onLoad()
-
-    // Register Settings
-    this.registerSettings(SETTINGS)
-    this.registerModels(MODELS)
-
-    this.apiKey = await this.getSetting(Settings.apiKey, '')
-    this.inferenceUrl = await this.getSetting(
-      Settings.chatCompletionsEndPoint,
-      ''
-    )
-
-    if (this.inferenceUrl.length === 0) {
-      SETTINGS.forEach((setting) => {
-        if (setting.key === Settings.chatCompletionsEndPoint) {
-          this.inferenceUrl = setting.controllerProps.value as string
-        }
-      })
-    }
-  }
-
-  onSettingUpdate<T>(key: string, value: T): void {
-    if (key === Settings.apiKey) {
-      this.apiKey = value as string
-    } else if (key === Settings.chatCompletionsEndPoint) {
-      if (typeof value !== 'string') return
-
-      if (value.trim().length === 0) {
-        SETTINGS.forEach((setting) => {
-          if (setting.key === Settings.chatCompletionsEndPoint) {
-            this.inferenceUrl = setting.controllerProps.value as string
-          }
-        })
-      } else {
-        this.inferenceUrl = value
-      }
-    }
-  }
-}
diff --git a/extensions/inference-mistral-extension/tsconfig.json b/extensions/inference-mistral-extension/tsconfig.json
deleted file mode 100644
index 2477d58ce..000000000
--- a/extensions/inference-mistral-extension/tsconfig.json
+++ /dev/null
@@ -1,14 +0,0 @@
-{
-  "compilerOptions": {
-    "target": "es2016",
-    "module": "ES6",
-    "moduleResolution": "node",
-    "outDir": "./dist",
-    "esModuleInterop": true,
-    "forceConsistentCasingInFileNames": true,
-    "strict": false,
-    "skipLibCheck": true,
-    "rootDir": "./src"
-  },
-  "include": ["./src"]
-}
diff --git a/extensions/inference-nvidia-extension/README.md b/extensions/inference-nvidia-extension/README.md
deleted file mode 100644
index 65a1b2b59..000000000
--- a/extensions/inference-nvidia-extension/README.md
+++ /dev/null
@@ -1,79 +0,0 @@
-# Nvidia Engine Extension
-
-Created using Jan extension example
-
-# Create a Jan Extension using Typescript
-
-Use this template to bootstrap the creation of a TypeScript Jan extension. 🚀
-
-## Create Your Own Extension
-
-To create your own extension, you can use this repository as a template! Just follow the below instructions:
-
-1. Click the Use this template button at the top of the repository
-2. Select Create a new repository
-3. Select an owner and name for your new repository
-4. Click Create repository
-5. Clone your new repository
-
-## Initial Setup
-
-After you've cloned the repository to your local machine or codespace, you'll need to perform some initial setup steps before you can develop your extension.
-
-> [!NOTE]
->
-> You'll need to have a reasonably modern version of
-> [Node.js](https://nodejs.org) handy. If you are using a version manager like
-> [`nodenv`](https://github.com/nodenv/nodenv) or
-> [`nvm`](https://github.com/nvm-sh/nvm), you can run `nodenv install` in the
-> root of your repository to install the version specified in
-> [`package.json`](./package.json). Otherwise, 20.x or later should work!
-
-1. :hammer_and_wrench: Install the dependencies
-
-   ```bash
-   npm install
-   ```
-
-1. :building_construction: Package the TypeScript for distribution
-
-   ```bash
-   npm run bundle
-   ```
-
-1. :white_check_mark: Check your artifact
-
-   There will be a tgz file in your extension directory now
-
-## Update the Extension Metadata
-
-The [`package.json`](package.json) file defines metadata about your extension, such as
-extension name, main entry, description and version.
-
-When you copy this repository, update `package.json` with the name, description for your extension.
-
-## Update the Extension Code
-
-The [`src/`](./src/) directory is the heart of your extension! This contains the
-source code that will be run when your extension functions are invoked. You can replace the
-contents of this directory with your own code.
-
-There are a few things to keep in mind when writing your extension code:
-
-- Most Jan Extension functions are processed asynchronously.
-  In `index.ts`, you will see that the extension function will return a `Promise`.
-
-  ```typescript
-  import { events, MessageEvent, MessageRequest } from '@janhq/core'
-
-  function onStart(): Promise<void> {
-    return events.on(MessageEvent.OnMessageSent, (data: MessageRequest) =>
-      this.inference(data)
-    )
-  }
-  ```
-
-  For more information about the Jan Extension Core module, see the
-  [documentation](https://github.com/janhq/jan/blob/main/core/README.md).
-
-So, what are you waiting for? Go ahead and start customizing your extension!
diff --git a/extensions/inference-nvidia-extension/package.json b/extensions/inference-nvidia-extension/package.json
deleted file mode 100644
index 771ccec4f..000000000
--- a/extensions/inference-nvidia-extension/package.json
+++ /dev/null
@@ -1,42 +0,0 @@
-{
-  "name": "@janhq/inference-nvidia-extension",
-  "productName": "NVIDIA NIM Inference Engine",
-  "version": "1.0.1",
-  "description": "This extension enables NVIDIA chat completion API calls",
-  "main": "dist/index.js",
-  "module": "dist/module.js",
-  "engine": "nvidia",
-  "author": "Jan ",
-  "license": "AGPL-3.0",
-  "scripts": {
-    "build": "rolldown -c rolldown.config.mjs",
-    "build:publish": "rimraf *.tgz --glob || true && yarn build && npm pack && cpx *.tgz ../../pre-install"
-  },
-  "devDependencies": {
-    "cpx": "^1.5.0",
-    "rimraf": "^3.0.2",
-    "rolldown": "1.0.0-beta.1",
-    "ts-loader": "^9.5.0",
-    "typescript": "^5.7.2"
-  },
-  "dependencies": {
-    "@janhq/core": "../../core/package.tgz",
-    "fetch-retry": "^5.0.6",
-    "ulidx": "^2.3.0"
-  },
-  "engines": {
-    "node": ">=18.0.0"
-  },
-  "files": [
-    "dist/*",
-    "package.json",
-    "README.md"
-  ],
-  "bundleDependencies": [
-    "fetch-retry"
-  ],
-  "installConfig": {
-    "hoistingLimits": "workspaces"
-  },
-  "packageManager": "yarn@4.5.3"
-}
diff --git a/extensions/inference-nvidia-extension/resources/settings.json b/extensions/inference-nvidia-extension/resources/settings.json
deleted file mode 100644
index 6b2652653..000000000
--- a/extensions/inference-nvidia-extension/resources/settings.json
+++ /dev/null
@@ -1,24 +0,0 @@
-[
-  {
-    "key": "nvidia-api-key",
-    "title": "API Key",
-    "description": "The NVIDIA API uses API keys for authentication. Visit your [API Keys](https://org.ngc.nvidia.com/setup/personal-keys) page to retrieve the API key you'll use in your requests.",
-    "controllerType": "input",
-    "controllerProps": {
-      "placeholder": "Insert API Key",
-      "value": "",
-      "type": "password",
-      "inputActions": ["unobscure", "copy"]
-    }
-  },
-  {
-    "key": "chat-completions-endpoint",
-    "title": "Chat Completions Endpoint",
-    "description": "The endpoint to use for chat completions. See the [NVIDIA API documentation](https://www.nvidia.com/en-us/ai/) for more information.",
-    "controllerType": "input",
-    "controllerProps": {
-      "placeholder": "https://integrate.api.nvidia.com/v1/chat/completions",
-      "value": "https://integrate.api.nvidia.com/v1/chat/completions"
-    }
-  }
-]
diff --git a/extensions/inference-nvidia-extension/rolldown.config.mjs b/extensions/inference-nvidia-extension/rolldown.config.mjs
deleted file mode 100644
index 9ebaace2e..000000000
--- a/extensions/inference-nvidia-extension/rolldown.config.mjs
+++ /dev/null
@@ -1,18 +0,0 @@
-import { defineConfig } from 'rolldown'
-import pkgJson from './package.json' with { type: 'json' }
-import settingJson from './resources/settings.json' with { type: 'json' }
-import modelsJson from './resources/models.json' with { type: 'json' }
-
-export default defineConfig({
-  input: 'src/index.ts',
-  output: {
-    format: 'esm',
-    file: 'dist/index.js',
-  },
-  platform: 'browser',
-  define: {
-    MODELS: JSON.stringify(modelsJson),
-    SETTINGS: JSON.stringify(settingJson),
-    ENGINE: JSON.stringify(pkgJson.engine),
-  },
-})
diff --git a/extensions/inference-nvidia-extension/src/env.d.ts b/extensions/inference-nvidia-extension/src/env.d.ts
deleted file mode 100644
index 40ca58094..000000000
--- a/extensions/inference-nvidia-extension/src/env.d.ts
+++ /dev/null
@@ -1,2 +0,0 @@
-declare const SETTINGS: SettingComponentProps[]
-declare const MODELS: Model[]
diff --git a/extensions/inference-nvidia-extension/src/index.ts b/extensions/inference-nvidia-extension/src/index.ts
deleted file mode 100644
index 0e5bb8135..000000000
--- a/extensions/inference-nvidia-extension/src/index.ts
+++ /dev/null
@@ -1,63 +0,0 @@
-/**
- * @file This file exports a class that implements the InferenceExtension interface from the @janhq/core package.
- * The class provides methods for initializing and stopping a model, and for making inference requests.
- * It also subscribes to events emitted by the @janhq/core package and handles new message requests.
- * @version 1.0.0
- * @module inference-nvidia-extension/src/index
- */
-
-import { RemoteOAIEngine } from '@janhq/core'
-
-enum Settings {
-  apiKey = 'nvidia-api-key',
-  chatCompletionsEndPoint = 'chat-completions-endpoint',
-}
-/**
- * A class that implements the InferenceExtension interface from the @janhq/core package.
- * The class provides methods for initializing and stopping a model, and for making inference requests.
- * It also subscribes to events emitted by the @janhq/core package and handles new message requests.
- */
-export default class JanNVIDIANIMInferenceEngine extends RemoteOAIEngine {
-  inferenceUrl: string = ''
-  provider: string = 'nvidia'
-
-  override async onLoad(): Promise<void> {
-    super.onLoad()
-
-    // Register Settings
-    this.registerSettings(SETTINGS)
-    this.registerModels(MODELS)
-
-    this.apiKey = await this.getSetting(Settings.apiKey, '')
-    this.inferenceUrl = await this.getSetting(
-      Settings.chatCompletionsEndPoint,
-      ''
-    )
-
-    if (this.inferenceUrl.length === 0) {
-      SETTINGS.forEach((setting) => {
-        if (setting.key === Settings.chatCompletionsEndPoint) {
-          this.inferenceUrl = setting.controllerProps.value as string
-        }
-      })
-    }
-  }
-
-  onSettingUpdate<T>(key: string, value: T): void {
-    if (key === Settings.apiKey) {
-      this.apiKey = value as string
-    } else if (key === Settings.chatCompletionsEndPoint) {
-      if (typeof value !== 'string') return
-
-      if (value.trim().length === 0) {
-        SETTINGS.forEach((setting) => {
-          if (setting.key === Settings.chatCompletionsEndPoint) {
-            this.inferenceUrl = setting.controllerProps.value as string
-          }
-        })
-      } else {
-        this.inferenceUrl = value
-      }
-    }
-  }
-}
diff --git a/extensions/inference-nvidia-extension/tsconfig.json b/extensions/inference-nvidia-extension/tsconfig.json
deleted file mode 100644
index 2477d58ce..000000000
--- a/extensions/inference-nvidia-extension/tsconfig.json
+++ /dev/null
@@ -1,14 +0,0 @@
-{
-  "compilerOptions": {
-    "target": "es2016",
-    "module": "ES6",
-    "moduleResolution": "node",
-    "outDir": "./dist",
-    "esModuleInterop": true,
-    "forceConsistentCasingInFileNames": true,
-    "strict": false,
-    "skipLibCheck": true,
-    "rootDir": "./src"
-  },
-  "include": ["./src"]
-}
diff --git a/extensions/inference-openai-extension/README.md b/extensions/inference-openai-extension/README.md
deleted file mode 100644
index c716c725c..000000000
--- a/extensions/inference-openai-extension/README.md
+++ /dev/null
@@ -1,79 +0,0 @@
-# OpenAI Engine Extension
-
-Created using Jan extension example
-
-# Create a Jan Extension using Typescript
-
-Use this template to bootstrap the creation of a TypeScript Jan extension. 🚀
-
-## Create Your Own Extension
-
-To create your own extension, you can use this repository as a template! Just follow the below instructions:
-
-1. Click the Use this template button at the top of the repository
-2. Select Create a new repository
-3. Select an owner and name for your new repository
-4. Click Create repository
-5. Clone your new repository
-
-## Initial Setup
-
-After you've cloned the repository to your local machine or codespace, you'll need to perform some initial setup steps before you can develop your extension.
-
-> [!NOTE]
->
-> You'll need to have a reasonably modern version of
-> [Node.js](https://nodejs.org) handy. If you are using a version manager like
-> [`nodenv`](https://github.com/nodenv/nodenv) or
-> [`nvm`](https://github.com/nvm-sh/nvm), you can run `nodenv install` in the
-> root of your repository to install the version specified in
-> [`package.json`](./package.json). Otherwise, 20.x or later should work!
-
-1. :hammer_and_wrench: Install the dependencies
-
-   ```bash
-   npm install
-   ```
-
-1. :building_construction: Package the TypeScript for distribution
-
-   ```bash
-   npm run bundle
-   ```
-
-1. :white_check_mark: Check your artifact
-
-   There will be a tgz file in your extension directory now
-
-## Update the Extension Metadata
-
-The [`package.json`](package.json) file defines metadata about your extension, such as
-extension name, main entry, description and version.
-
-When you copy this repository, update `package.json` with the name, description for your extension.
-
-## Update the Extension Code
-
-The [`src/`](./src/) directory is the heart of your extension! This contains the
-source code that will be run when your extension functions are invoked. You can replace the
-contents of this directory with your own code.
-
-There are a few things to keep in mind when writing your extension code:
-
-- Most Jan Extension functions are processed asynchronously.
-  In `index.ts`, you will see that the extension function will return a `Promise`.
-
-  ```typescript
-  import { events, MessageEvent, MessageRequest } from '@janhq/core'
-
-  function onStart(): Promise<void> {
-    return events.on(MessageEvent.OnMessageSent, (data: MessageRequest) =>
-      this.inference(data)
-    )
-  }
-  ```
-
-  For more information about the Jan Extension Core module, see the
-  [documentation](https://github.com/janhq/jan/blob/main/core/README.md).
-
-So, what are you waiting for? Go ahead and start customizing your extension!
diff --git a/extensions/inference-openai-extension/jest.config.js b/extensions/inference-openai-extension/jest.config.js
deleted file mode 100644
index 3e32adceb..000000000
--- a/extensions/inference-openai-extension/jest.config.js
+++ /dev/null
@@ -1,9 +0,0 @@
-/** @type {import('ts-jest').JestConfigWithTsJest} */
-module.exports = {
-  preset: 'ts-jest',
-  testEnvironment: 'node',
-  transform: {
-    'node_modules/@janhq/core/.+\\.(j|t)s?$': 'ts-jest',
-  },
-  transformIgnorePatterns: ['node_modules/(?!@janhq/core/.*)'],
-}
diff --git a/extensions/inference-openai-extension/package.json b/extensions/inference-openai-extension/package.json
deleted file mode 100644
index f790b60ca..000000000
--- a/extensions/inference-openai-extension/package.json
+++ /dev/null
@@ -1,42 +0,0 @@
-{
-  "name": "@janhq/inference-openai-extension",
-  "productName": "OpenAI Inference Engine",
-  "version": "1.0.5",
-  "description": "This extension enables OpenAI chat completion API calls",
-  "main": "dist/index.js",
-  "module": "dist/module.js",
-  "engine": "openai",
-  "author": "Jan ",
-  "license": "AGPL-3.0",
-  "scripts": {
-    "build": "rolldown -c rolldown.config.mjs",
-    "build:publish": "rimraf *.tgz --glob || true && yarn build && npm pack && cpx *.tgz ../../pre-install"
-  },
-  "devDependencies": {
-    "cpx": "^1.5.0",
-    "rimraf": "^3.0.2",
-    "rolldown": "1.0.0-beta.1",
-    "ts-loader": "^9.5.0",
-    "typescript": "^5.7.2"
-  },
-  "dependencies": {
-    "@janhq/core": "../../core/package.tgz",
-    "fetch-retry": "^5.0.6",
-    "ulidx": "^2.3.0"
-  },
-  "engines": {
-    "node": ">=18.0.0"
-  },
-  "files": [
-    "dist/*",
-    "package.json",
-    "README.md"
-  ],
-  "bundleDependencies": [
-    "fetch-retry"
-  ],
-  "installConfig": {
-    "hoistingLimits": "workspaces"
-  },
-  "packageManager": "yarn@4.5.3"
-}
diff --git a/extensions/inference-openai-extension/resources/settings.json b/extensions/inference-openai-extension/resources/settings.json
deleted file mode 100644
index db2e80c9b..000000000
--- a/extensions/inference-openai-extension/resources/settings.json
+++ /dev/null
@@ -1,24 +0,0 @@
-[
-  {
-    "key": "openai-api-key",
-    "title": "API Key",
-    "description": "The OpenAI API uses API keys for authentication. Visit your [API Keys](https://platform.openai.com/account/api-keys) page to retrieve the API key you'll use in your requests.",
-    "controllerType": "input",
-    "controllerProps": {
-      "placeholder": "Insert API Key",
-      "value": "",
-      "type": "password",
-      "inputActions": ["unobscure", "copy"]
-    }
-  },
-  {
-    "key": "chat-completions-endpoint",
-    "title": "Chat Completions Endpoint",
-    "description": "The endpoint to use for chat completions. See the [OpenAI API documentation](https://platform.openai.com/docs/api-reference/chat/create) for more information.",
-    "controllerType": "input",
-    "controllerProps": {
-      "placeholder": "https://api.openai.com/v1/chat/completions",
-      "value": "https://api.openai.com/v1/chat/completions"
-    }
-  }
-]
diff --git a/extensions/inference-openai-extension/rolldown.config.mjs b/extensions/inference-openai-extension/rolldown.config.mjs
deleted file mode 100644
index 9ebaace2e..000000000
--- a/extensions/inference-openai-extension/rolldown.config.mjs
+++ /dev/null
@@ -1,18 +0,0 @@
-import { defineConfig } from 'rolldown'
-import pkgJson from './package.json' with { type: 'json' }
-import settingJson from './resources/settings.json' with { type: 'json' }
-import modelsJson from './resources/models.json' with { type: 'json' }
-
-export default defineConfig({
-  input: 'src/index.ts',
-  output: {
-    format: 'esm',
-    file: 'dist/index.js',
-  },
-  platform: 'browser',
-  define: {
-    MODELS: JSON.stringify(modelsJson),
-    SETTINGS: JSON.stringify(settingJson),
-    ENGINE: JSON.stringify(pkgJson.engine),
-  },
-})
diff --git a/extensions/inference-openai-extension/src/OpenAIExtension.test.ts b/extensions/inference-openai-extension/src/OpenAIExtension.test.ts
deleted file mode 100644
index 4d46bc007..000000000
--- a/extensions/inference-openai-extension/src/OpenAIExtension.test.ts
+++ /dev/null
@@ -1,54 +0,0 @@
-/**
- * @jest-environment jsdom
- */
-jest.mock('@janhq/core', () => ({
-  ...jest.requireActual('@janhq/core/node'),
-  RemoteOAIEngine: jest.fn().mockImplementation(() => ({
-    onLoad: jest.fn(),
-    registerSettings: jest.fn(),
-    registerModels: jest.fn(),
-    getSetting: jest.fn(),
-    onSettingUpdate: jest.fn(),
-  })),
-}))
-import JanInferenceOpenAIExtension, { Settings } from '.'
-
-describe('JanInferenceOpenAIExtension', () => {
-  let extension: JanInferenceOpenAIExtension
-
-  beforeEach(() => {
-    // @ts-ignore
-    extension = new JanInferenceOpenAIExtension()
-  })
-
-  it('should initialize with settings and models', async () => {
-    await extension.onLoad()
-    // Assuming there are some default SETTINGS and MODELS being registered
-    expect(extension.apiKey).toBe(undefined)
-    expect(extension.inferenceUrl).toBe('')
-  })
-
-  it('should transform the payload for preview models', () => {
-    const payload: any = {
-      max_tokens: 100,
-      model: 'o1-mini',
-      // Add other required properties...
-    }
-
-    const transformedPayload = extension.transformPayload(payload)
-    expect(transformedPayload.max_completion_tokens).toBe(payload.max_tokens)
-    expect(transformedPayload).not.toHaveProperty('max_tokens')
-    expect(transformedPayload).toHaveProperty('max_completion_tokens')
-  })
-
-  it('should not transform the payload for non-preview models', () => {
-    const payload: any = {
-      max_tokens: 100,
-      model: 'non-preview-model',
-      // Add other required properties...
-    }
-
-    const transformedPayload = extension.transformPayload(payload)
-    expect(transformedPayload).toEqual(payload)
-  })
-})
diff --git a/extensions/inference-openai-extension/src/env.d.ts b/extensions/inference-openai-extension/src/env.d.ts
deleted file mode 100644
index 40ca58094..000000000
--- a/extensions/inference-openai-extension/src/env.d.ts
+++ /dev/null
@@ -1,2 +0,0 @@
-declare const SETTINGS: SettingComponentProps[]
-declare const MODELS: Model[]
diff --git a/extensions/inference-openai-extension/src/index.ts b/extensions/inference-openai-extension/src/index.ts
deleted file mode 100644
index 0996c6bef..000000000
--- a/extensions/inference-openai-extension/src/index.ts
+++ /dev/null
@@ -1,90 +0,0 @@
-/**
- * @file This file exports a class that implements the InferenceExtension interface from the @janhq/core package.
- * The class provides methods for initializing and stopping a model, and for making inference requests.
- * It also subscribes to events emitted by the @janhq/core package and handles new message requests.
- * @version 1.0.0
- * @module inference-openai-extension/src/index
- */
-
-import { ModelRuntimeParams, PayloadType, RemoteOAIEngine } from '@janhq/core'
-
-export enum Settings {
-  apiKey = 'openai-api-key',
-  chatCompletionsEndPoint = 'chat-completions-endpoint',
-}
-type OpenAIPayloadType = PayloadType &
-  ModelRuntimeParams & { max_completion_tokens: number }
-/**
- * A class that implements the InferenceExtension interface from the @janhq/core package.
- * The class provides methods for initializing and stopping a model, and for making inference requests.
- * It also subscribes to events emitted by the @janhq/core package and handles new message requests.
- */
-export default class JanInferenceOpenAIExtension extends RemoteOAIEngine {
-  inferenceUrl: string = ''
-  provider: string = 'openai'
-  previewModels = ['o1-mini', 'o1-preview']
-
-  override async onLoad(): Promise<void> {
-    super.onLoad()
-
-    // Register Settings
-    this.registerSettings(SETTINGS)
-    this.registerModels(MODELS)
-
-    this.apiKey = await this.getSetting(Settings.apiKey, '')
-    this.inferenceUrl = await this.getSetting(
-      Settings.chatCompletionsEndPoint,
-      ''
-    )
-    if (this.inferenceUrl.length === 0) {
-      SETTINGS.forEach((setting) => {
-        if (setting.key === Settings.chatCompletionsEndPoint) {
-          this.inferenceUrl = setting.controllerProps.value as string
-        }
-      })
-    }
-  }
-
-  onSettingUpdate<T>(key: string, value: T): void {
-    if (key === Settings.apiKey) {
-      this.apiKey = value as string
-    } else if (key === Settings.chatCompletionsEndPoint) {
-      if (typeof value !== 'string') return
-
-      if (value.trim().length === 0) {
-        SETTINGS.forEach((setting) => {
-          if (setting.key === Settings.chatCompletionsEndPoint) {
-            this.inferenceUrl = setting.controllerProps.value as string
-          }
-        })
-      } else {
-        this.inferenceUrl = value
-      }
-    }
-  }
-
-  /**
-   * Transform the payload before sending it to the inference endpoint.
-   * The new preview models such as o1-mini and o1-preview replaced the max_tokens parameter with max_completion_tokens.
-   * Other models do not.
-   * @param payload
-   * @returns
-   */
-  transformPayload = (payload: OpenAIPayloadType): OpenAIPayloadType => {
-    // Remove empty stop words
-    if (payload.stop?.length === 0) {
-      const { stop, ...params } = payload
-      payload = params
-    }
-    // Transform the payload for preview models
-    if (this.previewModels.includes(payload.model)) {
-      const { max_tokens, stop, ...params } = payload
-      return {
-        ...params,
-        max_completion_tokens: max_tokens,
-      }
-    }
-    // Pass through for non-preview models
-    return payload
-  }
-}
diff --git a/extensions/inference-openai-extension/tsconfig.json b/extensions/inference-openai-extension/tsconfig.json
deleted file mode 100644
index 6db951c9e..000000000
--- a/extensions/inference-openai-extension/tsconfig.json
+++ /dev/null
@@ -1,15 +0,0 @@
-{
-  "compilerOptions": {
-    "target": "es2016",
-    "module": "ES6",
-    "moduleResolution": "node",
-    "outDir": "./dist",
-    "esModuleInterop": true,
-    "forceConsistentCasingInFileNames": true,
-    "strict": false,
-    "skipLibCheck": true,
-    "rootDir": "./src"
-  },
-  "include": ["./src"],
-  "exclude": ["**/*.test.ts"]
-}
diff --git a/extensions/inference-openrouter-extension/README.md b/extensions/inference-openrouter-extension/README.md
deleted file mode 100644
index aab10755d..000000000
--- a/extensions/inference-openrouter-extension/README.md
+++ /dev/null
@@ -1,79 +0,0 @@
-# Open Router Engine Extension
-
-Created using Jan extension example
-
-# Create a Jan Extension using Typescript
-
-Use this template to bootstrap the creation of a TypeScript Jan extension. 🚀
-
-## Create Your Own Extension
-
-To create your own extension, you can use this repository as a template! Just follow the below instructions:
-
-1. Click the Use this template button at the top of the repository
-2. Select Create a new repository
-3. Select an owner and name for your new repository
-4. Click Create repository
-5. Clone your new repository
-
-## Initial Setup
-
-After you've cloned the repository to your local machine or codespace, you'll need to perform some initial setup steps before you can develop your extension.
-
-> [!NOTE]
->
-> You'll need to have a reasonably modern version of
-> [Node.js](https://nodejs.org) handy. If you are using a version manager like
-> [`nodenv`](https://github.com/nodenv/nodenv) or
-> [`nvm`](https://github.com/nvm-sh/nvm), you can run `nodenv install` in the
-> root of your repository to install the version specified in
-> [`package.json`](./package.json). Otherwise, 20.x or later should work!
-
-1. :hammer_and_wrench: Install the dependencies
-
-   ```bash
-   npm install
-   ```
-
-1. :building_construction: Package the TypeScript for distribution
-
-   ```bash
-   npm run bundle
-   ```
-
-1. :white_check_mark: Check your artifact
-
-   There will be a tgz file in your extension directory now
-
-## Update the Extension Metadata
-
-The [`package.json`](package.json) file defines metadata about your extension, such as
-extension name, main entry, description and version.
-
-When you copy this repository, update `package.json` with the name, description for your extension.
-
-## Update the Extension Code
-
-The [`src/`](./src/) directory is the heart of your extension! This contains the
-source code that will be run when your extension functions are invoked. You can replace the
-contents of this directory with your own code.
-
-There are a few things to keep in mind when writing your extension code:
-
-- Most Jan Extension functions are processed asynchronously.
-  In `index.ts`, you will see that the extension function will return a `Promise`.
-
-  ```typescript
-  import { events, MessageEvent, MessageRequest } from '@janhq/core'
-
-  function onStart(): Promise<void> {
-    return events.on(MessageEvent.OnMessageSent, (data: MessageRequest) =>
-      this.inference(data)
-    )
-  }
-  ```
-
-  For more information about the Jan Extension Core module, see the
-  [documentation](https://github.com/janhq/jan/blob/main/core/README.md).
-
-So, what are you waiting for? Go ahead and start customizing your extension!
diff --git a/extensions/inference-openrouter-extension/package.json b/extensions/inference-openrouter-extension/package.json
deleted file mode 100644
index fd53ad0f5..000000000
--- a/extensions/inference-openrouter-extension/package.json
+++ /dev/null
@@ -1,42 +0,0 @@
-{
-  "name": "@janhq/inference-openrouter-extension",
-  "productName": "OpenRouter Inference Engine",
-  "version": "1.0.0",
-  "description": "This extension enables Open Router chat completion API calls",
-  "main": "dist/index.js",
-  "module": "dist/module.js",
-  "engine": "openrouter",
-  "author": "Jan ",
-  "license": "AGPL-3.0",
-  "scripts": {
-    "build": "rolldown -c rolldown.config.mjs",
-    "build:publish": "rimraf *.tgz --glob || true && yarn build && npm pack && cpx *.tgz ../../pre-install"
-  },
-  "devDependencies": {
-    "cpx": "^1.5.0",
-    "rimraf": "^3.0.2",
-    "rolldown": "1.0.0-beta.1",
-    "ts-loader": "^9.5.0",
-    "typescript": "^5.7.2"
-  },
-  "dependencies": {
-    "@janhq/core": "../../core/package.tgz",
-    "fetch-retry": "^5.0.6",
-    "ulidx": "^2.3.0"
-  },
-  "engines": {
-    "node": ">=18.0.0"
-  },
-  "files": [
-    "dist/*",
-    "package.json",
-    "README.md"
-  ],
-  "bundleDependencies": [
-    "fetch-retry"
-  ],
-  "installConfig": {
-    "hoistingLimits": "workspaces"
-  },
-  "packageManager": "yarn@4.5.3"
-}
diff --git a/extensions/inference-openrouter-extension/resources/settings.json b/extensions/inference-openrouter-extension/resources/settings.json
deleted file mode 100644
index 189aee0a0..000000000
--- a/extensions/inference-openrouter-extension/resources/settings.json
+++ /dev/null
@@ -1,34 +0,0 @@
-[
-  {
-    "key": "openrouter-api-key",
-    "title": "API Key",
-    "description": "The OpenRouter API uses API keys for authentication. Visit your [API Keys](https://openrouter.ai/keys) page to retrieve the API key you'll use in your requests.",
-    "controllerType": "input",
-    "controllerProps": {
-      "placeholder": "Insert API Key",
-      "value": "",
-      "type": "password",
-      "inputActions": ["unobscure", "copy"]
-    }
-  },
-  {
-    "key": "chat-completions-endpoint",
-    "title": "Chat Completions Endpoint",
-    "description": "The endpoint to use for chat completions. See the [OpenRouter API documentation](https://openrouter.ai/docs/requests) for more information.",
-    "controllerType": "input",
-    "controllerProps": {
-      "placeholder": "https://openrouter.ai/api/v1/chat/completions",
-      "value": "https://openrouter.ai/api/v1/chat/completions"
-    }
-  },
-  {
-    "key": "openrouter-model",
-    "title": "Model",
-    "description": "If the model parameter is omitted, the user or payer's default is used. Otherwise, remember to select a value for model from the [supported models](https://openrouter.ai/docs/models) or API, and include the organization prefix.",
-    "controllerType": "input",
-    "controllerProps": {
-      "placeholder": "Leave empty for default model",
-      "value": ""
-    }
-  }
-]
diff --git a/extensions/inference-openrouter-extension/rolldown.config.mjs b/extensions/inference-openrouter-extension/rolldown.config.mjs
deleted file mode 100644
index 9ebaace2e..000000000
--- a/extensions/inference-openrouter-extension/rolldown.config.mjs
+++ /dev/null
@@ -1,18 +0,0 @@
-import { defineConfig } from 'rolldown'
-import pkgJson from './package.json' with { type: 'json' }
-import settingJson from './resources/settings.json' with { type: 'json' }
-import modelsJson from './resources/models.json' with { type: 'json' }
-
-export default defineConfig({
-  input: 'src/index.ts',
-  output: {
-    format: 'esm',
-    file: 'dist/index.js',
-  },
-  platform: 'browser',
-  define: {
-    MODELS: JSON.stringify(modelsJson),
-    SETTINGS: JSON.stringify(settingJson),
-    ENGINE: JSON.stringify(pkgJson.engine),
-  },
-})
diff --git a/extensions/inference-openrouter-extension/src/env.d.ts b/extensions/inference-openrouter-extension/src/env.d.ts
deleted file mode 100644
index 40ca58094..000000000
--- a/extensions/inference-openrouter-extension/src/env.d.ts
+++ /dev/null
@@ -1,2 +0,0 @@
-declare const SETTINGS: SettingComponentProps[]
-declare const MODELS: Model[]
diff --git a/extensions/inference-openrouter-extension/src/index.ts b/extensions/inference-openrouter-extension/src/index.ts
deleted file mode 100644
index a34c4c38b..000000000
--- a/extensions/inference-openrouter-extension/src/index.ts
+++ /dev/null
@@ -1,85 +0,0 @@
-/**
- * @file This file exports a class that implements the InferenceExtension interface from the @janhq/core package.
- * The class provides methods for initializing and stopping a model, and for making inference requests.
- * It also subscribes to events emitted by the @janhq/core package and handles new message requests.
- * @version 1.0.0
- * @module inference-openrouter-extension/src/index
- */
-
-import { RemoteOAIEngine } from '@janhq/core'
-import { PayloadType } from '@janhq/core'
-
-enum Settings {
-  apiKey = 'openrouter-api-key',
-  model = 'openrouter-model',
-  chatCompletionsEndPoint = 'chat-completions-endpoint',
-}
-
-/**
- * A class that implements the InferenceExtension interface from the @janhq/core package.
- * The class provides methods for initializing and stopping a model, and for making inference requests.
- * It also subscribes to events emitted by the @janhq/core package and handles new message requests.
- */
-export default class JanInferenceOpenRouterExtension extends RemoteOAIEngine {
-  inferenceUrl: string = ''
-  provider: string = 'openrouter'
-  model?: string | undefined
-
-  override async onLoad(): Promise<void> {
-    super.onLoad()
-
-    // Register Settings
-    this.registerSettings(SETTINGS)
-    this.registerModels(MODELS)
-
-    this.apiKey = await this.getSetting(Settings.apiKey, '')
-    this.inferenceUrl = await this.getSetting(
-      Settings.chatCompletionsEndPoint,
-      ''
-    )
-    this.model = await this.getSetting(Settings.model, '')
-    // Openrouter uses default model on no model param set
-    if (!this.model?.length) this.model = undefined
-    if (this.inferenceUrl.length === 0) {
-      SETTINGS.forEach((setting) => {
-        if (setting.key === Settings.chatCompletionsEndPoint) {
-          this.inferenceUrl = setting.controllerProps.value as string
-        }
-      })
-    }
-  }
-
-  override async headers(): Promise<HeadersInit> {
-    return {
-      'Content-Type': 'application/json',
-      'HTTP-Referer': 'https://jan.ai',
-      'Authorization': `Bearer ${this.apiKey}`,
-    }
-  }
-
-  onSettingUpdate<T>(key: string, value: T): void {
-    if (key === Settings.apiKey) {
-      this.apiKey = value as string
-    } else if (key === Settings.chatCompletionsEndPoint) {
-      if (typeof value !== 'string') return
-
-      if (value.trim().length === 0) {
-        SETTINGS.forEach((setting) => {
-          if (setting.key === Settings.chatCompletionsEndPoint) {
-            this.inferenceUrl = setting.controllerProps.value as string
-          }
-        })
-      } else {
-        this.inferenceUrl = value
-      }
-    } else if (key === Settings.model) {
-      this.model =
-        typeof value === 'string' && value.length > 0 ? value : undefined
-    }
-  }
-
-  transformPayload = (payload: PayloadType) => ({
-    ...payload,
-    model: payload.model !== 'open-router-auto' ? payload.model : this.model,
-  })
-}
diff --git a/extensions/inference-openrouter-extension/tsconfig.json b/extensions/inference-openrouter-extension/tsconfig.json
deleted file mode 100644
index 2477d58ce..000000000
--- a/extensions/inference-openrouter-extension/tsconfig.json
+++ /dev/null
@@ -1,14 +0,0 @@
-{
-  "compilerOptions": {
-    "target": "es2016",
-    "module": "ES6",
-    "moduleResolution": "node",
-    "outDir": "./dist",
-    "esModuleInterop": true,
-    "forceConsistentCasingInFileNames": true,
-    "strict": false,
-    "skipLibCheck": true,
-    "rootDir": "./src"
-  },
-  "include": ["./src"]
-}
diff --git a/extensions/inference-triton-trtllm-extension/README.md b/extensions/inference-triton-trtllm-extension/README.md
deleted file mode 100644
index f9690da09..000000000
--- a/extensions/inference-triton-trtllm-extension/README.md
+++ /dev/null
@@ -1,75 +0,0 @@
-# Create a Jan Extension using Typescript
-
-Use this template to bootstrap the creation of a TypeScript Jan extension. 🚀
-
-## Create Your Own Extension
-
-To create your own extension, you can use this repository as a template! Just follow the below instructions:
-
-1. Click the Use this template button at the top of the repository
-2. Select Create a new repository
-3. Select an owner and name for your new repository
-4. Click Create repository
-5. Clone your new repository
-
-## Initial Setup
-
-After you've cloned the repository to your local machine or codespace, you'll need to perform some initial setup steps before you can develop your extension.
-
-> [!NOTE]
->
-> You'll need to have a reasonably modern version of
-> [Node.js](https://nodejs.org) handy. If you are using a version manager like
-> [`nodenv`](https://github.com/nodenv/nodenv) or
-> [`nvm`](https://github.com/nvm-sh/nvm), you can run `nodenv install` in the
-> root of your repository to install the version specified in
-> [`package.json`](./package.json). Otherwise, 20.x or later should work!
-
-1. :hammer_and_wrench: Install the dependencies
-
-   ```bash
-   npm install
-   ```
-
-1. :building_construction: Package the TypeScript for distribution
-
-   ```bash
-   npm run bundle
-   ```
-
-1. :white_check_mark: Check your artifact
-
-   There will be a tgz file in your extension directory now
-
-## Update the Extension Metadata
-
-The [`package.json`](package.json) file defines metadata about your extension, such as
-extension name, main entry, description and version.
-
-When you copy this repository, update `package.json` with the name, description for your extension.
-
-## Update the Extension Code
-
-The [`src/`](./src/) directory is the heart of your extension! This contains the
-source code that will be run when your extension functions are invoked. You can replace the
-contents of this directory with your own code.
-
-There are a few things to keep in mind when writing your extension code:
-
-- Most Jan Extension functions are processed asynchronously.
-  In `index.ts`, you will see that the extension function will return a `Promise`.
-
-  ```typescript
-  import { events, MessageEvent, MessageRequest } from '@janhq/core'
-
-  function onStart(): Promise<void> {
-    return events.on(MessageEvent.OnMessageSent, (data: MessageRequest) =>
-      this.inference(data)
-    )
-  }
-  ```
-
-  For more information about the Jan Extension Core module, see the
-  [documentation](https://github.com/janhq/jan/blob/main/core/README.md).
-
-So, what are you waiting for? Go ahead and start customizing your extension!
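Every remote-engine extension deleted in this diff follows the same shape: subclass `RemoteOAIEngine`, read the API key and chat-completions endpoint from settings in `onLoad`, and fall back to the default endpoint bundled in `resources/settings.json` whenever the stored value is empty. The sketch below distills that pattern; it is illustrative only, with a hypothetical provider id, setting key, and default endpoint, and it uses the same `@janhq/core` calls that appear in the deleted sources above.

```typescript
// Hedged sketch of the deleted extensions' shared pattern; the provider id,
// 'example-api-key' setting key, and DEFAULT_ENDPOINT value are made up.
import { RemoteOAIEngine } from '@janhq/core'

enum Settings {
  apiKey = 'example-api-key', // hypothetical setting key
  chatCompletionsEndPoint = 'chat-completions-endpoint',
}

// Stand-in for the default value normally bundled in resources/settings.json
// and injected as the SETTINGS constant by the rolldown `define` block.
const DEFAULT_ENDPOINT = 'https://api.example.com/v1/chat/completions'

export default class JanInferenceExampleExtension extends RemoteOAIEngine {
  inferenceUrl: string = ''
  provider: string = 'example'

  override async onLoad(): Promise<void> {
    super.onLoad()
    this.apiKey = await this.getSetting<string>(Settings.apiKey, '')
    this.inferenceUrl = await this.getSetting<string>(
      Settings.chatCompletionsEndPoint,
      ''
    )
    // Fall back to the bundled default when no endpoint has been saved yet.
    if (this.inferenceUrl.length === 0) {
      this.inferenceUrl = DEFAULT_ENDPOINT
    }
  }

  onSettingUpdate<T>(key: string, value: T): void {
    if (key === Settings.apiKey) {
      this.apiKey = value as string
    } else if (key === Settings.chatCompletionsEndPoint) {
      if (typeof value !== 'string') return
      // An emptied input reverts to the default instead of breaking requests.
      this.inferenceUrl = value.trim().length === 0 ? DEFAULT_ENDPOINT : value
    }
  }
}
```

Centralizing the fallback in one constant, rather than re-scanning `SETTINGS` in both `onLoad` and `onSettingUpdate` as the deleted extensions did, keeps the two code paths from drifting.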
diff --git a/extensions/inference-triton-trtllm-extension/package.json b/extensions/inference-triton-trtllm-extension/package.json
deleted file mode 100644
index 9c1f5e05f..000000000
--- a/extensions/inference-triton-trtllm-extension/package.json
+++ /dev/null
@@ -1,42 +0,0 @@
-{
-  "name": "@janhq/inference-triton-trt-llm-extension",
-  "productName": "Triton-TRT-LLM Inference Engine",
-  "version": "1.0.0",
-  "description": "This extension enables Nvidia's TensorRT-LLM as an inference engine option",
-  "main": "dist/index.js",
-  "engine": "triton_trtllm",
-  "author": "Jan ",
-  "license": "AGPL-3.0",
-  "scripts": {
-    "build": "rolldown -c rolldown.config.mjs",
-    "build:publish": "rimraf *.tgz --glob || true && yarn build && npm pack && cpx *.tgz ../../pre-install"
-  },
-  "devDependencies": {
-    "cpx": "^1.5.0",
-    "rimraf": "^3.0.2",
-    "rolldown": "1.0.0-beta.1",
-    "ts-loader": "^9.5.0",
-    "typescript": "^5.7.2"
-  },
-  "dependencies": {
-    "@janhq/core": "../../core/package.tgz",
-    "fetch-retry": "^5.0.6",
-    "rxjs": "^7.8.1",
-    "ulidx": "^2.3.0"
-  },
-  "engines": {
-    "node": ">=18.0.0"
-  },
-  "files": [
-    "dist/*",
-    "package.json",
-    "README.md"
-  ],
-  "bundleDependencies": [
-    "fetch-retry"
-  ],
-  "installConfig": {
-    "hoistingLimits": "workspaces"
-  },
-  "packageManager": "yarn@4.5.3"
-}
diff --git a/extensions/inference-triton-trtllm-extension/resources/settings.json b/extensions/inference-triton-trtllm-extension/resources/settings.json
deleted file mode 100644
index 26b80a686..000000000
--- a/extensions/inference-triton-trtllm-extension/resources/settings.json
+++ /dev/null
@@ -1,24 +0,0 @@
-[
-  {
-    "key": "tritonllm-api-key",
-    "title": "API Key",
-    "description": "The Triton LLM API uses API keys for authentication.",
-    "controllerType": "input",
-    "controllerProps": {
-      "placeholder": "Insert API Key",
-      "value": "",
-      "type": "password",
-      "inputActions": ["unobscure", "copy"]
-    }
-  },
-  {
-    "key": "chat-completions-endpoint",
-    "title": "Chat Completions Endpoint",
-    "description": "The endpoint to use for chat completions.",
-    "controllerType": "input",
-    "controllerProps": {
-      "placeholder": "http://localhost:8000/v2/models/tensorrt_llm_bls/generate",
-      "value": "http://localhost:8000/v2/models/tensorrt_llm_bls/generate"
-    }
-  }
-]
diff --git a/extensions/inference-triton-trtllm-extension/rolldown.config.mjs b/extensions/inference-triton-trtllm-extension/rolldown.config.mjs
deleted file mode 100644
index e0659a485..000000000
--- a/extensions/inference-triton-trtllm-extension/rolldown.config.mjs
+++ /dev/null
@@ -1,16 +0,0 @@
-import { defineConfig } from 'rolldown'
-import pkgJson from './package.json' with { type: 'json' }
-import settingJson from './resources/settings.json' with { type: 'json' }
-
-export default defineConfig({
-  input: 'src/index.ts',
-  output: {
-    format: 'esm',
-    file: 'dist/index.js',
-  },
-  platform: 'browser',
-  define: {
-    SETTINGS: JSON.stringify(settingJson),
-    ENGINE: JSON.stringify(pkgJson.engine),
-  },
-})
diff --git a/extensions/inference-triton-trtllm-extension/src/env.d.ts b/extensions/inference-triton-trtllm-extension/src/env.d.ts
deleted file mode 100644
index 4ff21449c..000000000
--- a/extensions/inference-triton-trtllm-extension/src/env.d.ts
+++ /dev/null
@@ -1 +0,0 @@
-declare const SETTINGS: SettingComponentProps[]
diff --git a/extensions/inference-triton-trtllm-extension/src/index.ts b/extensions/inference-triton-trtllm-extension/src/index.ts
deleted file mode 100644
index 2f351defe..000000000
--- a/extensions/inference-triton-trtllm-extension/src/index.ts
+++ /dev/null
@@ -1,66 +0,0 @@
-/**
- * @file This file exports a class that implements the InferenceExtension interface from the @janhq/core package.
- * The class provides methods for initializing and stopping a model, and for making inference requests.
- * It also subscribes to events emitted by the @janhq/core package and handles new message requests.
- * @version 1.0.0
- * @module inference-nvidia-triton-trt-llm-extension/src/index
- */
-
-import { RemoteOAIEngine } from '@janhq/core'
-
-enum Settings {
-  apiKey = 'tritonllm-api-key',
-  chatCompletionsEndPoint = 'chat-completions-endpoint',
-}
-/**
- * A class that implements the InferenceExtension interface from the @janhq/core package.
- * The class provides methods for initializing and stopping a model, and for making inference requests.
- * It also subscribes to events emitted by the @janhq/core package and handles new message requests.
- */
-export default class JanInferenceTritonTrtLLMExtension extends RemoteOAIEngine {
-  inferenceUrl: string = ''
-  provider: string = 'triton_trtllm'
-
-  /**
-   * Subscribes to events emitted by the @janhq/core package.
-   */
-  async onLoad() {
-    super.onLoad()
-
-    // Register Settings
-    this.registerSettings(SETTINGS)
-
-    // Retrieve API Key Setting
-    this.apiKey = await this.getSetting(Settings.apiKey, '')
-    this.inferenceUrl = await this.getSetting(
-      Settings.chatCompletionsEndPoint,
-      ''
-    )
-
-    if (this.inferenceUrl.length === 0) {
-      SETTINGS.forEach((setting) => {
-        if (setting.key === Settings.chatCompletionsEndPoint) {
-          this.inferenceUrl = setting.controllerProps.value as string
-        }
-      })
-    }
-  }
-
-  onSettingUpdate<T>(key: string, value: T): void {
-    if (key === Settings.apiKey) {
-      this.apiKey = value as string
-    } else if (key === Settings.chatCompletionsEndPoint) {
-      if (typeof value !== 'string') return
-
-      if (value.trim().length === 0) {
-        SETTINGS.forEach((setting) => {
-          if (setting.key === Settings.chatCompletionsEndPoint) {
-            this.inferenceUrl = setting.controllerProps.value as string
-          }
-        })
-      } else {
-        this.inferenceUrl = value
-      }
-    }
-  }
-}
diff --git a/extensions/inference-triton-trtllm-extension/tsconfig.json b/extensions/inference-triton-trtllm-extension/tsconfig.json
deleted file mode 100644
index 2477d58ce..000000000
--- a/extensions/inference-triton-trtllm-extension/tsconfig.json
+++ /dev/null
@@ -1,14 +0,0 @@
-{
-  "compilerOptions": {
-    "target": "es2016",
-    "module": "ES6",
-    "moduleResolution": "node",
-    "outDir": "./dist",
-    "esModuleInterop": true,
-    "forceConsistentCasingInFileNames": true,
-    "strict": false,
-    "skipLibCheck": true,
-    "rootDir": "./src"
-  },
-  "include": ["./src"]
-}
diff --git a/extensions/model-extension/src/cortex.ts b/extensions/model-extension/src/cortex.ts
index ca5763962..7618e8170 100644
--- a/extensions/model-extension/src/cortex.ts
+++ b/extensions/model-extension/src/cortex.ts
@@ -183,6 +183,7 @@ export class CortexAPI implements ICortexAPI {
     model.parameters = {
       ...extractInferenceParams(model),
       ...model.parameters,
+      ...model.inference_params,
     }
     model.settings = {
       ...extractModelLoadParams(model),
diff --git a/extensions/yarn.lock b/extensions/yarn.lock
index d139b917c..d7ef3c4cb 100644
--- a/extensions/yarn.lock
+++ b/extensions/yarn.lock
@@ -509,161 +509,71 @@ __metadata:
 "@janhq/core@file:../../core/package.tgz::locator=%40janhq%2Fassistant-extension%40workspace%3Aassistant-extension":
   version: 0.1.10
-  resolution: "@janhq/core@file:../../core/package.tgz#../../core/package.tgz::hash=91cd98&locator=%40janhq%2Fassistant-extension%40workspace%3Aassistant-extension"
+  resolution: "@janhq/core@file:../../core/package.tgz#../../core/package.tgz::hash=e8dac7&locator=%40janhq%2Fassistant-extension%40workspace%3Aassistant-extension"
   dependencies:
     rxjs: "npm:^7.8.1"
     ulidx: "npm:^2.3.0"
-  checksum: 10c0/af79c509b1ff8a2893f5fd6545cfa8b3bb6a2e2bc13acdd5963766a1caac635b8b69ab627bfb356e052f16542f2b7187b607bdaed6acec24cd7c9a6087e4abc2
+  checksum: 10c0/394734b0cc26f051a9ad138f8ae642d066acff07de26ab7c4b944d190c030cb422ac044da6352461589e13a480425200cbd8e5a549cf0181cd5c9af4b1d7eb2c
   languageName: node
   linkType: hard
 
 "@janhq/core@file:../../core/package.tgz::locator=%40janhq%2Fconversational-extension%40workspace%3Aconversational-extension":
   version: 0.1.10
-  resolution: "@janhq/core@file:../../core/package.tgz#../../core/package.tgz::hash=91cd98&locator=%40janhq%2Fconversational-extension%40workspace%3Aconversational-extension"
+  resolution: "@janhq/core@file:../../core/package.tgz#../../core/package.tgz::hash=e8dac7&locator=%40janhq%2Fconversational-extension%40workspace%3Aconversational-extension"
   dependencies:
     rxjs: "npm:^7.8.1"
    ulidx: "npm:^2.3.0"
-  checksum: 10c0/af79c509b1ff8a2893f5fd6545cfa8b3bb6a2e2bc13acdd5963766a1caac635b8b69ab627bfb356e052f16542f2b7187b607bdaed6acec24cd7c9a6087e4abc2
+  checksum: 10c0/394734b0cc26f051a9ad138f8ae642d066acff07de26ab7c4b944d190c030cb422ac044da6352461589e13a480425200cbd8e5a549cf0181cd5c9af4b1d7eb2c
   languageName: node
   linkType: hard
 
 "@janhq/core@file:../../core/package.tgz::locator=%40janhq%2Fengine-management-extension%40workspace%3Aengine-management-extension":
   version: 0.1.10
-  resolution: "@janhq/core@file:../../core/package.tgz#../../core/package.tgz::hash=91cd98&locator=%40janhq%2Fengine-management-extension%40workspace%3Aengine-management-extension"
+  resolution: "@janhq/core@file:../../core/package.tgz#../../core/package.tgz::hash=e8dac7&locator=%40janhq%2Fengine-management-extension%40workspace%3Aengine-management-extension"
   dependencies:
     rxjs: "npm:^7.8.1"
     ulidx: "npm:^2.3.0"
-  checksum: 10c0/af79c509b1ff8a2893f5fd6545cfa8b3bb6a2e2bc13acdd5963766a1caac635b8b69ab627bfb356e052f16542f2b7187b607bdaed6acec24cd7c9a6087e4abc2
-  languageName: node
-  linkType: hard
-
-"@janhq/core@file:../../core/package.tgz::locator=%40janhq%2Finference-anthropic-extension%40workspace%3Ainference-anthropic-extension":
-  version: 0.1.10
-  resolution: "@janhq/core@file:../../core/package.tgz#../../core/package.tgz::hash=91cd98&locator=%40janhq%2Finference-anthropic-extension%40workspace%3Ainference-anthropic-extension"
-  dependencies:
-    rxjs: "npm:^7.8.1"
-    ulidx: "npm:^2.3.0"
-  checksum: 10c0/af79c509b1ff8a2893f5fd6545cfa8b3bb6a2e2bc13acdd5963766a1caac635b8b69ab627bfb356e052f16542f2b7187b607bdaed6acec24cd7c9a6087e4abc2
-  languageName: node
-  linkType: hard
-
-"@janhq/core@file:../../core/package.tgz::locator=%40janhq%2Finference-cohere-extension%40workspace%3Ainference-cohere-extension":
-  version: 0.1.10
-  resolution: "@janhq/core@file:../../core/package.tgz#../../core/package.tgz::hash=91cd98&locator=%40janhq%2Finference-cohere-extension%40workspace%3Ainference-cohere-extension"
-  dependencies:
-    rxjs: "npm:^7.8.1"
-    ulidx: "npm:^2.3.0"
-  checksum: 10c0/af79c509b1ff8a2893f5fd6545cfa8b3bb6a2e2bc13acdd5963766a1caac635b8b69ab627bfb356e052f16542f2b7187b607bdaed6acec24cd7c9a6087e4abc2
+  checksum: 10c0/394734b0cc26f051a9ad138f8ae642d066acff07de26ab7c4b944d190c030cb422ac044da6352461589e13a480425200cbd8e5a549cf0181cd5c9af4b1d7eb2c
   languageName: node
   linkType: hard
 
 "@janhq/core@file:../../core/package.tgz::locator=%40janhq%2Finference-cortex-extension%40workspace%3Ainference-cortex-extension":
   version: 0.1.10
-  resolution: "@janhq/core@file:../../core/package.tgz#../../core/package.tgz::hash=91cd98&locator=%40janhq%2Finference-cortex-extension%40workspace%3Ainference-cortex-extension"
+  resolution: "@janhq/core@file:../../core/package.tgz#../../core/package.tgz::hash=e8dac7&locator=%40janhq%2Finference-cortex-extension%40workspace%3Ainference-cortex-extension"
   dependencies:
     rxjs: "npm:^7.8.1"
     ulidx: "npm:^2.3.0"
-  checksum: 10c0/af79c509b1ff8a2893f5fd6545cfa8b3bb6a2e2bc13acdd5963766a1caac635b8b69ab627bfb356e052f16542f2b7187b607bdaed6acec24cd7c9a6087e4abc2
-  languageName: node
-  linkType: hard
-
-"@janhq/core@file:../../core/package.tgz::locator=%40janhq%2Finference-groq-extension%40workspace%3Ainference-groq-extension":
-  version: 0.1.10
-  resolution: "@janhq/core@file:../../core/package.tgz#../../core/package.tgz::hash=91cd98&locator=%40janhq%2Finference-groq-extension%40workspace%3Ainference-groq-extension"
-  dependencies:
-    rxjs: "npm:^7.8.1"
-    ulidx: "npm:^2.3.0"
-  checksum: 10c0/af79c509b1ff8a2893f5fd6545cfa8b3bb6a2e2bc13acdd5963766a1caac635b8b69ab627bfb356e052f16542f2b7187b607bdaed6acec24cd7c9a6087e4abc2
-  languageName: node
-  linkType: hard
-
-"@janhq/core@file:../../core/package.tgz::locator=%40janhq%2Finference-martian-extension%40workspace%3Ainference-martian-extension":
-  version: 0.1.10
-  resolution: "@janhq/core@file:../../core/package.tgz#../../core/package.tgz::hash=91cd98&locator=%40janhq%2Finference-martian-extension%40workspace%3Ainference-martian-extension"
-  dependencies:
-    rxjs: "npm:^7.8.1"
-    ulidx: "npm:^2.3.0"
-  checksum: 10c0/af79c509b1ff8a2893f5fd6545cfa8b3bb6a2e2bc13acdd5963766a1caac635b8b69ab627bfb356e052f16542f2b7187b607bdaed6acec24cd7c9a6087e4abc2
-  languageName: node
-  linkType: hard
-
-"@janhq/core@file:../../core/package.tgz::locator=%40janhq%2Finference-mistral-extension%40workspace%3Ainference-mistral-extension":
-  version: 0.1.10
-  resolution: "@janhq/core@file:../../core/package.tgz#../../core/package.tgz::hash=91cd98&locator=%40janhq%2Finference-mistral-extension%40workspace%3Ainference-mistral-extension"
-  dependencies:
-    rxjs: "npm:^7.8.1"
-    ulidx: "npm:^2.3.0"
-  checksum: 10c0/af79c509b1ff8a2893f5fd6545cfa8b3bb6a2e2bc13acdd5963766a1caac635b8b69ab627bfb356e052f16542f2b7187b607bdaed6acec24cd7c9a6087e4abc2
-  languageName: node
-  linkType: hard
-
-"@janhq/core@file:../../core/package.tgz::locator=%40janhq%2Finference-nvidia-extension%40workspace%3Ainference-nvidia-extension":
-  version: 0.1.10
-  resolution: "@janhq/core@file:../../core/package.tgz#../../core/package.tgz::hash=91cd98&locator=%40janhq%2Finference-nvidia-extension%40workspace%3Ainference-nvidia-extension"
-  dependencies:
-    rxjs: "npm:^7.8.1"
-    ulidx: "npm:^2.3.0"
-  checksum: 10c0/af79c509b1ff8a2893f5fd6545cfa8b3bb6a2e2bc13acdd5963766a1caac635b8b69ab627bfb356e052f16542f2b7187b607bdaed6acec24cd7c9a6087e4abc2
-  languageName: node
-  linkType: hard
-
-"@janhq/core@file:../../core/package.tgz::locator=%40janhq%2Finference-openai-extension%40workspace%3Ainference-openai-extension":
-  version: 0.1.10
-  resolution: "@janhq/core@file:../../core/package.tgz#../../core/package.tgz::hash=91cd98&locator=%40janhq%2Finference-openai-extension%40workspace%3Ainference-openai-extension"
-  dependencies:
-    rxjs: "npm:^7.8.1"
-    ulidx: "npm:^2.3.0"
-  checksum: 10c0/af79c509b1ff8a2893f5fd6545cfa8b3bb6a2e2bc13acdd5963766a1caac635b8b69ab627bfb356e052f16542f2b7187b607bdaed6acec24cd7c9a6087e4abc2
-  languageName: node
-  linkType: hard
-
-"@janhq/core@file:../../core/package.tgz::locator=%40janhq%2Finference-openrouter-extension%40workspace%3Ainference-openrouter-extension":
-  version: 0.1.10
-  resolution: "@janhq/core@file:../../core/package.tgz#../../core/package.tgz::hash=91cd98&locator=%40janhq%2Finference-openrouter-extension%40workspace%3Ainference-openrouter-extension"
-  dependencies:
-    rxjs: "npm:^7.8.1"
-    ulidx: "npm:^2.3.0"
-  checksum: 10c0/af79c509b1ff8a2893f5fd6545cfa8b3bb6a2e2bc13acdd5963766a1caac635b8b69ab627bfb356e052f16542f2b7187b607bdaed6acec24cd7c9a6087e4abc2
-  languageName: node
-  linkType: hard
-
-"@janhq/core@file:../../core/package.tgz::locator=%40janhq%2Finference-triton-trt-llm-extension%40workspace%3Ainference-triton-trtllm-extension":
-  version: 0.1.10
-  resolution: "@janhq/core@file:../../core/package.tgz#../../core/package.tgz::hash=91cd98&locator=%40janhq%2Finference-triton-trt-llm-extension%40workspace%3Ainference-triton-trtllm-extension"
-  dependencies:
-    rxjs: "npm:^7.8.1"
-    ulidx: "npm:^2.3.0"
-  checksum: 10c0/af79c509b1ff8a2893f5fd6545cfa8b3bb6a2e2bc13acdd5963766a1caac635b8b69ab627bfb356e052f16542f2b7187b607bdaed6acec24cd7c9a6087e4abc2
+  checksum: 10c0/394734b0cc26f051a9ad138f8ae642d066acff07de26ab7c4b944d190c030cb422ac044da6352461589e13a480425200cbd8e5a549cf0181cd5c9af4b1d7eb2c
   languageName: node
   linkType: hard
 
 "@janhq/core@file:../../core/package.tgz::locator=%40janhq%2Fmodel-extension%40workspace%3Amodel-extension":
   version: 0.1.10
-  resolution: "@janhq/core@file:../../core/package.tgz#../../core/package.tgz::hash=91cd98&locator=%40janhq%2Fmodel-extension%40workspace%3Amodel-extension"
+  resolution: "@janhq/core@file:../../core/package.tgz#../../core/package.tgz::hash=e8dac7&locator=%40janhq%2Fmodel-extension%40workspace%3Amodel-extension"
   dependencies:
     rxjs: "npm:^7.8.1"
     ulidx: "npm:^2.3.0"
-  checksum: 10c0/af79c509b1ff8a2893f5fd6545cfa8b3bb6a2e2bc13acdd5963766a1caac635b8b69ab627bfb356e052f16542f2b7187b607bdaed6acec24cd7c9a6087e4abc2
+  checksum: 10c0/394734b0cc26f051a9ad138f8ae642d066acff07de26ab7c4b944d190c030cb422ac044da6352461589e13a480425200cbd8e5a549cf0181cd5c9af4b1d7eb2c
   languageName: node
   linkType: hard
 
 "@janhq/core@file:../../core/package.tgz::locator=%40janhq%2Fmonitoring-extension%40workspace%3Amonitoring-extension":
   version: 0.1.10
-  resolution: "@janhq/core@file:../../core/package.tgz#../../core/package.tgz::hash=91cd98&locator=%40janhq%2Fmonitoring-extension%40workspace%3Amonitoring-extension"
+  resolution: "@janhq/core@file:../../core/package.tgz#../../core/package.tgz::hash=e8dac7&locator=%40janhq%2Fmonitoring-extension%40workspace%3Amonitoring-extension"
   dependencies:
     rxjs: "npm:^7.8.1"
     ulidx: "npm:^2.3.0"
-  checksum: 10c0/af79c509b1ff8a2893f5fd6545cfa8b3bb6a2e2bc13acdd5963766a1caac635b8b69ab627bfb356e052f16542f2b7187b607bdaed6acec24cd7c9a6087e4abc2
+  checksum: 10c0/394734b0cc26f051a9ad138f8ae642d066acff07de26ab7c4b944d190c030cb422ac044da6352461589e13a480425200cbd8e5a549cf0181cd5c9af4b1d7eb2c
   languageName: node
   linkType: hard
 
 "@janhq/core@file:../../core/package.tgz::locator=%40janhq%2Ftensorrt-llm-extension%40workspace%3Atensorrt-llm-extension":
   version: 0.1.10
-  resolution: "@janhq/core@file:../../core/package.tgz#../../core/package.tgz::hash=91cd98&locator=%40janhq%2Ftensorrt-llm-extension%40workspace%3Atensorrt-llm-extension"
+  resolution: "@janhq/core@file:../../core/package.tgz#../../core/package.tgz::hash=e8dac7&locator=%40janhq%2Ftensorrt-llm-extension%40workspace%3Atensorrt-llm-extension"
   dependencies:
     rxjs: "npm:^7.8.1"
     ulidx: "npm:^2.3.0"
-  checksum: 10c0/af79c509b1ff8a2893f5fd6545cfa8b3bb6a2e2bc13acdd5963766a1caac635b8b69ab627bfb356e052f16542f2b7187b607bdaed6acec24cd7c9a6087e4abc2
+  checksum: 10c0/394734b0cc26f051a9ad138f8ae642d066acff07de26ab7c4b944d190c030cb422ac044da6352461589e13a480425200cbd8e5a549cf0181cd5c9af4b1d7eb2c
   languageName: node
   linkType: hard
 
@@ -683,36 +593,6 @@ __metadata:
   languageName: unknown
   linkType: soft
 
-"@janhq/inference-anthropic-extension@workspace:inference-anthropic-extension":
-  version: 0.0.0-use.local
-  resolution: "@janhq/inference-anthropic-extension@workspace:inference-anthropic-extension"
-  dependencies:
-    "@janhq/core": ../../core/package.tgz
-    cpx: "npm:^1.5.0"
-    fetch-retry: "npm:^5.0.6"
-    rimraf: "npm:^3.0.2"
-    rolldown: "npm:1.0.0-beta.1"
-    ts-loader: "npm:^9.5.0"
-    typescript: "npm:^5.7.2"
-    ulidx: "npm:^2.3.0"
-  languageName: unknown
-  linkType: soft
-
-"@janhq/inference-cohere-extension@workspace:inference-cohere-extension":
-  version: 0.0.0-use.local
-  resolution: "@janhq/inference-cohere-extension@workspace:inference-cohere-extension"
-  dependencies:
-    "@janhq/core": ../../core/package.tgz
-    cpx: "npm:^1.5.0"
-    fetch-retry: "npm:^5.0.6"
-    rimraf: "npm:^3.0.2"
-    rolldown: "npm:1.0.0-beta.1"
-    ts-loader: "npm:^9.5.0"
-    typescript: "npm:^5.7.2"
-    ulidx: "npm:^2.3.0"
-  languageName: unknown
-  linkType: soft
-
 "@janhq/inference-cortex-extension@workspace:inference-cortex-extension":
   version: 0.0.0-use.local
   resolution: "@janhq/inference-cortex-extension@workspace:inference-cortex-extension"
   dependencies:
@@ -743,112 +623,6 @@ __metadata:
   languageName: unknown
   linkType: soft
 
-"@janhq/inference-groq-extension@workspace:inference-groq-extension":
-  version: 0.0.0-use.local
-  resolution: "@janhq/inference-groq-extension@workspace:inference-groq-extension"
-  dependencies:
-    "@janhq/core": ../../core/package.tgz
-    cpx: "npm:^1.5.0"
-    fetch-retry: "npm:^5.0.6"
-    rimraf: "npm:^3.0.2"
-    rolldown: "npm:1.0.0-beta.1"
-    ts-loader: "npm:^9.5.0"
-    typescript: "npm:^5.7.2"
-    ulidx: "npm:^2.3.0"
-  languageName: unknown
-  linkType: soft
-
-"@janhq/inference-martian-extension@workspace:inference-martian-extension":
-  version: 0.0.0-use.local
-  resolution: "@janhq/inference-martian-extension@workspace:inference-martian-extension"
-  dependencies:
-    "@janhq/core": ../../core/package.tgz
-    cpx: "npm:^1.5.0"
-    fetch-retry: "npm:^5.0.6"
-    rimraf: "npm:^3.0.2"
-    rolldown: "npm:1.0.0-beta.1"
-    ts-loader: "npm:^9.5.0"
-    typescript: "npm:^5.7.2"
-    ulidx: "npm:^2.3.0"
-  languageName: unknown
-  linkType: soft
-
-"@janhq/inference-mistral-extension@workspace:inference-mistral-extension":
-  version: 0.0.0-use.local
-  resolution: "@janhq/inference-mistral-extension@workspace:inference-mistral-extension"
-  dependencies:
-    "@janhq/core": ../../core/package.tgz
-    cpx: "npm:^1.5.0"
-    fetch-retry: "npm:^5.0.6"
-    rimraf: "npm:^3.0.2"
-    rolldown: "npm:1.0.0-beta.1"
-    ts-loader: "npm:^9.5.0"
-    typescript: "npm:^5.7.2"
-    ulidx: "npm:^2.3.0"
-  languageName: unknown
-  linkType: soft
-
-"@janhq/inference-nvidia-extension@workspace:inference-nvidia-extension":
-  version: 0.0.0-use.local
-  resolution: "@janhq/inference-nvidia-extension@workspace:inference-nvidia-extension"
-  dependencies:
-    "@janhq/core": ../../core/package.tgz
-    cpx: "npm:^1.5.0"
-    fetch-retry: "npm:^5.0.6"
-    rimraf: "npm:^3.0.2"
-    rolldown: "npm:1.0.0-beta.1"
-    ts-loader: "npm:^9.5.0"
-    typescript: "npm:^5.7.2"
-    ulidx: "npm:^2.3.0"
-  languageName: unknown
-  linkType: soft
-
-"@janhq/inference-openai-extension@workspace:inference-openai-extension":
-  version: 0.0.0-use.local
-  resolution: "@janhq/inference-openai-extension@workspace:inference-openai-extension"
-  dependencies:
-    "@janhq/core": ../../core/package.tgz
-    cpx: "npm:^1.5.0"
-    fetch-retry: "npm:^5.0.6"
-    rimraf: "npm:^3.0.2"
-    rolldown: "npm:1.0.0-beta.1"
-    ts-loader: "npm:^9.5.0"
-    typescript: "npm:^5.7.2"
-    ulidx: "npm:^2.3.0"
-  languageName: unknown
-  linkType: soft
-
-"@janhq/inference-openrouter-extension@workspace:inference-openrouter-extension":
-  version: 0.0.0-use.local
-  resolution: "@janhq/inference-openrouter-extension@workspace:inference-openrouter-extension"
-  dependencies:
-    "@janhq/core": ../../core/package.tgz
-    cpx: "npm:^1.5.0"
-    fetch-retry: "npm:^5.0.6"
-    rimraf: "npm:^3.0.2"
-    rolldown: "npm:1.0.0-beta.1"
-    ts-loader: "npm:^9.5.0"
-    typescript: "npm:^5.7.2"
-    ulidx: "npm:^2.3.0"
-  languageName: unknown
-  linkType: soft
-
-"@janhq/inference-triton-trt-llm-extension@workspace:inference-triton-trtllm-extension":
-  version: 0.0.0-use.local
-  resolution: "@janhq/inference-triton-trt-llm-extension@workspace:inference-triton-trtllm-extension"
-  dependencies:
-    "@janhq/core": ../../core/package.tgz
-    cpx: "npm:^1.5.0"
-    fetch-retry: "npm:^5.0.6"
-    rimraf: "npm:^3.0.2"
-    rolldown: "npm:1.0.0-beta.1"
-    rxjs: "npm:^7.8.1"
-    ts-loader: "npm:^9.5.0"
-    typescript: "npm:^5.7.2"
-    ulidx: "npm:^2.3.0"
-  languageName: unknown
-  linkType: soft
-
 "@janhq/model-extension@workspace:model-extension":
   version: 0.0.0-use.local
   resolution: "@janhq/model-extension@workspace:model-extension"
   dependencies:
diff --git a/web/containers/ErrorMessage/index.tsx b/web/containers/ErrorMessage/index.tsx
index e0705e6b6..71fd56c5d 100644
--- a/web/containers/ErrorMessage/index.tsx
+++ b/web/containers/ErrorMessage/index.tsx
@@ -1,7 +1,7 @@
 import {
   EngineManager,
   ErrorCode,
-  MessageStatus,
+  InferenceEngine,
   ThreadMessage,
 } from '@janhq/core'
@@ -14,8 +14,6 @@ import ModalTroubleShooting, {
 
 import { MainViewState } from '@/constants/screens'
 
-import { isLocalEngine } from '@/utils/modelEngine'
-
 import { mainViewStateAtom } from '@/helpers/atoms/App.atom'
 import { activeAssistantAtom } from '@/helpers/atoms/Assistant.atom'
@@ -82,7 +80,7 @@ const ErrorMessage = ({ message }: { message: ThreadMessage }) => {
             >
               {message.content[0]?.text?.value === 'Failed to fetch' &&
               engine &&
-              !isLocalEngine(String(engine?.name)) ? (
+              engine?.name !== InferenceEngine.cortex_llamacpp ? (
                 No internet connection.
Switch to an on-device model or check connection. diff --git a/web/containers/Layout/BottomPanel/SystemMonitor/TableActiveModel/index.tsx b/web/containers/Layout/BottomPanel/SystemMonitor/TableActiveModel/index.tsx index 8ad16eeba..06eebea92 100644 --- a/web/containers/Layout/BottomPanel/SystemMonitor/TableActiveModel/index.tsx +++ b/web/containers/Layout/BottomPanel/SystemMonitor/TableActiveModel/index.tsx @@ -1,6 +1,6 @@ import { Tooltip, Button, Badge } from '@janhq/joi' -import { useAtom } from 'jotai' +import { useAtom, useAtomValue } from 'jotai' import { useActiveModel } from '@/hooks/useActiveModel' @@ -8,10 +8,12 @@ import { toGibibytes } from '@/utils/converter' import { isLocalEngine } from '@/utils/modelEngine' +import { installedEnginesAtom } from '@/helpers/atoms/Engines.atom' import { serverEnabledAtom } from '@/helpers/atoms/LocalServer.atom' const TableActiveModel = () => { const { activeModel, stateModel, stopModel } = useActiveModel() + const engines = useAtomValue(installedEnginesAtom) const [serverEnabled, setServerEnabled] = useAtom(serverEnabledAtom) @@ -19,7 +21,9 @@ const TableActiveModel = () => {
- {activeModel && isLocalEngine(activeModel.engine) ? ( + {activeModel && + engines && + isLocalEngine(engines, activeModel.engine) ? (
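[Note] The call sites above and in ModelHandler below now pass the installed-engines map into isLocalEngine instead of checking against a hardcoded list of local engines. The reworked helper in web/utils/modelEngine.ts is not part of this diff; the following is a minimal sketch consistent with those call sites and with the engineList construction in ModelDropdown (the real body may differ):

import { Engines, InferenceEngine } from '@janhq/core'

// Sketch only: an engine counts as local when its first installed variant is
// not marked 'remote'. Assumes Engines maps an engine name to its variant
// list, as ModelDropdown's Object.entries(engines ?? {}) usage suggests.
export const isLocalEngine = (engines?: Engines, engine?: string): boolean => {
  const variants = engines?.[engine as InferenceEngine]
  return !!variants?.length && variants[0]?.type !== 'remote'
}

Callers such as TableActiveModel then read isLocalEngine(engines, activeModel.engine), with engines supplied by installedEnginesAtom.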
(null) const configuredModels = useAtomValue(configuredModelsAtom) - const featuredModel = configuredModels.filter( + const featuredModels = configuredModels.filter( (x) => manualRecommendationModel.includes(x.id) && x.metadata?.tags?.includes('Featured') && @@ -105,6 +102,16 @@ const ModelDropdown = ({ ) const { updateThreadMetadata } = useCreateNewThread() + const engineList = useMemo( + () => + Object.entries(engines ?? {}).flatMap((e) => ({ + name: e[0], + type: e[1][0]?.type === 'remote' ? 'remote' : 'local', + engine: e[1][0], + })), + [engines] + ) + useClickOutside(() => handleChangeStateOpen(false), null, [ dropdownOptions, toggle, @@ -122,13 +129,6 @@ const ModelDropdown = ({ [setModelDropdownState] ) - const isModelSupportRagAndTools = useCallback((model: Model) => { - return ( - model?.engine === InferenceEngine.openai || - isLocalEngine(model?.engine as InferenceEngine) - ) - }, []) - const filteredDownloadedModels = useMemo( () => configuredModels @@ -142,11 +142,12 @@ const ModelDropdown = ({ ) .filter((e) => { if (searchFilter === 'local') { - return isLocalEngine(e.engine) - } - if (searchFilter === 'remote') { - return !isLocalEngine(e.engine) + return ( + engineList.find((t) => t.engine?.engine === e.engine)?.type === + 'local' + ) } + return true }) .sort((a, b) => a.name.localeCompare(b.name)) .sort((a, b) => { @@ -164,7 +165,7 @@ const ModelDropdown = ({ return 0 } }), - [configuredModels, searchText, searchFilter, downloadedModels] + [configuredModels, searchText, searchFilter, downloadedModels, engineList] ) useEffect(() => { @@ -179,6 +180,15 @@ const ModelDropdown = ({ } }, [open]) + useEffect(() => { + setShowEngineListModel((prev) => [ + ...prev, + ...engineList + .filter((x) => (x.engine?.api_key?.length ?? 0) > 0) + .map((e) => e.name), + ]) + }, [setShowEngineListModel, engineList]) + useEffect(() => { if (!activeThread) return const modelId = activeAssistant?.model?.id @@ -193,6 +203,14 @@ const ModelDropdown = ({ activeAssistant?.model?.id, ]) + const isLocalEngine = useCallback( + (engine?: string) => { + if (!engine) return false + return engineList.some((t) => t.name === engine && t.type === 'local') + }, + [engineList] + ) + const onClickModelItem = useCallback( async (modelId: string) => { if (!activeAssistant) return @@ -210,7 +228,7 @@ const ModelDropdown = ({ tools: [ { type: 'retrieval', - enabled: isModelSupportRagAndTools(model as Model), + enabled: model?.engine === InferenceEngine.cortex, settings: { ...(activeAssistant.tools && activeAssistant.tools[0]?.settings), @@ -225,13 +243,15 @@ const ModelDropdown = ({ 8192, model?.settings.ctx_len ?? 8192 ) + const overriddenParameters = { - ctx_len: !isLocalEngine(model?.engine) - ? undefined - : defaultContextLength, - max_tokens: !isLocalEngine(model?.engine) - ? (model?.parameters.max_tokens ?? 8192) - : defaultContextLength, + ctx_len: model?.settings.ctx_len ? defaultContextLength : undefined, + max_tokens: defaultContextLength + ? Math.min( + model?.parameters.token_limit ?? 
8192, + defaultContextLength + ) + : model?.parameters.token_limit, } const modelParams = { @@ -258,95 +278,17 @@ const ModelDropdown = ({ setSelectedModel, activeThread, updateThreadMetadata, - isModelSupportRagAndTools, setThreadModelParams, updateModelParameter, ] ) - const [extensionHasSettings, setExtensionHasSettings] = useState< - { name?: string; setting: string; apiKey: string; provider: string }[] - >([]) - - const inActiveEngineProvider = useAtomValue(inActiveEngineProviderAtom) - - useEffect(() => { - const getAllSettings = async () => { - const extensionsMenu: { - name?: string - setting: string - apiKey: string - provider: string - }[] = [] - const extensions = extensionManager.getAll() - - for (const extension of extensions) { - if (typeof extension.getSettings === 'function') { - const settings = await extension.getSettings() - if ( - (settings && settings.length > 0) || - (await extension.installationState()) !== 'NotRequired' - ) { - extensionsMenu.push({ - name: extension.productName, - setting: extension.name, - apiKey: - 'apiKey' in extension && typeof extension.apiKey === 'string' - ? extension.apiKey - : '', - provider: - 'provider' in extension && - typeof extension.provider === 'string' - ? extension.provider - : '', - }) - } - } - } - setExtensionHasSettings(extensionsMenu) - } - getAllSettings() - }, []) - - const findByEngine = filteredDownloadedModels - .map((x) => { - // Legacy engine support - they will be grouped under Cortex LlamaCPP - if (x.engine === InferenceEngine.nitro) - return InferenceEngine.cortex_llamacpp - return x.engine - }) - .filter((x) => !inActiveEngineProvider.includes(x)) - - const groupByEngine = findByEngine - .filter(function (item, index) { - if (findByEngine.indexOf(item) === index) return item - }) - .sort((a, b) => { - if (priorityEngine.includes(a) && priorityEngine.includes(b)) { - return priorityEngine.indexOf(a) - priorityEngine.indexOf(b) - } else if (priorityEngine.includes(a)) { - return -1 - } else if (priorityEngine.includes(b)) { - return 1 - } else { - return 0 // Leave the rest in their original order - } - }) - - const getEngineStatusReady: InferenceEngine[] = extensionHasSettings - ?.filter((e) => e.apiKey.length > 0) - .map((x) => x.provider as InferenceEngine) - - useEffect(() => { - setShowEngineListModel((prev) => [ - ...prev, - ...(getEngineStatusReady as InferenceEngine[]), - ]) - // eslint-disable-next-line react-hooks/exhaustive-deps - }, [setShowEngineListModel, extensionHasSettings]) - - const isDownloadALocalModel = downloadedModels.some((x) => - isLocalEngine(x.engine) + const isDownloadALocalModel = useMemo( + () => + downloadedModels.some((x) => + engineList.some((t) => t.name === x.engine && t.type === 'local') + ), + [downloadedModels, engineList] ) if (strictedThread && !activeThread) { @@ -434,85 +376,193 @@ const ModelDropdown = ({ /> - {groupByEngine.map((engine, i) => { - const apiKey = !isLocalEngine(engine) - ? 
extensionHasSettings.filter((x) => x.provider === engine)[0] - ?.apiKey.length > 1 : true - const engineLogo = getLogoEngine(engine as InferenceEngine) - const showModel = showEngineListModel.includes(engine) - const onClickChevron = () => { - if (showModel) { - setShowEngineListModel((prev) => - prev.filter((item) => item !== engine) - ) - } else { - setShowEngineListModel((prev) => [...prev, engine]) + {engineList + .filter((e) => e.type === searchFilter) + .filter( + (e) => + e.type === 'remote' || + e.name === InferenceEngine.cortex_llamacpp || + filteredDownloadedModels.some((m) => m.engine === e.name) + ) + .map((engine, i) => { + const isConfigured = + engine.type === 'local' || + ((engine.engine as EngineConfig).api_key?.length ?? 0) > 1 + const engineLogo = getLogoEngine(engine.name as InferenceEngine) + const showModel = showEngineListModel.includes(engine.name) + const onClickChevron = () => { + if (showModel) { + setShowEngineListModel((prev) => + prev.filter((item) => item !== engine.name) + ) + } else { + setShowEngineListModel((prev) => [...prev, engine.name]) + } } - } return (
-
-
-
- {engineLogo && ( - logo - )} -
- {getTitleByEngine(engine)} -
-
-
- {!isLocalEngine(engine) && ( - - )} - {!showModel ? ( - - ) : ( -
+
+ {engine.type === 'remote' && ( + 0 + } /> - - )} + )} + {!showModel ? ( + + ) : ( + + )} +
-
- {isLocalEngine(engine) && - !isDownloadALocalModel && - showModel && - !searchText.length && ( -
    - {featuredModel.map((model) => { + {engine.type === 'local' && + !isDownloadALocalModel && + showModel && + !searchText.length && ( +
      + {featuredModels.map((model) => { + const isDownloading = downloadingModels.some( + (md) => md === model.id + ) + return ( +
    • +
      +

      + {model.name} +

      + +
      +
      + + {toGibibytes(model.metadata?.size)} + + {!isDownloading ? ( + + downloadModel( + model.sources[0].url, + model.id + ) + } + /> + ) : ( + Object.values(downloadStates) + .filter((x) => x.modelId === model.id) + .map((item) => ( + + )) + )} +
      +
    • + ) + })} +
    + )} + +
      + {filteredDownloadedModels + .filter( + (x) => + x.engine === engine.name || + (x.engine === InferenceEngine.nitro && + engine.name === InferenceEngine.cortex_llamacpp) + ) + .filter((y) => { + if (isLocalEngine(y.engine) && !searchText.length) { + return downloadedModels.find((c) => c.id === y.id) + } else { + return y + } + }) + .map((model) => { + if (!showModel) return null const isDownloading = downloadingModels.some( (md) => md === model.id ) + const isDownloaded = downloadedModels.some( + (c) => c.id === model.id + ) return (
    • { + if (!isConfigured && engine.type === 'remote') + return null + if (isDownloaded) { + onClickModelItem(model.id) + } + }} > -
      +

      {model.name} @@ -523,10 +573,12 @@ const ModelDropdown = ({ />

      - - {toGibibytes(model.metadata?.size)} - - {!isDownloading ? ( + {!isDownloaded && ( + + {toGibibytes(model.metadata?.size)} + + )} + {!isDownloading && !isDownloaded ? ( ) })} -
    - )} - -
      - {filteredDownloadedModels - .filter( - (x) => - x.engine === engine || - (x.engine === InferenceEngine.nitro && - engine === InferenceEngine.cortex_llamacpp) - ) - .filter((y) => { - if (isLocalEngine(y.engine) && !searchText.length) { - return downloadedModels.find((c) => c.id === y.id) - } else { - return y - } - }) - .map((model) => { - if (!showModel) return null - const isDownloading = downloadingModels.some( - (md) => md === model.id - ) - const isDownloaded = downloadedModels.some( - (c) => c.id === model.id - ) - return ( -
    • { - if (!apiKey && !isLocalEngine(model.engine)) - return null - if (isDownloaded) { - onClickModelItem(model.id) - } - }} - > -
      -

      - {model.name} -

      - -
      -
      - {!isDownloaded && ( - - {toGibibytes(model.metadata?.size)} - - )} - {!isDownloading && !isDownloaded ? ( - - downloadModel( - model.sources[0].url, - model.id - ) - } - /> - ) : ( - Object.values(downloadStates) - .filter((x) => x.modelId === model.id) - .map((item) => ( - - )) - )} -
      -
    • - ) - })} -
    +
+
- - ) - })} + ) + })}
diff --git a/web/containers/Providers/DataLoader.tsx b/web/containers/Providers/DataLoader.tsx index 470294996..01093e4b2 100644 --- a/web/containers/Providers/DataLoader.tsx +++ b/web/containers/Providers/DataLoader.tsx @@ -6,6 +6,7 @@ import { AppConfiguration, getUserHomePath } from '@janhq/core' import { useSetAtom } from 'jotai' import useAssistants from '@/hooks/useAssistants' +import useEngines from '@/hooks/useEngines' import useGetSystemResources from '@/hooks/useGetSystemResources' import useModels from '@/hooks/useModels' import useThreads from '@/hooks/useThreads' @@ -25,6 +26,7 @@ const DataLoader: React.FC = () => { const setJanDefaultDataFolder = useSetAtom(defaultJanDataFolderAtom) const setJanSettingScreen = useSetAtom(janSettingScreenAtom) const { getData: loadModels } = useModels() + const { getData: loadEngines } = useEngines() useThreads() useAssistants() @@ -33,6 +35,7 @@ const DataLoader: React.FC = () => { useEffect(() => { // Load data once loadModels() + loadEngines() // eslint-disable-next-line react-hooks/exhaustive-deps }, []) diff --git a/web/containers/Providers/ModelHandler.tsx b/web/containers/Providers/ModelHandler.tsx index 42376c081..32182804c 100644 --- a/web/containers/Providers/ModelHandler.tsx +++ b/web/containers/Providers/ModelHandler.tsx @@ -18,7 +18,7 @@ import { extractInferenceParams, ModelExtension, } from '@janhq/core' -import { useAtom, useAtomValue, useSetAtom } from 'jotai' +import { useAtomValue, useSetAtom } from 'jotai' import { ulid } from 'ulidx' import { activeModelAtom, stateModelAtom } from '@/hooks/useActiveModel' @@ -34,6 +34,7 @@ import { deleteMessageAtom, subscribedGeneratingMessageAtom, } from '@/helpers/atoms/ChatMessage.atom' +import { installedEnginesAtom } from '@/helpers/atoms/Engines.atom' import { downloadedModelsAtom } from '@/helpers/atoms/Model.atom' import { updateThreadWaitingForResponseAtom, @@ -74,6 +75,7 @@ export default function ModelHandler() { const activeModelParams = useAtomValue(getActiveThreadModelParamsAtom) const activeModelParamsRef = useRef(activeModelParams) const setTokenSpeed = useSetAtom(tokenSpeedAtom) + const engines = useAtomValue(installedEnginesAtom) useEffect(() => { activeThreadRef.current = activeThread @@ -241,7 +243,8 @@ export default function ModelHandler() { } else if ( message.status === MessageStatus.Error && activeModelRef.current?.engine && - isLocalEngine(activeModelRef.current.engine) + engines && + isLocalEngine(engines, activeModelRef.current.engine) ) { ;(async () => { if ( @@ -332,7 +335,9 @@ export default function ModelHandler() { if (!activeModelRef.current) return // Check model engine; we don't want to generate a title when it's not a local engine. 
Remote models use the first prompt instead - if (!isLocalEngine(activeModelRef.current?.engine as InferenceEngine)) { + if ( + !isLocalEngine(engines, activeModelRef.current?.engine as InferenceEngine) + ) { const updatedThread: Thread = { ...thread, title: (thread.metadata?.lastMessage as string) || defaultThreadTitle, diff --git a/web/containers/SetupRemoteModel/index.tsx b/web/containers/SetupRemoteModel/index.tsx index 1f5478d73..b4b2cfa42 100644 --- a/web/containers/SetupRemoteModel/index.tsx +++ b/web/containers/SetupRemoteModel/index.tsx @@ -1,5 +1,3 @@ -import { useState, useEffect } from 'react' - import { InferenceEngine } from '@janhq/core' import { Button } from '@janhq/joi' @@ -8,77 +6,23 @@ import { SettingsIcon, PlusIcon } from 'lucide-react' import { MainViewState } from '@/constants/screens' -import { isLocalEngine } from '@/utils/modelEngine' - -import { extensionManager } from '@/extension' import { mainViewStateAtom } from '@/helpers/atoms/App.atom' import { selectedSettingAtom } from '@/helpers/atoms/Setting.atom' type Props = { engine: InferenceEngine + isConfigured: boolean } -const SetupRemoteModel = ({ engine }: Props) => { +const SetupRemoteModel = ({ engine, isConfigured }: Props) => { const setSelectedSetting = useSetAtom(selectedSettingAtom) const setMainViewState = useSetAtom(mainViewStateAtom) - const [extensionHasSettings, setExtensionHasSettings] = useState< - { name?: string; setting: string; apiKey: string; provider: string }[] - >([]) - - useEffect(() => { - const getAllSettings = async () => { - const extensionsMenu: { - name?: string - setting: string - apiKey: string - provider: string - }[] = [] - const extensions = extensionManager.getAll() - - for (const extension of extensions) { - if (typeof extension.getSettings === 'function') { - const settings = await extension.getSettings() - - if ( - (settings && settings.length > 0) || - (await extension.installationState()) !== 'NotRequired' - ) { - extensionsMenu.push({ - name: extension.productName, - setting: extension.name, - apiKey: - 'apiKey' in extension && typeof extension.apiKey === 'string' - ? extension.apiKey - : '', - provider: - 'provider' in extension && - typeof extension.provider === 'string' - ? extension.provider - : '', - }) - } - } - } - setExtensionHasSettings(extensionsMenu) - } - getAllSettings() - }, []) - const onSetupItemClick = (setting: InferenceEngine) => { + setSelectedSetting(setting) setMainViewState(MainViewState.Settings) - setSelectedSetting( - extensionHasSettings.filter((x) => - x.provider.toLowerCase().includes(setting) - )[0]?.setting - ) } - const apiKey = !isLocalEngine(engine) - ?
extensionHasSettings.filter((x) => x.provider === engine)[0]?.apiKey .length > 1 : true - return ( + + + + ) } + export default LocalEngineItems diff --git a/web/screens/Settings/Engines/Settings.tsx b/web/screens/Settings/Engines/LocalEngineSettings.tsx similarity index 99% rename from web/screens/Settings/Engines/Settings.tsx rename to web/screens/Settings/Engines/LocalEngineSettings.tsx index 8cc8501ef..41ca622da 100644 --- a/web/screens/Settings/Engines/Settings.tsx +++ b/web/screens/Settings/Engines/LocalEngineSettings.tsx @@ -36,7 +36,7 @@ const os = () => { } } -const EngineSettings = ({ engine }: { engine: InferenceEngine }) => { +const LocalEngineSettings = ({ engine }: { engine: InferenceEngine }) => { const { installedEngines, mutate: mutateInstalledEngines } = useGetInstalledEngines(engine) const { defaultEngineVariant, mutate: mutateDefaultEngineVariant } = @@ -343,4 +343,4 @@ const EngineSettings = ({ engine }: { engine: InferenceEngine }) => { ) } -export default EngineSettings +export default LocalEngineSettings diff --git a/web/screens/Settings/Engines/ModalAddRemoteEngine.tsx b/web/screens/Settings/Engines/ModalAddRemoteEngine.tsx new file mode 100644 index 000000000..7ea4877cc --- /dev/null +++ b/web/screens/Settings/Engines/ModalAddRemoteEngine.tsx @@ -0,0 +1,213 @@ +import { memo, useState } from 'react' +import { useForm } from 'react-hook-form' + +import { zodResolver } from '@hookform/resolvers/zod' + +import { Button, Input, Modal, TextArea } from '@janhq/joi' +import { PlusIcon } from 'lucide-react' +import { z } from 'zod' + +import { addRemoteEngine, useGetEngines } from '@/hooks/useEngineManagement' + +const engineSchema = z.object({ + engineName: z.string().min(1, 'Engine name is required'), + modelListUrl: z.string().url('Enter a valid Model List URL'), + headerTemplate: z.string().optional(), + apiKey: z.string().optional(), + requestFormat: z.string().optional(), + responseFormat: z.string().optional(), +}) + +const ModalAddRemoteEngine = () => { + const [open, setOpen] = useState(false) + const { mutate: mutateListEngines } = useGetEngines() + const { + register, + handleSubmit, + formState: { errors }, + } = useForm({ + resolver: zodResolver(engineSchema), + defaultValues: { + engineName: '', + apiUrl: '', + modelListUrl: '', + headerTemplate: '', + apiKey: '', + requestFormat: '', + responseFormat: '', + }, + }) + + const onSubmit = async (data: z.infer<typeof engineSchema>) => { + await addRemoteEngine({ + type: 'remote', + engine: data.engineName, + api_key: data.apiKey, + metadata: { + header_template: data.headerTemplate, + get_models_url: data.modelListUrl, + transform_req: { + chat_completions: { + template: data.requestFormat, + }, + }, + transform_resp: { + chat_completions: { + template: data.responseFormat, + }, + }, + }, + }) + mutateListEngines() + + setOpen(false) + } + + // Helper to render labels with asterisks for required fields + const renderLabel = (label: string, isRequired: boolean, desc?: string) => ( + <> + + {label} {isRequired && *} +

+ {desc} +

+ + ) + + return ( + +

Install Remote Engine

+

+ Only OpenAI API-compatible engines are supported +

+ + } + fullPage + open={open} + onOpenChange={() => setOpen(!open)} + trigger={ + + } + content={ +
+
+
+ + + {errors.engineName && ( +

+ {errors.engineName.message} +

+ )} +
+ +
+ + + {errors.modelListUrl && ( +

+ {errors.modelListUrl.message} +

+ )} +
+ +
+ + +
+ +
+ +