From 760cdd29d2e04ed2659ddf2508ef0b4727a47534 Mon Sep 17 00:00:00 2001 From: Service Account Date: Thu, 25 Jan 2024 04:39:01 +0000 Subject: [PATCH 01/65] janhq/jan: Update README.md with nightly build artifact URL --- README.md | 10 +++++----- 1 file changed, 5 insertions(+), 5 deletions(-) diff --git a/README.md b/README.md index faa04e70a..5418f1e74 100644 --- a/README.md +++ b/README.md @@ -76,31 +76,31 @@ Jan is an open-source ChatGPT alternative that runs 100% offline on your compute Experimental (Nightly Build) - + jan.exe - + Intel - + M1/M2 - + jan.deb - + jan.AppImage From 0f3c0e34e46ce5365a921ac62f172d9b7673ae44 Mon Sep 17 00:00:00 2001 From: Service Account Date: Thu, 25 Jan 2024 05:02:59 +0000 Subject: [PATCH 02/65] janhq/jan: Update README.md with nightly build artifact URL --- README.md | 10 +++++----- 1 file changed, 5 insertions(+), 5 deletions(-) diff --git a/README.md b/README.md index 5418f1e74..e75725c31 100644 --- a/README.md +++ b/README.md @@ -76,31 +76,31 @@ Jan is an open-source ChatGPT alternative that runs 100% offline on your compute Experimental (Nightly Build) - + jan.exe - + Intel - + M1/M2 - + jan.deb - + jan.AppImage From 045e544007bd24a36c0a4940ef9c2b33bee5d9ec Mon Sep 17 00:00:00 2001 From: avb-is-me <104213687+avb-is-me@users.noreply.github.com> Date: Thu, 25 Jan 2024 06:14:47 +0000 Subject: [PATCH 03/65] adds devcontainer --- .devcontainer/devcontainer.json | 4 ++++ 1 file changed, 4 insertions(+) create mode 100644 .devcontainer/devcontainer.json diff --git a/.devcontainer/devcontainer.json b/.devcontainer/devcontainer.json new file mode 100644 index 000000000..f980b9df7 --- /dev/null +++ b/.devcontainer/devcontainer.json @@ -0,0 +1,4 @@ +{ + "name": "jan", + "image": "node:20" +} \ No newline at end of file From 3b8e2c55852d03dbf9ed6642639e93ecbb2164d3 Mon Sep 17 00:00:00 2001 From: Service Account Date: Thu, 25 Jan 2024 06:39:28 +0000 Subject: [PATCH 04/65] janhq/jan: Update README.md with nightly build artifact URL --- README.md | 10 +++++----- 1 file changed, 5 insertions(+), 5 deletions(-) diff --git a/README.md b/README.md index e75725c31..82c3ae79b 100644 --- a/README.md +++ b/README.md @@ -76,31 +76,31 @@ Jan is an open-source ChatGPT alternative that runs 100% offline on your compute Experimental (Nightly Build) - + jan.exe - + Intel - + M1/M2 - + jan.deb - + jan.AppImage From 0e48be67e831eccd3d501970a5c2f98eb6b37987 Mon Sep 17 00:00:00 2001 From: Louis Date: Thu, 25 Jan 2024 14:05:33 +0700 Subject: [PATCH 05/65] feat: support multiple model binaries (#1659) * feat: Support multiple model binaries * fix: Update downloadModel with multiple binaries handler * feat: Add 3 models with multiple binaries * chore: fix model download * fix: model file lookup & model path * chore: add .prettierrc * chore: refactor docs * chore: bump model version * fix(capybara): add filename * fix(codeninja): add file name + llama model path * fix(default): add llama model path * fix(deepseek coder): add filename * fix(deepseek 33B): add filename * fix(dolphin mixtral): add filename * fix(llama2-chat): add filename * fix(llama2-70B): add filename * fix(mistral 7b): add filename + model path * fix(bakllava): correct size model * fix(llava-7b): correct size model * fix(llava-13b): correct size model * fix(mixtral-8x7b): add file name + modelpath * fix(noramaid-7b): add file name + modelpath * fix(openchat-7b): add file name + modelpath * fix(openhermes-7b): add file name + modelpath * fix(phi2-3b): add file name + modelpath * fix(phind): add file name + modelpath * 
fix(solarslerp): add file name + modelpath * fix(starling): add file name + modelpath * fix(stealth): add file name + modelpath * fix(tinyllama): add file name + modelpath * fix(trinity): add file name + modelpath * fix(tulu): add file name + modelpath * fix(wizardcoder): add file name + modelpath * fix(yi): add file name + modelpath * update from source -> sources Signed-off-by: James --------- Signed-off-by: James Co-authored-by: hiro Co-authored-by: hahuyhoang411 Co-authored-by: James --- core/.prettierignore | 5 ++ core/src/node/api/common/builder.ts | 27 ++++---- core/src/types/model/modelEntity.ts | 9 ++- docs/docs/docs/03-engineering/models.md | 54 +++++++++------- .../04-using-models/02-import-manually.mdx | 20 +++--- .../03-integrate-with-remote-server.mdx | 20 ++++-- .../02-integrate-openrouter.mdx | 10 ++- .../03-integrate-azure-openai-service.mdx | 10 ++- docs/openapi/specs/models.yaml | 56 +++++++++++------ .../src/node/index.ts | 10 ++- extensions/model-extension/package.json | 2 +- extensions/model-extension/src/index.ts | 53 +++++++++++++--- models/bakllava-1/model.json | 33 ++++++++++ models/capybara-34b/model.json | 61 +++++++++--------- models/codeninja-1.0-7b/model.json | 60 +++++++++--------- models/config/default-model.json | 10 ++- models/deepseek-coder-1.3b/model.json | 61 +++++++++--------- models/deepseek-coder-34b/model.json | 61 +++++++++--------- models/dolphin-2.7-mixtral-8x7b/model.json | 60 ++++++++++-------- models/gpt-3.5-turbo-16k-0613/model.json | 34 +++++----- models/gpt-3.5-turbo/model.json | 34 +++++----- models/gpt-4/model.json | 34 +++++----- models/llama2-chat-70b-q4/model.json | 61 +++++++++--------- models/llama2-chat-7b-q4/model.json | 61 +++++++++--------- models/llava-1.5-13b-q5/model.json | 33 ++++++++++ models/llava-1.5-7b-q5/model.json | 33 ++++++++++ models/mistral-ins-7b-q4/model.json | 63 ++++++++++--------- models/mixtral-8x7b-instruct/model.json | 59 +++++++++-------- models/noromaid-7b/model.json | 61 +++++++++--------- models/openchat-3.5-7b/model.json | 60 ++++++++++-------- models/openhermes-neural-7b/model.json | 61 +++++++++--------- models/phi-2-3b/model.json | 61 +++++++++--------- models/phind-34b/model.json | 61 +++++++++--------- models/solar-10.7b-slerp/model.json | 60 +++++++++--------- models/starling-7b/model.json | 61 +++++++++--------- models/stealth-v1.2-7b/model.json | 63 ++++++++++--------- models/tinyllama-1.1b/model.json | 20 +++--- models/trinity-v1.2-7b/model.json | 61 +++++++++--------- models/tulu-2-70b/model.json | 59 +++++++++-------- models/wizardcoder-13b/model.json | 61 +++++++++--------- models/yarn-mistral-7b/model.json | 58 ++++++++--------- models/yi-34b/model.json | 61 +++++++++--------- web/containers/Providers/EventListener.tsx | 1 + web/hooks/useDownloadModel.ts | 20 ++++++ web/hooks/useGetConfiguredModels.ts | 4 +- web/hooks/useGetDownloadedModels.ts | 5 +- web/hooks/useRecommendedModel.ts | 1 + web/hooks/useSettings.ts | 1 + web/package.json | 2 +- .../ExploreModelItemHeader/index.tsx | 10 ++- web/types/downloadState.d.ts | 2 + web/utils/model.ts | 2 +- web/utils/modelParam.ts | 2 + 53 files changed, 1117 insertions(+), 775 deletions(-) create mode 100644 core/.prettierignore create mode 100644 models/bakllava-1/model.json create mode 100644 models/llava-1.5-13b-q5/model.json create mode 100644 models/llava-1.5-7b-q5/model.json diff --git a/core/.prettierignore b/core/.prettierignore new file mode 100644 index 000000000..02d9145c1 --- /dev/null +++ b/core/.prettierignore @@ -0,0 +1,5 @@ +.next/ 
+node_modules/ +dist/ +*.hbs +*.mdx \ No newline at end of file diff --git a/core/src/node/api/common/builder.ts b/core/src/node/api/common/builder.ts index 14946f415..a9819bce6 100644 --- a/core/src/node/api/common/builder.ts +++ b/core/src/node/api/common/builder.ts @@ -265,19 +265,22 @@ export const downloadModel = async ( const modelBinaryPath = join(directoryPath, modelId) const request = require('request') - const rq = request({ url: model.source_url, strictSSL, proxy }) const progress = require('request-progress') - progress(rq, {}) - .on('progress', function (state: any) { - console.log('progress', JSON.stringify(state, null, 2)) - }) - .on('error', function (err: Error) { - console.error('error', err) - }) - .on('end', function () { - console.log('end') - }) - .pipe(fs.createWriteStream(modelBinaryPath)) + + for (const source of model.sources) { + const rq = request({ url: source, strictSSL, proxy }) + progress(rq, {}) + .on('progress', function (state: any) { + console.debug('progress', JSON.stringify(state, null, 2)) + }) + .on('error', function (err: Error) { + console.error('error', err) + }) + .on('end', function () { + console.debug('end') + }) + .pipe(fs.createWriteStream(modelBinaryPath)) + } return { message: `Starting download ${modelId}`, diff --git a/core/src/types/model/modelEntity.ts b/core/src/types/model/modelEntity.ts index 80adc9e96..c60ab7650 100644 --- a/core/src/types/model/modelEntity.ts +++ b/core/src/types/model/modelEntity.ts @@ -21,6 +21,11 @@ export enum InferenceEngine { hf_endpoint = 'hf_endpoint', } +export type ModelArtifact = { + filename: string + url: string +} + /** * Model type defines the shape of a model object. * @stored @@ -45,7 +50,7 @@ export type Model = { /** * The model download source. It can be an external url or a local filepath. */ - source_url: string + sources: ModelArtifact[] /** * The model identifier, which can be referenced in the API endpoints. @@ -107,6 +112,8 @@ export type ModelSettingParams = { system_prompt?: string ai_prompt?: string user_prompt?: string + llama_model_path?: string + mmproj?: string } /** diff --git a/docs/docs/docs/03-engineering/models.md b/docs/docs/docs/03-engineering/models.md index cb0b44f41..4e4c3c604 100644 --- a/docs/docs/docs/03-engineering/models.md +++ b/docs/docs/docs/03-engineering/models.md @@ -56,7 +56,6 @@ jan/ # Jan root folder - Each `model` folder contains a `model.json` file, which is a representation of a model. - `model.json` contains metadata and default parameters used to run a model. -- The only required field is `source_url`. ### Example @@ -64,36 +63,43 @@ Here's a standard example `model.json` for a GGUF model. 
```js { -"id": "zephyr-7b", // Defaults to foldername -"object": "model", // Defaults to "model" -"source_url": "https://huggingface.co/TheBloke/zephyr-7B-beta-GGUF/blob/main/zephyr-7b-beta.Q4_K_M.gguf", -"name": "Zephyr 7B", // Defaults to foldername -"owned_by": "you", // Defaults to "you" -"version": "1", // Defaults to 1 -"created": 1231231, // Defaults to file creation time -"description": null, // Defaults to null -"state": enum[null, "ready"] -"format": "ggufv3", // Defaults to "ggufv3" -"engine": "nitro", // engine_id specified in jan/engine folder -"engine_parameters": { // Engine parameters inside model.json can override - "ctx_len": 2048, // the value inside the base engine.json + "id": "zephyr-7b", // Defaults to foldername + "object": "model", // Defaults to "model" + "sources": [ + { + "filename": "zephyr-7b-beta.Q4_K_M.gguf", + "url": "https://huggingface.co/TheBloke/zephyr-7B-beta-GGUF/blob/main/zephyr-7b-beta.Q4_K_M.gguf" + } + ], + "name": "Zephyr 7B", // Defaults to foldername + "owned_by": "you", // Defaults to "you" + "version": "1", // Defaults to 1 + "created": 1231231, // Defaults to file creation time + "description": null, // Defaults to null + "format": "ggufv3", // Defaults to "ggufv3" + "engine": "nitro", // engine_id specified in jan/engine folder + "engine_parameters": { + // Engine parameters inside model.json can override + "ctx_len": 4096, // the value inside the base engine.json "ngl": 100, "embedding": true, - "n_parallel": 4, -}, -"model_parameters": { // Models are called parameters + "n_parallel": 4 + }, + "model_parameters": { + // Models are called parameters "stream": true, - "max_tokens": 2048, - "stop": [""], // This usually can be left blank, only used with specific need from model author + "max_tokens": 4096, + "stop": [""], // This usually can be left blank, only used with specific need from model author "frequency_penalty": 0, "presence_penalty": 0, "temperature": 0.7, "top_p": 0.95 -}, -"metadata": {}, // Defaults to {} -"assets": [ // Defaults to current dir - "file://.../zephyr-7b-q4_k_m.bin", -] + }, + "metadata": {}, // Defaults to {} + "assets": [ + // Defaults to current dir + "file://.../zephyr-7b-q4_k_m.bin" + ] } ``` diff --git a/docs/docs/guides/04-using-models/02-import-manually.mdx b/docs/docs/guides/04-using-models/02-import-manually.mdx index f5ecb5259..68142a8af 100644 --- a/docs/docs/guides/04-using-models/02-import-manually.mdx +++ b/docs/docs/guides/04-using-models/02-import-manually.mdx @@ -31,7 +31,6 @@ In this section, we will show you how to import a GGUF model from [HuggingFace]( ## Manually Importing a Downloaded Model (nightly versions and v0.4.4+) - ### 1. Create a Model Folder Navigate to the `~/jan/models` folder. You can find this folder by going to `App Settings` > `Advanced` > `Open App Directory`. @@ -92,7 +91,7 @@ Drag and drop your model binary into this folder, ensuring the `modelname.gguf` #### 3. Voila -If your model doesn't show up in the Model Selector in conversations, please restart the app. +If your model doesn't show up in the Model Selector in conversations, please restart the app. If that doesn't work, please feel free to join our [Discord community](https://discord.gg/Dt7MxDyNNZ) for support, updates, and discussions. @@ -190,14 +189,18 @@ Edit `model.json` and include the following configurations: - Ensure the filename must be `model.json`. - Ensure the `id` property matches the folder name you created. - Ensure the GGUF filename should match the `id` property exactly. 
-- Ensure the `source_url` property is the direct binary download link ending in `.gguf`. In HuggingFace, you can find the direct links in the `Files and versions` tab. +- Ensure the `source.url` property is the direct binary download link ending in `.gguf`. In HuggingFace, you can find the direct links in the `Files and versions` tab. - Ensure you are using the correct `prompt_template`. This is usually provided in the HuggingFace model's description page. -- Ensure the `state` property is set to `ready`. ```json title="model.json" { // highlight-start - "source_url": "https://huggingface.co/janhq/trinity-v1-GGUF/resolve/main/trinity-v1.Q4_K_M.gguf", + "sources": [ + { + "filename": "trinity-v1.Q4_K_M.gguf", + "url": "https://huggingface.co/janhq/trinity-v1-GGUF/resolve/main/trinity-v1.Q4_K_M.gguf" + } + ], "id": "trinity-v1-7b", // highlight-end "object": "model", @@ -208,7 +211,8 @@ Edit `model.json` and include the following configurations: "settings": { "ctx_len": 4096, // highlight-next-line - "prompt_template": "{system_message}\n### Instruction:\n{prompt}\n### Response:" + "prompt_template": "{system_message}\n### Instruction:\n{prompt}\n### Response:", + "llama_model_path": "trinity-v1.Q4_K_M.gguf" }, "parameters": { "max_tokens": 4096 @@ -218,9 +222,7 @@ Edit `model.json` and include the following configurations: "tags": ["7B", "Merged"], "size": 4370000000 }, - "engine": "nitro", - // highlight-next-line - "state": "ready" + "engine": "nitro" } ``` diff --git a/docs/docs/guides/04-using-models/03-integrate-with-remote-server.mdx b/docs/docs/guides/04-using-models/03-integrate-with-remote-server.mdx index 3ed15bc9f..533797fca 100644 --- a/docs/docs/guides/04-using-models/03-integrate-with-remote-server.mdx +++ b/docs/docs/guides/04-using-models/03-integrate-with-remote-server.mdx @@ -40,7 +40,12 @@ Navigate to the `~/jan/models` folder. Create a folder named `gpt-3.5-turbo-16k` ```json title="~/jan/models/gpt-3.5-turbo-16k/model.json" { - "source_url": "https://openai.com", + "sources": [ + { + "filename": "openai", + "url": "https://openai.com" + } + ], // highlight-next-line "id": "gpt-3.5-turbo-16k", "object": "model", @@ -55,8 +60,7 @@ Navigate to the `~/jan/models` folder. Create a folder named `gpt-3.5-turbo-16k` "author": "OpenAI", "tags": ["General", "Big Context Length"] }, - "engine": "openai", - "state": "ready" + "engine": "openai" // highlight-end } ``` @@ -118,7 +122,12 @@ Navigate to the `~/jan/models` folder. Create a folder named `mistral-ins-7b-q4` ```json title="~/jan/models/mistral-ins-7b-q4/model.json" { - "source_url": "https://jan.ai", + "sources": [ + { + "filename": "janai", + "url": "https://jan.ai" + } + ], // highlight-next-line "id": "mistral-ins-7b-q4", "object": "model", @@ -134,8 +143,7 @@ Navigate to the `~/jan/models` folder. Create a folder named `mistral-ins-7b-q4` "tags": ["remote", "awesome"] }, // highlight-start - "engine": "openai", - "state": "ready" + "engine": "openai" // highlight-end } ``` diff --git a/docs/docs/guides/07-integrations/02-integrate-openrouter.mdx b/docs/docs/guides/07-integrations/02-integrate-openrouter.mdx index 8623a1a4a..e0db0e336 100644 --- a/docs/docs/guides/07-integrations/02-integrate-openrouter.mdx +++ b/docs/docs/guides/07-integrations/02-integrate-openrouter.mdx @@ -49,7 +49,12 @@ Navigate to the `~/jan/models` folder. 
Create a folder named ` 1) { + // path to model binaries + for (const source of model.sources) { + let path = this.extractFileName(source.url) + if (source.filename) { + path = await joinPath([modelDirPath, source.filename]) + } + + downloadFile(source.url, path, network) + } + } else { + const fileName = this.extractFileName(model.sources[0]?.url) + const path = await joinPath([modelDirPath, fileName]) + downloadFile(model.sources[0]?.url, path, network) + } + } + + /** + * try to retrieve the download file name from the source url + */ + private extractFileName(url: string): string { + const extractedFileName = url.split('/').pop() const fileName = extractedFileName .toLowerCase() .endsWith(JanModelExtension._supportedModelFormat) ? extractedFileName - : model.id - const path = await joinPath([modelDirPath, fileName]) - downloadFile(model.source_url, path, network) + : extractedFileName + JanModelExtension._supportedModelFormat + return fileName } /** @@ -98,6 +116,7 @@ export default class JanModelExtension extends ModelExtension { * @returns {Promise} A promise that resolves when the download has been cancelled. */ async cancelModelDownload(modelId: string): Promise { + const model = await this.getConfiguredModels() return abortDownload( await joinPath([JanModelExtension._homeDir, modelId, modelId]) ).then(async () => { @@ -163,15 +182,16 @@ export default class JanModelExtension extends ModelExtension { .then((files: string[]) => { // or model binary exists in the directory // model binary name can match model ID or be a .gguf file and not be an incompleted model file + // TODO: Check diff between urls, filenames return ( files.includes(modelDir) || - files.some( + files.filter( (file) => file .toLowerCase() .includes(JanModelExtension._supportedModelFormat) && !file.endsWith(JanModelExtension._incompletedModelFileName) - ) + )?.length >= model.sources.length ) }) } @@ -198,7 +218,6 @@ export default class JanModelExtension extends ModelExtension { const readJsonPromises = allDirectories.map(async (dirName) => { // filter out directories that don't match the selector - // read model.json const jsonPath = await joinPath([ JanModelExtension._homeDir, @@ -226,7 +245,21 @@ export default class JanModelExtension extends ModelExtension { const modelData = results.map((result) => { if (result.status === 'fulfilled') { try { - return result.value as Model + // This to ensure backward compatibility with `model.json` with `source_url` + const tmpModel = + typeof result.value === 'object' + ? 
result.value + : JSON.parse(result.value) + if (tmpModel['source_url'] != null) { + tmpModel['source'] = [ + { + filename: tmpModel.id, + url: tmpModel['source_url'], + }, + ] + } + + return tmpModel as Model } catch { console.debug(`Unable to parse model metadata: ${result.value}`) return undefined diff --git a/models/bakllava-1/model.json b/models/bakllava-1/model.json new file mode 100644 index 000000000..91f6f4136 --- /dev/null +++ b/models/bakllava-1/model.json @@ -0,0 +1,33 @@ +{ + "sources": [ + { + "filename": "ggml-model-q5_k.gguf", + "url": "https://huggingface.co/mys/ggml_bakllava-1/resolve/main/ggml-model-q5_k.gguf" + }, + { + "filename": "mmproj-model-f16.gguf", + "url": "https://huggingface.co/mys/ggml_bakllava-1/resolve/main/mmproj-model-f16.gguf" + } + ], + "id": "bakllava-1", + "object": "model", + "name": "BakLlava 1", + "version": "1.0", + "description": "BakLlava 1 can bring vision understanding to Jan", + "format": "gguf", + "settings": { + "ctx_len": 4096, + "prompt_template": "\n### Instruction:\n{prompt}\n### Response:\n", + "llama_model_path": "ggml-model-q5_k.gguf", + "mmproj": "mmproj-model-f16.gguf" + }, + "parameters": { + "max_tokens": 4096 + }, + "metadata": { + "author": "Mys", + "tags": ["Vision"], + "size": 5750000000 + }, + "engine": "nitro" +} diff --git a/models/capybara-34b/model.json b/models/capybara-34b/model.json index ffca28c6d..af029bbb0 100644 --- a/models/capybara-34b/model.json +++ b/models/capybara-34b/model.json @@ -1,29 +1,34 @@ { - "source_url": "https://huggingface.co/TheBloke/Nous-Capybara-34B-GGUF/resolve/main/nous-capybara-34b.Q5_K_M.gguf", - "id": "capybara-34b", - "object": "model", - "name": "Capybara 200k 34B Q5", - "version": "1.0", - "description": "Nous Capybara 34B is a long context length model that supports 200K tokens.", - "format": "gguf", - "settings": { - "ctx_len": 4096, - "prompt_template": "USER:\n{prompt}\nASSISTANT:" - }, - "parameters": { - "temperature": 0.7, - "top_p": 0.95, - "stream": true, - "max_tokens": 4096, - "stop": [], - "frequency_penalty": 0, - "presence_penalty": 0 - }, - "metadata": { - "author": "NousResearch, The Bloke", - "tags": ["34B", "Finetuned"], - "size": 24320000000 - }, - "engine": "nitro" - } - \ No newline at end of file + "sources": [ + { + "filename": "nous-capybara-34b.Q5_K_M.gguf", + "url": "https://huggingface.co/TheBloke/Nous-Capybara-34B-GGUF/resolve/main/nous-capybara-34b.Q5_K_M.gguf" + } + ], + "id": "capybara-34b", + "object": "model", + "name": "Capybara 200k 34B Q5", + "version": "1.0", + "description": "Nous Capybara 34B is a long context length model that supports 200K tokens.", + "format": "gguf", + "settings": { + "ctx_len": 4096, + "prompt_template": "USER:\n{prompt}\nASSISTANT:", + "llama_model_path": "nous-capybara-34b.Q5_K_M.gguf" + }, + "parameters": { + "temperature": 0.7, + "top_p": 0.95, + "stream": true, + "max_tokens": 4096, + "stop": [], + "frequency_penalty": 0, + "presence_penalty": 0 + }, + "metadata": { + "author": "NousResearch, The Bloke", + "tags": ["34B", "Finetuned"], + "size": 24320000000 + }, + "engine": "nitro" +} diff --git a/models/codeninja-1.0-7b/model.json b/models/codeninja-1.0-7b/model.json index 98fbac5df..4ffe355d1 100644 --- a/models/codeninja-1.0-7b/model.json +++ b/models/codeninja-1.0-7b/model.json @@ -1,29 +1,33 @@ { - "source_url": "https://huggingface.co/beowolx/CodeNinja-1.0-OpenChat-7B-GGUF/resolve/main/codeninja-1.0-openchat-7b.Q4_K_M.gguf", - "id": "codeninja-1.0-7b", - "object": "model", - "name": "CodeNinja 7B Q4", - "version": 
"1.0", - "description": "CodeNinja is good for coding tasks and can handle various languages including Python, C, C++, Rust, Java, JavaScript, and more.", - "format": "gguf", - "settings": { - "ctx_len": 4096, - "prompt_template": "GPT4 Correct User: {prompt}<|end_of_turn|>GPT4 Correct Assistant:" - }, - "parameters": { - "temperature": 0.7, - "top_p": 0.95, - "stream": true, - "max_tokens": 4096, - "stop": ["<|end_of_turn|>"], - "frequency_penalty": 0, - "presence_penalty": 0 - }, - "metadata": { - "author": "Beowolx", - "tags": ["7B", "Finetuned"], - "size": 4370000000 - }, - "engine": "nitro" - } - \ No newline at end of file + "sources": [ + { + "filename": "codeninja-1.0-openchat-7b.Q4_K_M.gguf", + "url": "https://huggingface.co/beowolx/CodeNinja-1.0-OpenChat-7B-GGUF/resolve/main/codeninja-1.0-openchat-7b.Q4_K_M.gguf" + } + ], + "id": "codeninja-1.0-7b", + "object": "model", + "name": "CodeNinja 7B Q4", + "version": "1.0", + "description": "CodeNinja is good for coding tasks and can handle various languages including Python, C, C++, Rust, Java, JavaScript, and more.", + "format": "gguf", + "settings": { + "ctx_len": 4096, + "prompt_template": "GPT4 Correct User: {prompt}<|end_of_turn|>GPT4 Correct Assistant:", + "llama_model_path": "codeninja-1.0-openchat-7b.Q4_K_M.gguf" + }, + "parameters": { + "temperature": 0.7, + "top_p": 0.95, + "stream": true, + "max_tokens": 4096, + "frequency_penalty": 0, + "presence_penalty": 0 + }, + "metadata": { + "author": "Beowolx", + "tags": ["7B", "Finetuned"], + "size": 4370000000 + }, + "engine": "nitro" +} diff --git a/models/config/default-model.json b/models/config/default-model.json index 2263625f4..2fa2df2ee 100644 --- a/models/config/default-model.json +++ b/models/config/default-model.json @@ -2,7 +2,12 @@ "object": "model", "version": 1, "format": "gguf", - "source_url": "N/A", + "sources": [ + { + "url": "N/A", + "filename": "N/A" + } + ], "id": "N/A", "name": "N/A", "created": 0, @@ -10,7 +15,8 @@ "settings": { "ctx_len": 4096, "embedding": false, - "prompt_template": "{system_message}\n### Instruction: {prompt}\n### Response:" + "prompt_template": "{system_message}\n### Instruction: {prompt}\n### Response:", + "llama_model_path": "N/A" }, "parameters": { "temperature": 0.7, diff --git a/models/deepseek-coder-1.3b/model.json b/models/deepseek-coder-1.3b/model.json index 8c454802f..365dbfd2f 100644 --- a/models/deepseek-coder-1.3b/model.json +++ b/models/deepseek-coder-1.3b/model.json @@ -1,29 +1,34 @@ - { - "source_url": "https://huggingface.co/TheBloke/deepseek-coder-1.3b-instruct-GGUF/resolve/main/deepseek-coder-1.3b-instruct.Q8_0.gguf", - "id": "deepseek-coder-1.3b", - "object": "model", - "name": "Deepseek Coder 1.3B Q8", - "version": "1.0", - "description": "Deepseek Coder excelled in project-level code completion with advanced capabilities across multiple programming languages.", - "format": "gguf", - "settings": { - "ctx_len": 4096, - "prompt_template": "### Instruction:\n{prompt}\n### Response:" - }, - "parameters": { - "temperature": 0.7, - "top_p": 0.95, - "stream": true, - "max_tokens": 4096, - "stop": [], - "frequency_penalty": 0, - "presence_penalty": 0 - }, - "metadata": { - "author": "Deepseek, The Bloke", - "tags": ["Tiny", "Foundational Model"], - "size": 1430000000 - }, - "engine": "nitro" - } + "sources": [ + { + "filename": "deepseek-coder-1.3b-instruct.Q8_0.gguf", + "url": "https://huggingface.co/TheBloke/deepseek-coder-1.3b-instruct-GGUF/resolve/main/deepseek-coder-1.3b-instruct.Q8_0.gguf" + } + ], + "id": 
"deepseek-coder-1.3b", + "object": "model", + "name": "Deepseek Coder 1.3B Q8", + "version": "1.0", + "description": "Deepseek Coder excelled in project-level code completion with advanced capabilities across multiple programming languages.", + "format": "gguf", + "settings": { + "ctx_len": 4096, + "prompt_template": "### Instruction:\n{prompt}\n### Response:", + "llama_model_path": "deepseek-coder-1.3b-instruct.Q8_0.gguf" + }, + "parameters": { + "temperature": 0.7, + "top_p": 0.95, + "stream": true, + "max_tokens": 4096, + "stop": [], + "frequency_penalty": 0, + "presence_penalty": 0 + }, + "metadata": { + "author": "Deepseek, The Bloke", + "tags": ["Tiny", "Foundational Model"], + "size": 1430000000 + }, + "engine": "nitro" +} diff --git a/models/deepseek-coder-34b/model.json b/models/deepseek-coder-34b/model.json index 905a66033..8e17b9563 100644 --- a/models/deepseek-coder-34b/model.json +++ b/models/deepseek-coder-34b/model.json @@ -1,29 +1,34 @@ { - "source_url": "https://huggingface.co/TheBloke/deepseek-coder-33B-instruct-GGUF/resolve/main/deepseek-coder-33b-instruct.Q5_K_M.gguf", - "id": "deepseek-coder-34b", - "object": "model", - "name": "Deepseek Coder 33B Q5", - "version": "1.0", - "description": "Deepseek Coder excelled in project-level code completion with advanced capabilities across multiple programming languages.", - "format": "gguf", - "settings": { - "ctx_len": 4096, - "prompt_template": "### Instruction:\n{prompt}\n### Response:" - }, - "parameters": { - "temperature": 0.7, - "top_p": 0.95, - "stream": true, - "max_tokens": 4096, - "stop": [], - "frequency_penalty": 0, - "presence_penalty": 0 - }, - "metadata": { - "author": "Deepseek, The Bloke", - "tags": ["34B", "Foundational Model"], - "size": 19940000000 - }, - "engine": "nitro" - } - \ No newline at end of file + "sources": [ + { + "filename": "deepseek-coder-33b-instruct.Q5_K_M.gguf", + "url": "https://huggingface.co/TheBloke/deepseek-coder-33B-instruct-GGUF/resolve/main/deepseek-coder-33b-instruct.Q5_K_M.gguf" + } + ], + "id": "deepseek-coder-34b", + "object": "model", + "name": "Deepseek Coder 33B Q5", + "version": "1.0", + "description": "Deepseek Coder excelled in project-level code completion with advanced capabilities across multiple programming languages.", + "format": "gguf", + "settings": { + "ctx_len": 4096, + "prompt_template": "### Instruction:\n{prompt}\n### Response:", + "llama_model_path": "deepseek-coder-33b-instruct.Q5_K_M.gguf" + }, + "parameters": { + "temperature": 0.7, + "top_p": 0.95, + "stream": true, + "max_tokens": 4096, + "stop": [], + "frequency_penalty": 0, + "presence_penalty": 0 + }, + "metadata": { + "author": "Deepseek, The Bloke", + "tags": ["34B", "Foundational Model"], + "size": 19940000000 + }, + "engine": "nitro" +} diff --git a/models/dolphin-2.7-mixtral-8x7b/model.json b/models/dolphin-2.7-mixtral-8x7b/model.json index 67bc6737c..7df4fbfbd 100644 --- a/models/dolphin-2.7-mixtral-8x7b/model.json +++ b/models/dolphin-2.7-mixtral-8x7b/model.json @@ -1,28 +1,34 @@ { - "source_url": "https://huggingface.co/TheBloke/dolphin-2.7-mixtral-8x7b-GGUF/resolve/main/dolphin-2.7-mixtral-8x7b.Q4_K_M.gguf", - "id": "dolphin-2.7-mixtral-8x7b", - "object": "model", - "name": "Dolphin 8x7B Q4", - "version": "1.0", - "description": "Dolphin is an uncensored model built on Mixtral-8x7b. 
It is good at programming tasks.", - "format": "gguf", - "settings": { - "ctx_len": 4096, - "prompt_template": "<|im_start|>system\n{system_message}<|im_end|>\n<|im_start|>user\n{prompt}<|im_end|>\n<|im_start|>assistant" - }, - "parameters": { - "temperature": 0.7, - "top_p": 0.95, - "stream": true, - "max_tokens": 4096, - "stop": [], - "frequency_penalty": 0, - "presence_penalty": 0 - }, - "metadata": { - "author": "Cognitive Computations, TheBloke", - "tags": ["70B", "Finetuned"], - "size": 26440000000 - }, - "engine": "nitro" - } + "sources": [ + { + "filename": "dolphin-2.7-mixtral-8x7b.Q4_K_M.gguf", + "url": "https://huggingface.co/TheBloke/dolphin-2.7-mixtral-8x7b-GGUF/resolve/main/dolphin-2.7-mixtral-8x7b.Q4_K_M.gguf" + } + ], + "id": "dolphin-2.7-mixtral-8x7b", + "object": "model", + "name": "Dolphin 8x7B Q4", + "version": "1.0", + "description": "Dolphin is an uncensored model built on Mixtral-8x7b. It is good at programming tasks.", + "format": "gguf", + "settings": { + "ctx_len": 4096, + "prompt_template": "<|im_start|>system\n{system_message}<|im_end|>\n<|im_start|>user\n{prompt}<|im_end|>\n<|im_start|>assistant", + "llama_model_path": "dolphin-2.7-mixtral-8x7b.Q4_K_M.gguf" + }, + "parameters": { + "temperature": 0.7, + "top_p": 0.95, + "stream": true, + "max_tokens": 4096, + "stop": [], + "frequency_penalty": 0, + "presence_penalty": 0 + }, + "metadata": { + "author": "Cognitive Computations, TheBloke", + "tags": ["70B", "Finetuned"], + "size": 26440000000 + }, + "engine": "nitro" +} diff --git a/models/gpt-3.5-turbo-16k-0613/model.json b/models/gpt-3.5-turbo-16k-0613/model.json index 0df4119a5..aa57e1154 100644 --- a/models/gpt-3.5-turbo-16k-0613/model.json +++ b/models/gpt-3.5-turbo-16k-0613/model.json @@ -1,18 +1,20 @@ { - "source_url": "https://openai.com", - "id": "gpt-3.5-turbo-16k-0613", - "object": "model", - "name": "OpenAI GPT 3.5 Turbo 16k 0613", - "version": "1.0", - "description": "OpenAI GPT 3.5 Turbo 16k 0613 model is extremely good", - "format": "api", - "settings": {}, - "parameters": {}, - "metadata": { - "author": "OpenAI", - "tags": ["General", "Big Context Length"] - }, - "engine": "openai", - "state": "ready" + "sources": [ + { + "url": "https://openai.com" + } + ], + "id": "gpt-3.5-turbo-16k-0613", + "object": "model", + "name": "OpenAI GPT 3.5 Turbo 16k 0613", + "version": "1.0", + "description": "OpenAI GPT 3.5 Turbo 16k 0613 model is extremely good", + "format": "api", + "settings": {}, + "parameters": {}, + "metadata": { + "author": "OpenAI", + "tags": ["General", "Big Context Length"] + }, + "engine": "openai" } - \ No newline at end of file diff --git a/models/gpt-3.5-turbo/model.json b/models/gpt-3.5-turbo/model.json index a7dbf3d4e..617f0d056 100644 --- a/models/gpt-3.5-turbo/model.json +++ b/models/gpt-3.5-turbo/model.json @@ -1,18 +1,20 @@ { - "source_url": "https://openai.com", - "id": "gpt-3.5-turbo", - "object": "model", - "name": "OpenAI GPT 3.5 Turbo", - "version": "1.0", - "description": "OpenAI GPT 3.5 Turbo model is extremely good", - "format": "api", - "settings": {}, - "parameters": {}, - "metadata": { - "author": "OpenAI", - "tags": ["General", "Big Context Length"] - }, - "engine": "openai", - "state": "ready" + "sources": [ + { + "url": "https://openai.com" + } + ], + "id": "gpt-3.5-turbo", + "object": "model", + "name": "OpenAI GPT 3.5 Turbo", + "version": "1.0", + "description": "OpenAI GPT 3.5 Turbo model is extremely good", + "format": "api", + "settings": {}, + "parameters": {}, + "metadata": { + "author": "OpenAI", + "tags": 
["General", "Big Context Length"] + }, + "engine": "openai" } - \ No newline at end of file diff --git a/models/gpt-4/model.json b/models/gpt-4/model.json index 3f17e65cb..7aa2338e3 100644 --- a/models/gpt-4/model.json +++ b/models/gpt-4/model.json @@ -1,18 +1,20 @@ { - "source_url": "https://openai.com", - "id": "gpt-4", - "object": "model", - "name": "OpenAI GPT 4", - "version": "1.0", - "description": "OpenAI GPT 4 model is extremely good", - "format": "api", - "settings": {}, - "parameters": {}, - "metadata": { - "author": "OpenAI", - "tags": ["General", "Big Context Length"] - }, - "engine": "openai", - "state": "ready" + "sources": [ + { + "url": "https://openai.com" + } + ], + "id": "gpt-4", + "object": "model", + "name": "OpenAI GPT 4", + "version": "1.0", + "description": "OpenAI GPT 4 model is extremely good", + "format": "api", + "settings": {}, + "parameters": {}, + "metadata": { + "author": "OpenAI", + "tags": ["General", "Big Context Length"] + }, + "engine": "openai" } - \ No newline at end of file diff --git a/models/llama2-chat-70b-q4/model.json b/models/llama2-chat-70b-q4/model.json index 2595ab677..2459e426f 100644 --- a/models/llama2-chat-70b-q4/model.json +++ b/models/llama2-chat-70b-q4/model.json @@ -1,29 +1,34 @@ { - "source_url": "https://huggingface.co/TheBloke/Llama-2-70B-Chat-GGUF/resolve/main/llama-2-70b-chat.Q4_K_M.gguf", - "id": "llama2-chat-70b-q4", - "object": "model", - "name": "Llama 2 Chat 70B Q4", - "version": "1.0", - "description": "Llama 2 Chat 7b model, specifically designed for a comprehensive understanding through training on extensive internet data.", - "format": "gguf", - "settings": { - "ctx_len": 4096, - "prompt_template": "[INST] <>\n{system_message}<>\n{prompt}[/INST]" - }, - "parameters": { - "temperature": 0.7, - "top_p": 0.95, - "stream": true, - "max_tokens": 4096, - "stop": [], - "frequency_penalty": 0, - "presence_penalty": 0 - }, - "metadata": { - "author": "MetaAI, The Bloke", - "tags": ["70B", "Foundational Model"], - "size": 43920000000 - }, - "engine": "nitro" - } - \ No newline at end of file + "sources": [ + { + "filename": "llama-2-70b-chat.Q4_K_M.gguf", + "url": "https://huggingface.co/TheBloke/Llama-2-70B-Chat-GGUF/resolve/main/llama-2-70b-chat.Q4_K_M.gguf" + } + ], + "id": "llama2-chat-70b-q4", + "object": "model", + "name": "Llama 2 Chat 70B Q4", + "version": "1.0", + "description": "Llama 2 Chat 7b model, specifically designed for a comprehensive understanding through training on extensive internet data.", + "format": "gguf", + "settings": { + "ctx_len": 4096, + "prompt_template": "[INST] <>\n{system_message}<>\n{prompt}[/INST]", + "llama_model_path": "llama-2-70b-chat.Q4_K_M.gguf" + }, + "parameters": { + "temperature": 0.7, + "top_p": 0.95, + "stream": true, + "max_tokens": 4096, + "stop": [], + "frequency_penalty": 0, + "presence_penalty": 0 + }, + "metadata": { + "author": "MetaAI, The Bloke", + "tags": ["70B", "Foundational Model"], + "size": 43920000000 + }, + "engine": "nitro" +} diff --git a/models/llama2-chat-7b-q4/model.json b/models/llama2-chat-7b-q4/model.json index 68eab3790..bc9847eef 100644 --- a/models/llama2-chat-7b-q4/model.json +++ b/models/llama2-chat-7b-q4/model.json @@ -1,29 +1,34 @@ { - "source_url": "https://huggingface.co/TheBloke/Llama-2-7B-Chat-GGUF/resolve/main/llama-2-7b-chat.Q4_K_M.gguf", - "id": "llama2-chat-7b-q4", - "object": "model", - "name": "Llama 2 Chat 7B Q4", - "version": "1.0", - "description": "Llama 2 Chat 7b model, specifically designed for a comprehensive understanding through 
training on extensive internet data.", - "format": "gguf", - "settings": { - "ctx_len": 4096, - "prompt_template": "[INST] <>\n{system_message}<>\n{prompt}[/INST]" - }, - "parameters": { - "temperature": 0.7, - "top_p": 0.95, - "stream": true, - "max_tokens": 4096, - "stop": [], - "frequency_penalty": 0, - "presence_penalty": 0 - }, - "metadata": { - "author": "MetaAI, The Bloke", - "tags": ["7B", "Foundational Model"], - "size": 4080000000 - }, - "engine": "nitro" - } - \ No newline at end of file + "sources": [ + { + "filename": "llama-2-7b-chat.Q4_K_M.gguf", + "url": "https://huggingface.co/TheBloke/Llama-2-7B-Chat-GGUF/resolve/main/llama-2-7b-chat.Q4_K_M.gguf" + } + ], + "id": "llama2-chat-7b-q4", + "object": "model", + "name": "Llama 2 Chat 7B Q4", + "version": "1.0", + "description": "Llama 2 Chat 7b model, specifically designed for a comprehensive understanding through training on extensive internet data.", + "format": "gguf", + "settings": { + "ctx_len": 4096, + "prompt_template": "[INST] <>\n{system_message}<>\n{prompt}[/INST]", + "llama_model_path": "llama-2-7b-chat.Q4_K_M.gguf" + }, + "parameters": { + "temperature": 0.7, + "top_p": 0.95, + "stream": true, + "max_tokens": 4096, + "stop": [], + "frequency_penalty": 0, + "presence_penalty": 0 + }, + "metadata": { + "author": "MetaAI, The Bloke", + "tags": ["7B", "Foundational Model"], + "size": 4080000000 + }, + "engine": "nitro" +} diff --git a/models/llava-1.5-13b-q5/model.json b/models/llava-1.5-13b-q5/model.json new file mode 100644 index 000000000..027b8398f --- /dev/null +++ b/models/llava-1.5-13b-q5/model.json @@ -0,0 +1,33 @@ +{ + "sources": [ + { + "filename": "ggml-model-q5_k.gguf", + "url": "https://huggingface.co/mys/ggml_llava-v1.5-13b/resolve/main/ggml-model-q5_k.gguf" + }, + { + "filename": "mmproj-model-f16.gguf", + "url": "https://huggingface.co/mys/ggml_llava-v1.5-13b/resolve/main/mmproj-model-f16.gguf" + } + ], + "id": "llava-1.5-13b-q5", + "object": "model", + "name": "LlaVa 1.5 13B Q5 K", + "version": "1.0", + "description": "LlaVa 1.5 can bring vision understanding to Jan", + "format": "gguf", + "settings": { + "ctx_len": 4096, + "prompt_template": "\n### Instruction:\n{prompt}\n### Response:\n", + "llama_model_path": "ggml-model-q5_k.gguf", + "mmproj": "mmproj-model-f16.gguf" + }, + "parameters": { + "max_tokens": 4096 + }, + "metadata": { + "author": "Mys", + "tags": ["Vision"], + "size": 9850000000 + }, + "engine": "nitro" +} diff --git a/models/llava-1.5-7b-q5/model.json b/models/llava-1.5-7b-q5/model.json new file mode 100644 index 000000000..658b98880 --- /dev/null +++ b/models/llava-1.5-7b-q5/model.json @@ -0,0 +1,33 @@ +{ + "sources": [ + { + "filename": "ggml-model-q5_k.gguf", + "url": "https://huggingface.co/mys/ggml_llava-v1.5-7b/resolve/main/ggml-model-q5_k.gguf" + }, + { + "filename": "mmproj-model-f16.gguf", + "url": "https://huggingface.co/mys/ggml_llava-v1.5-7b/resolve/main/mmproj-model-f16.gguf" + } + ], + "id": "llava-1.5-7b-q5", + "object": "model", + "name": "LlaVa 1.5 7B Q5 K", + "version": "1.0", + "description": "LlaVa 1.5 can bring vision understanding to Jan", + "format": "gguf", + "settings": { + "ctx_len": 4096, + "prompt_template": "\n### Instruction:\n{prompt}\n### Response:\n", + "llama_model_path": "ggml-model-q5_k.gguf", + "mmproj": "mmproj-model-f16.gguf" + }, + "parameters": { + "max_tokens": 4096 + }, + "metadata": { + "author": "Mys", + "tags": ["Vision"], + "size": 5400000000 + }, + "engine": "nitro" +} diff --git a/models/mistral-ins-7b-q4/model.json 
b/models/mistral-ins-7b-q4/model.json index 6db1aa35b..bfdaffa90 100644 --- a/models/mistral-ins-7b-q4/model.json +++ b/models/mistral-ins-7b-q4/model.json @@ -1,30 +1,35 @@ { - "source_url": "https://huggingface.co/TheBloke/Mistral-7B-Instruct-v0.2-GGUF/resolve/main/mistral-7b-instruct-v0.2.Q4_K_M.gguf", - "id": "mistral-ins-7b-q4", - "object": "model", - "name": "Mistral Instruct 7B Q4", - "version": "1.0", - "description": "Mistral Instruct 7b model, specifically designed for a comprehensive understanding through training on extensive internet data.", - "format": "gguf", - "settings": { - "ctx_len": 4096, - "prompt_template": "[INST] {prompt} [/INST]" - }, - "parameters": { - "temperature": 0.7, - "top_p": 0.95, - "stream": true, - "max_tokens": 4096, - "stop": [], - "frequency_penalty": 0, - "presence_penalty": 0 - }, - "metadata": { - "author": "MistralAI, The Bloke", - "tags": ["Featured", "7B", "Foundational Model"], - "size": 4370000000, - "cover": "https://raw.githubusercontent.com/janhq/jan/main/models/mistral-ins-7b-q4/cover.png" - }, - "engine": "nitro" - } - \ No newline at end of file + "sources": [ + { + "filename": "mistral-7b-instruct-v0.2.Q4_K_M.gguf", + "url": "https://huggingface.co/TheBloke/Mistral-7B-Instruct-v0.2-GGUF/resolve/main/mistral-7b-instruct-v0.2.Q4_K_M.gguf" + } + ], + "id": "mistral-ins-7b-q4", + "object": "model", + "name": "Mistral Instruct 7B Q4", + "version": "1.0", + "description": "Mistral Instruct 7b model, specifically designed for a comprehensive understanding through training on extensive internet data.", + "format": "gguf", + "settings": { + "ctx_len": 4096, + "prompt_template": "[INST] {prompt} [/INST]", + "llama_model_path": "mistral-7b-instruct-v0.2.Q4_K_M.gguf" + }, + "parameters": { + "temperature": 0.7, + "top_p": 0.95, + "stream": true, + "max_tokens": 4096, + "stop": [], + "frequency_penalty": 0, + "presence_penalty": 0 + }, + "metadata": { + "author": "MistralAI, The Bloke", + "tags": ["Featured", "7B", "Foundational Model"], + "size": 4370000000, + "cover": "https://raw.githubusercontent.com/janhq/jan/main/models/mistral-ins-7b-q4/cover.png" + }, + "engine": "nitro" +} diff --git a/models/mixtral-8x7b-instruct/model.json b/models/mixtral-8x7b-instruct/model.json index 31ff2838a..e0a0ee040 100644 --- a/models/mixtral-8x7b-instruct/model.json +++ b/models/mixtral-8x7b-instruct/model.json @@ -1,28 +1,33 @@ { - "source_url": "https://huggingface.co/TheBloke/Mixtral-8x7B-Instruct-v0.1-GGUF/resolve/main/mixtral-8x7b-instruct-v0.1.Q4_K_M.gguf", - "id": "mixtral-8x7b-instruct", - "object": "model", - "name": "Mixtral 8x7B Instruct Q4", - "version": "1.0", - "description": "The Mixtral-8x7B is a pretrained generative Sparse Mixture of Experts. 
The Mixtral-8x7B outperforms 70B models on most benchmarks.", - "format": "gguf", - "settings": { - "ctx_len": 4096, - "prompt_template": "[INST] {prompt} [/INST]" - }, - "parameters": { - "temperature": 0.7, - "top_p": 0.95, - "stream": true, - "max_tokens": 4096, - "stop": [], - "frequency_penalty": 0, - "presence_penalty": 0 - }, - "metadata": { - "author": "MistralAI, TheBloke", - "tags": ["70B", "Foundational Model"], - "size": 26440000000 - }, - "engine": "nitro" - } + "sources": [ + { + "filename": "mixtral-8x7b-instruct-v0.1.Q4_K_M.gguf", + "url": "https://huggingface.co/TheBloke/Mixtral-8x7B-Instruct-v0.1-GGUF/resolve/main/mixtral-8x7b-instruct-v0.1.Q4_K_M.gguf" + } + ], + "id": "mixtral-8x7b-instruct", + "object": "model", + "name": "Mixtral 8x7B Instruct Q4", + "version": "1.0", + "description": "The Mixtral-8x7B is a pretrained generative Sparse Mixture of Experts. The Mixtral-8x7B outperforms 70B models on most benchmarks.", + "format": "gguf", + "settings": { + "ctx_len": 4096, + "prompt_template": "[INST] {prompt} [/INST]", + "llama_model_path": "mixtral-8x7b-instruct-v0.1.Q4_K_M.gguf" + }, + "parameters": { + "temperature": 0.7, + "top_p": 0.95, + "stream": true, + "max_tokens": 4096, + "frequency_penalty": 0, + "presence_penalty": 0 + }, + "metadata": { + "author": "MistralAI, TheBloke", + "tags": ["70B", "Foundational Model"], + "size": 26440000000 + }, + "engine": "nitro" +} diff --git a/models/noromaid-7b/model.json b/models/noromaid-7b/model.json index fbb7858e1..78d579a64 100644 --- a/models/noromaid-7b/model.json +++ b/models/noromaid-7b/model.json @@ -1,29 +1,34 @@ { - "source_url": "https://huggingface.co/NeverSleep/Noromaid-7b-v0.1.1-GGUF/resolve/main/Noromaid-7b-v0.1.1.q5_k_m.gguf", - "id": "noromaid-7b", - "object": "model", - "name": "Noromaid 7B Q5", - "version": "1.0", - "description": "The Noromaid 7b model is designed for role-playing with human-like behavior.", - "format": "gguf", - "settings": { - "ctx_len": 4096, - "prompt_template": "### Instruction:{prompt}\n### Response:" - }, - "parameters": { - "temperature": 0.7, - "top_p": 0.95, - "stream": true, - "max_tokens": 4096, - "stop": [], - "frequency_penalty": 0, - "presence_penalty": 0 - }, - "metadata": { - "author": "NeverSleep", - "tags": ["7B", "Merged"], - "size": 4370000000 - }, - "engine": "nitro" - } - \ No newline at end of file + "sources": [ + { + "filename": "Noromaid-7b-v0.1.1.q5_k_m.gguf", + "url": "https://huggingface.co/NeverSleep/Noromaid-7b-v0.1.1-GGUF/resolve/main/Noromaid-7b-v0.1.1.q5_k_m.gguf" + } + ], + "id": "noromaid-7b", + "object": "model", + "name": "Noromaid 7B Q5", + "version": "1.0", + "description": "The Noromaid 7b model is designed for role-playing with human-like behavior.", + "format": "gguf", + "settings": { + "ctx_len": 4096, + "prompt_template": "### Instruction:{prompt}\n### Response:", + "llama_model_path": "Noromaid-7b-v0.1.1.q5_k_m.gguf" + }, + "parameters": { + "temperature": 0.7, + "top_p": 0.95, + "stream": true, + "max_tokens": 4096, + "stop": [], + "frequency_penalty": 0, + "presence_penalty": 0 + }, + "metadata": { + "author": "NeverSleep", + "tags": ["7B", "Merged"], + "size": 4370000000 + }, + "engine": "nitro" +} diff --git a/models/openchat-3.5-7b/model.json b/models/openchat-3.5-7b/model.json index e4b72f9c6..294f7d269 100644 --- a/models/openchat-3.5-7b/model.json +++ b/models/openchat-3.5-7b/model.json @@ -1,28 +1,34 @@ { - "source_url": "https://huggingface.co/TheBloke/openchat-3.5-1210-GGUF/resolve/main/openchat-3.5-1210.Q4_K_M.gguf", - "id": 
"openchat-3.5-7b", - "object": "model", - "name": "Openchat-3.5 7B Q4", - "version": "1.0", - "description": "The performance of this open-source model surpasses that of ChatGPT-3.5 and Grok-1 across various benchmarks.", - "format": "gguf", - "settings": { - "ctx_len": 4096, - "prompt_template": "GPT4 Correct User: {prompt}<|end_of_turn|>GPT4 Correct Assistant:" - }, - "parameters": { - "temperature": 0.7, - "top_p": 0.95, - "stream": true, - "max_tokens": 4096, - "stop": ["<|end_of_turn|>"], - "frequency_penalty": 0, - "presence_penalty": 0 - }, - "metadata": { - "author": "Openchat", - "tags": ["Recommended", "7B", "Finetuned"], - "size": 4370000000 - }, - "engine": "nitro" - } + "sources": [ + { + "filename": "openchat-3.5-1210.Q4_K_M.gguf", + "url": "https://huggingface.co/TheBloke/openchat-3.5-1210-GGUF/resolve/main/openchat-3.5-1210.Q4_K_M.gguf" + } + ], + "id": "openchat-3.5-7b", + "object": "model", + "name": "Openchat-3.5 7B Q4", + "version": "1.0", + "description": "The performance of this open-source model surpasses that of ChatGPT-3.5 and Grok-1 across various benchmarks.", + "format": "gguf", + "settings": { + "ctx_len": 4096, + "prompt_template": "GPT4 Correct User: {prompt}<|end_of_turn|>GPT4 Correct Assistant:", + "llama_model_path": "openchat-3.5-1210.Q4_K_M.gguf" + }, + "parameters": { + "temperature": 0.7, + "top_p": 0.95, + "stream": true, + "max_tokens": 4096, + "stop": ["<|end_of_turn|>"], + "frequency_penalty": 0, + "presence_penalty": 0 + }, + "metadata": { + "author": "Openchat", + "tags": ["Recommended", "7B", "Finetuned"], + "size": 4370000000 + }, + "engine": "nitro" +} diff --git a/models/openhermes-neural-7b/model.json b/models/openhermes-neural-7b/model.json index ca3e88502..87e1df143 100644 --- a/models/openhermes-neural-7b/model.json +++ b/models/openhermes-neural-7b/model.json @@ -1,29 +1,34 @@ { - "source_url": "https://huggingface.co/janhq/openhermes-2.5-neural-chat-v3-3-slerp-GGUF/resolve/main/openhermes-2.5-neural-chat-v3-3-slerp.Q4_K_M.gguf", - "id": "openhermes-neural-7b", - "object": "model", - "name": "OpenHermes Neural 7B Q4", - "version": "1.0", - "description": "OpenHermes Neural is a merged model using the TIES method. It performs well in various benchmarks.", - "format": "gguf", - "settings": { - "ctx_len": 4096, - "prompt_template": "<|im_start|>system\n{system_message}<|im_end|>\n<|im_start|>user\n{prompt}<|im_end|>\n<|im_start|>assistant" - }, - "parameters": { - "temperature": 0.7, - "top_p": 0.95, - "stream": true, - "max_tokens": 4096, - "stop": [], - "frequency_penalty": 0, - "presence_penalty": 0 - }, - "metadata": { - "author": "Intel, Jan", - "tags": ["7B", "Merged", "Featured"], - "size": 4370000000, - "cover": "https://raw.githubusercontent.com/janhq/jan/main/models/openhermes-neural-7b/cover.png" - }, - "engine": "nitro" - } + "sources": [ + { + "filename": "openhermes-2.5-neural-chat-v3-3-slerp.Q4_K_M.gguf", + "url": "https://huggingface.co/janhq/openhermes-2.5-neural-chat-v3-3-slerp-GGUF/resolve/main/openhermes-2.5-neural-chat-v3-3-slerp.Q4_K_M.gguf" + } + ], + "id": "openhermes-neural-7b", + "object": "model", + "name": "OpenHermes Neural 7B Q4", + "version": "1.0", + "description": "OpenHermes Neural is a merged model using the TIES method. 
It performs well in various benchmarks.", + "format": "gguf", + "settings": { + "ctx_len": 4096, + "prompt_template": "<|im_start|>system\n{system_message}<|im_end|>\n<|im_start|>user\n{prompt}<|im_end|>\n<|im_start|>assistant", + "llama_model_path": "openhermes-2.5-neural-chat-v3-3-slerp.Q4_K_M.gguf" + }, + "parameters": { + "temperature": 0.7, + "top_p": 0.95, + "stream": true, + "max_tokens": 4096, + "frequency_penalty": 0, + "presence_penalty": 0 + }, + "metadata": { + "author": "Intel, Jan", + "tags": ["7B", "Merged", "Featured"], + "size": 4370000000, + "cover": "https://raw.githubusercontent.com/janhq/jan/main/models/openhermes-neural-7b/cover.png" + }, + "engine": "nitro" +} diff --git a/models/phi-2-3b/model.json b/models/phi-2-3b/model.json index 97ff369e7..e452fdb55 100644 --- a/models/phi-2-3b/model.json +++ b/models/phi-2-3b/model.json @@ -1,29 +1,34 @@ { - "source_url": "https://huggingface.co/TheBloke/phi-2-GGUF/resolve/main/phi-2.Q8_0.gguf", - "id": "phi-2-3b", - "object": "model", - "name": "Phi-2 3B Q8", - "version": "1.0", - "description": "Phi-2 is a 2.7B model, excelling in common sense and logical reasoning benchmarks, trained with synthetic texts and filtered websites.", - "format": "gguf", - "settings": { - "ctx_len": 4096, - "prompt_template": "Intruct:\n{prompt}\nOutput:" - }, - "parameters": { - "temperature": 0.7, - "top_p": 0.95, - "stream": true, - "max_tokens": 4096, - "stop": [], - "frequency_penalty": 0, - "presence_penalty": 0 - }, - "metadata": { - "author": "Microsoft", - "tags": ["3B","Foundational Model"], - "size": 2960000000 - }, - "engine": "nitro" - } - \ No newline at end of file + "sources": [ + { + "filename": "phi-2.Q8_0.gguf", + "url": "https://huggingface.co/TheBloke/phi-2-GGUF/resolve/main/phi-2.Q8_0.gguf" + } + ], + "id": "phi-2-3b", + "object": "model", + "name": "Phi-2 3B Q8", + "version": "1.0", + "description": "Phi-2 is a 2.7B model, excelling in common sense and logical reasoning benchmarks, trained with synthetic texts and filtered websites.", + "format": "gguf", + "settings": { + "ctx_len": 4096, + "prompt_template": "Intruct:\n{prompt}\nOutput:", + "llama_model_path": "phi-2.Q8_0.gguf" + }, + "parameters": { + "temperature": 0.7, + "top_p": 0.95, + "stream": true, + "max_tokens": 4096, + "stop": [], + "frequency_penalty": 0, + "presence_penalty": 0 + }, + "metadata": { + "author": "Microsoft", + "tags": ["3B", "Foundational Model"], + "size": 2960000000 + }, + "engine": "nitro" +} diff --git a/models/phind-34b/model.json b/models/phind-34b/model.json index 7fc77ed71..60309cb9b 100644 --- a/models/phind-34b/model.json +++ b/models/phind-34b/model.json @@ -1,29 +1,34 @@ { - "source_url": "https://huggingface.co/TheBloke/Phind-CodeLlama-34B-v2-GGUF/resolve/main/phind-codellama-34b-v2.Q5_K_M.gguf", - "id": "phind-34b", - "object": "model", - "name": "Phind 34B Q5", - "version": "1.0", - "description": "Phind 34B is fine-tuned on 1.5B tokens of high-quality programming data. 
This multi-lingual model excels in various programming languages and is designed to be steerable and user-friendly.", - "format": "gguf", - "settings": { - "ctx_len": 4096, - "prompt_template": "### System Prompt\n{system_message}\n### User Message\n{prompt}\n### Assistant" - }, - "parameters": { - "temperature": 0.7, - "top_p": 0.95, - "stream": true, - "max_tokens": 4096, - "stop": [], - "frequency_penalty": 0, - "presence_penalty": 0 - }, - "metadata": { - "author": "Phind, The Bloke", - "tags": ["34B", "Finetuned"], - "size": 20220000000 - }, - "engine": "nitro" - } - \ No newline at end of file + "sources": [ + { + "filename": "phind-codellama-34b-v2.Q5_K_M.gguf", + "url": "https://huggingface.co/TheBloke/Phind-CodeLlama-34B-v2-GGUF/resolve/main/phind-codellama-34b-v2.Q5_K_M.gguf" + } + ], + "id": "phind-34b", + "object": "model", + "name": "Phind 34B Q5", + "version": "1.0", + "description": "Phind 34B is fine-tuned on 1.5B tokens of high-quality programming data. This multi-lingual model excels in various programming languages and is designed to be steerable and user-friendly.", + "format": "gguf", + "settings": { + "ctx_len": 4096, + "prompt_template": "### System Prompt\n{system_message}\n### User Message\n{prompt}\n### Assistant", + "llama_model_path": "phind-codellama-34b-v2.Q5_K_M.gguf" + }, + "parameters": { + "temperature": 0.7, + "top_p": 0.95, + "stream": true, + "max_tokens": 4096, + "stop": [], + "frequency_penalty": 0, + "presence_penalty": 0 + }, + "metadata": { + "author": "Phind, The Bloke", + "tags": ["34B", "Finetuned"], + "size": 20220000000 + }, + "engine": "nitro" +} diff --git a/models/solar-10.7b-slerp/model.json b/models/solar-10.7b-slerp/model.json index 9177fa013..8e62fa25b 100644 --- a/models/solar-10.7b-slerp/model.json +++ b/models/solar-10.7b-slerp/model.json @@ -1,29 +1,33 @@ { - "source_url": "https://huggingface.co/janhq/Solar-10.7B-SLERP-GGUF/resolve/main/solar-10.7b-slerp.Q4_K_M.gguf", - "id": "solar-10.7b-slerp", - "object": "model", - "name": "Solar Slerp 10.7B Q4", - "version": "1.0", - "description": "This model uses the Slerp merge method from SOLAR Instruct and Pandora-v1", - "format": "gguf", - "settings": { - "ctx_len": 4096, - "prompt_template": "### User: {prompt}\n### Assistant:" - }, - "parameters": { - "temperature": 0.7, - "top_p": 0.95, - "stream": true, - "max_tokens": 4096, - "stop": [], - "frequency_penalty": 0, - "presence_penalty": 0 - }, - "metadata": { - "author": "Jan", - "tags": ["13B","Finetuned"], - "size": 6360000000 - }, - "engine": "nitro" - } - \ No newline at end of file + "sources": [ + { + "filename": "solar-10.7b-slerp.Q4_K_M.gguf", + "url": "https://huggingface.co/janhq/Solar-10.7B-SLERP-GGUF/resolve/main/solar-10.7b-slerp.Q4_K_M.gguf" + } + ], + "id": "solar-10.7b-slerp", + "object": "model", + "name": "Solar Slerp 10.7B Q4", + "version": "1.0", + "description": "This model uses the Slerp merge method from SOLAR Instruct and Pandora-v1", + "format": "gguf", + "settings": { + "ctx_len": 4096, + "prompt_template": "### User: {prompt}\n### Assistant:", + "llama_model_path": "solar-10.7b-slerp.Q4_K_M.gguf" + }, + "parameters": { + "temperature": 0.7, + "top_p": 0.95, + "stream": true, + "max_tokens": 4096, + "frequency_penalty": 0, + "presence_penalty": 0 + }, + "metadata": { + "author": "Jan", + "tags": ["13B", "Finetuned"], + "size": 6360000000 + }, + "engine": "nitro" +} diff --git a/models/starling-7b/model.json b/models/starling-7b/model.json index 1a6d7e55c..eaa540bd9 100644 --- a/models/starling-7b/model.json 
+++ b/models/starling-7b/model.json @@ -1,29 +1,34 @@ { - "source_url": "https://huggingface.co/TheBloke/Starling-LM-7B-alpha-GGUF/resolve/main/starling-lm-7b-alpha.Q4_K_M.gguf", - "id": "starling-7b", - "object": "model", - "name": "Starling alpha 7B Q4", - "version": "1.0", - "description": "Starling 7B, an upgrade of Openchat 3.5 using RLAIF, is really good at various benchmarks, especially with GPT-4 judging its performance.", - "format": "gguf", - "settings": { - "ctx_len": 4096, - "prompt_template": "GPT4 User: {prompt}<|end_of_turn|>GPT4 Assistant:" - }, - "parameters": { - "temperature": 0.7, - "top_p": 0.95, - "stream": true, - "max_tokens": 4096, - "stop": ["<|end_of_turn|>"], - "frequency_penalty": 0, - "presence_penalty": 0 - }, - "metadata": { - "author": "Berkeley-nest, The Bloke", - "tags": ["7B","Finetuned"], - "size": 4370000000 - }, - "engine": "nitro" - } - \ No newline at end of file + "sources": [ + { + "filename": "starling-lm-7b-alpha.Q4_K_M.gguf", + "url": "https://huggingface.co/TheBloke/Starling-LM-7B-alpha-GGUF/resolve/main/starling-lm-7b-alpha.Q4_K_M.gguf" + } + ], + "id": "starling-7b", + "object": "model", + "name": "Starling alpha 7B Q4", + "version": "1.0", + "description": "Starling 7B, an upgrade of Openchat 3.5 using RLAIF, is really good at various benchmarks, especially with GPT-4 judging its performance.", + "format": "gguf", + "settings": { + "ctx_len": 4096, + "prompt_template": "GPT4 User: {prompt}<|end_of_turn|>GPT4 Assistant:", + "llama_model_path": "starling-lm-7b-alpha.Q4_K_M.gguf" + }, + "parameters": { + "temperature": 0.7, + "top_p": 0.95, + "stream": true, + "max_tokens": 4096, + "stop": ["<|end_of_turn|>"], + "frequency_penalty": 0, + "presence_penalty": 0 + }, + "metadata": { + "author": "Berkeley-nest, The Bloke", + "tags": ["7B", "Finetuned"], + "size": 4370000000 + }, + "engine": "nitro" +} diff --git a/models/stealth-v1.2-7b/model.json b/models/stealth-v1.2-7b/model.json index 92bfe46e1..235cbbb88 100644 --- a/models/stealth-v1.2-7b/model.json +++ b/models/stealth-v1.2-7b/model.json @@ -1,32 +1,33 @@ { - "source_url": "https://huggingface.co/janhq/stealth-v1.3-GGUF/resolve/main/stealth-v1.3.Q4_K_M.gguf", - "id": "stealth-v1.2-7b", - "object": "model", - "name": "Stealth 7B Q4", - "version": "1.0", - "description": "This is a new experimental family designed to enhance Mathematical and Logical abilities.", - "format": "gguf", - "settings": { - "ctx_len": 4096, - "prompt_template": "<|im_start|>system\n{system_message}<|im_end|>\n<|im_start|>user\n{prompt}<|im_end|>\n<|im_start|>assistant" - }, - "parameters": { - "temperature": 0.7, - "top_p": 0.95, - "stream": true, - "max_tokens": 4096, - "stop": [], - "frequency_penalty": 0, - "presence_penalty": 0 - }, - "metadata": { - "author": "Jan", - "tags": [ - "7B", - "Finetuned", - "Featured" - ], - "size": 4370000000 - }, - "engine": "nitro" - } \ No newline at end of file + "sources": [ + { + "filename": "stealth-v1.3.Q4_K_M.gguf", + "url": "https://huggingface.co/janhq/stealth-v1.3-GGUF/resolve/main/stealth-v1.3.Q4_K_M.gguf" + } + ], + "id": "stealth-v1.2-7b", + "object": "model", + "name": "Stealth 7B Q4", + "version": "1.0", + "description": "This is a new experimental family designed to enhance Mathematical and Logical abilities.", + "format": "gguf", + "settings": { + "ctx_len": 4096, + "prompt_template": "<|im_start|>system\n{system_message}<|im_end|>\n<|im_start|>user\n{prompt}<|im_end|>\n<|im_start|>assistant", + "llama_model_path": "stealth-v1.3.Q4_K_M.gguf" + }, + "parameters": { 
+ "temperature": 0.7, + "top_p": 0.95, + "stream": true, + "max_tokens": 4096, + "frequency_penalty": 0, + "presence_penalty": 0 + }, + "metadata": { + "author": "Jan", + "tags": ["7B", "Finetuned", "Featured"], + "size": 4370000000 + }, + "engine": "nitro" +} diff --git a/models/tinyllama-1.1b/model.json b/models/tinyllama-1.1b/model.json index 641511569..6a9187fa5 100644 --- a/models/tinyllama-1.1b/model.json +++ b/models/tinyllama-1.1b/model.json @@ -1,5 +1,10 @@ { - "source_url": "https://huggingface.co/TheBloke/TinyLlama-1.1B-Chat-v1.0-GGUF/resolve/main/tinyllama-1.1b-chat-v1.0.Q4_K_M.gguf", + "sources": [ + { + "filename": "tinyllama-1.1b-chat-v1.0.Q4_K_M.gguf", + "url": "https://huggingface.co/TheBloke/TinyLlama-1.1B-Chat-v1.0-GGUF/resolve/main/tinyllama-1.1b-chat-v1.0.Q4_K_M.gguf" + } + ], "id": "tinyllama-1.1b", "object": "model", "name": "TinyLlama Chat 1.1B Q4", @@ -7,8 +12,9 @@ "description": "TinyLlama is a tiny model with only 1.1B. It's a good model for less powerful computers.", "format": "gguf", "settings": { - "ctx_len": 2048, - "prompt_template": "<|system|>\n{system_message}<|user|>\n{prompt}<|assistant|>" + "ctx_len": 4096, + "prompt_template": "<|system|>\n{system_message}<|user|>\n{prompt}<|assistant|>", + "llama_model_path": "tinyllama-1.1b-chat-v1.0.Q4_K_M.gguf" }, "parameters": { "temperature": 0.7, @@ -20,9 +26,9 @@ "presence_penalty": 0 }, "metadata": { - "author": "TinyLlama", - "tags": ["Tiny", "Foundation Model"], - "size": 669000000 + "author": "TinyLlama", + "tags": ["Tiny", "Foundation Model"], + "size": 669000000 }, "engine": "nitro" -} \ No newline at end of file +} diff --git a/models/trinity-v1.2-7b/model.json b/models/trinity-v1.2-7b/model.json index ce5e7a4cf..2dda120e6 100644 --- a/models/trinity-v1.2-7b/model.json +++ b/models/trinity-v1.2-7b/model.json @@ -1,29 +1,34 @@ { - "source_url": "https://huggingface.co/janhq/trinity-v1.2-GGUF/resolve/main/trinity-v1.2.Q4_K_M.gguf", - "id": "trinity-v1.2-7b", - "object": "model", - "name": "Trinity-v1.2 7B Q4", - "version": "1.0", - "description": "Trinity is an experimental model merge using the Slerp method. Recommended for daily assistance purposes.", - "format": "gguf", - "settings": { - "ctx_len": 4096, - "prompt_template": "<|im_start|>system\n{system_message}<|im_end|>\n<|im_start|>user\n{prompt}<|im_end|>\n<|im_start|>assistant" - }, - "parameters": { - "temperature": 0.7, - "top_p": 0.95, - "stream": true, - "max_tokens": 4096, - "stop": [], - "frequency_penalty": 0, - "presence_penalty": 0 - }, - "metadata": { - "author": "Jan", - "tags": ["7B", "Merged", "Featured"], - "size": 4370000000, - "cover": "https://raw.githubusercontent.com/janhq/jan/main/models/trinity-v1.2-7b/cover.png" - }, - "engine": "nitro" - } \ No newline at end of file + "sources": [ + { + "filename": "trinity-v1.2.Q4_K_M.gguf", + "url": "https://huggingface.co/janhq/trinity-v1.2-GGUF/resolve/main/trinity-v1.2.Q4_K_M.gguf" + } + ], + "id": "trinity-v1.2-7b", + "object": "model", + "name": "Trinity-v1.2 7B Q4", + "version": "1.0", + "description": "Trinity is an experimental model merge using the Slerp method. 
Recommended for daily assistance purposes.", + "format": "gguf", + "settings": { + "ctx_len": 4096, + "prompt_template": "<|im_start|>system\n{system_message}<|im_end|>\n<|im_start|>user\n{prompt}<|im_end|>\n<|im_start|>assistant", + "llama_model_path": "trinity-v1.2.Q4_K_M.gguf" + }, + "parameters": { + "temperature": 0.7, + "top_p": 0.95, + "stream": true, + "max_tokens": 4096, + "frequency_penalty": 0, + "presence_penalty": 0 + }, + "metadata": { + "author": "Jan", + "tags": ["7B", "Merged", "Featured"], + "size": 4370000000, + "cover": "https://raw.githubusercontent.com/janhq/jan/main/models/trinity-v1.2-7b/cover.png" + }, + "engine": "nitro" +} diff --git a/models/tulu-2-70b/model.json b/models/tulu-2-70b/model.json index ae95b870d..06b96e50d 100644 --- a/models/tulu-2-70b/model.json +++ b/models/tulu-2-70b/model.json @@ -1,28 +1,33 @@ { - "source_url": "https://huggingface.co/TheBloke/tulu-2-dpo-70B-GGUF/resolve/main/tulu-2-dpo-70b.Q4_K_M.gguf", - "id": "tulu-2-70b", - "object": "model", - "name": "Tulu 2 70B Q4", - "version": "1.0", - "description": "Tulu 70B is a strong alternative to Llama 2 70b Chat to act as helpful assistants.", - "format": "gguf", - "settings": { - "ctx_len": 4096, - "prompt_template": "<|user|>\n{prompt}\n<|assistant|>" - }, - "parameters": { - "temperature": 0.7, - "top_p": 0.95, - "stream": true, - "max_tokens": 4096, - "stop": [], - "frequency_penalty": 0, - "presence_penalty": 0 - }, - "metadata": { - "author": "Lizpreciatior, The Bloke", - "tags": ["70B", "Finetuned"], - "size": 41400000000 - }, - "engine": "nitro" - } \ No newline at end of file + "sources": [ + { + "filename": "tulu-2-dpo-70b.Q4_K_M.gguf", + "url": "https://huggingface.co/TheBloke/tulu-2-dpo-70B-GGUF/resolve/main/tulu-2-dpo-70b.Q4_K_M.gguf" + } + ], + "id": "tulu-2-70b", + "object": "model", + "name": "Tulu 2 70B Q4", + "version": "1.0", + "description": "Tulu 70B is a strong alternative to Llama 2 70b Chat to act as helpful assistants.", + "format": "gguf", + "settings": { + "ctx_len": 4096, + "prompt_template": "<|user|>\n{prompt}\n<|assistant|>", + "llama_model_path": "tulu-2-dpo-70b.Q4_K_M.gguf" + }, + "parameters": { + "temperature": 0.7, + "top_p": 0.95, + "stream": true, + "max_tokens": 4096, + "frequency_penalty": 0, + "presence_penalty": 0 + }, + "metadata": { + "author": "Lizpreciatior, The Bloke", + "tags": ["70B", "Finetuned"], + "size": 41400000000 + }, + "engine": "nitro" +} diff --git a/models/wizardcoder-13b/model.json b/models/wizardcoder-13b/model.json index 1605ed362..051c739a0 100644 --- a/models/wizardcoder-13b/model.json +++ b/models/wizardcoder-13b/model.json @@ -1,29 +1,34 @@ { - "source_url": "https://huggingface.co/TheBloke/WizardCoder-Python-13B-V1.0-GGUF/resolve/main/wizardcoder-python-13b-v1.0.Q5_K_M.gguf", - "id": "wizardcoder-13b", - "object": "model", - "name": "Wizard Coder Python 13B Q5", - "version": "1.0", - "description": "WizardCoder 13B is a Python coding model. 
This model demonstrate high proficiency in specific domains like coding and mathematics.", - "format": "gguf", - "settings": { - "ctx_len": 4096, - "prompt_template": "### Instruction:\n{prompt}\n### Response:" - }, - "parameters": { - "temperature": 0.7, - "top_p": 0.95, - "stream": true, - "max_tokens": 4096, - "stop": [], - "frequency_penalty": 0, - "presence_penalty": 0 - }, - "metadata": { - "author": "WizardLM, The Bloke", - "tags": ["Recommended", "13B", "Finetuned"], - "size": 7870000000 - }, - "engine": "nitro" - } - \ No newline at end of file + "sources": [ + { + "filename": "wizardcoder-python-13b-v1.0.Q5_K_M.gguf", + "url": "https://huggingface.co/TheBloke/WizardCoder-Python-13B-V1.0-GGUF/resolve/main/wizardcoder-python-13b-v1.0.Q5_K_M.gguf" + } + ], + "id": "wizardcoder-13b", + "object": "model", + "name": "Wizard Coder Python 13B Q5", + "version": "1.0", + "description": "WizardCoder 13B is a Python coding model. This model demonstrate high proficiency in specific domains like coding and mathematics.", + "format": "gguf", + "settings": { + "ctx_len": 4096, + "prompt_template": "### Instruction:\n{prompt}\n### Response:", + "llama_model_path": "wizardcoder-python-13b-v1.0.Q5_K_M.gguf" + }, + "parameters": { + "temperature": 0.7, + "top_p": 0.95, + "stream": true, + "max_tokens": 4096, + "stop": [], + "frequency_penalty": 0, + "presence_penalty": 0 + }, + "metadata": { + "author": "WizardLM, The Bloke", + "tags": ["Recommended", "13B", "Finetuned"], + "size": 7870000000 + }, + "engine": "nitro" +} diff --git a/models/yarn-mistral-7b/model.json b/models/yarn-mistral-7b/model.json index 2676fbb58..ee6de1319 100644 --- a/models/yarn-mistral-7b/model.json +++ b/models/yarn-mistral-7b/model.json @@ -1,29 +1,31 @@ { - "source_url": "https://huggingface.co/TheBloke/Yarn-Mistral-7B-128k-GGUF/resolve/main/yarn-mistral-7b-128k.Q4_K_M.gguf", - "id": "yarn-mistral-7b", - "object": "model", - "name": "Yarn Mistral 7B Q4", - "version": "1.0", - "description": "Yarn Mistral 7B is a language model for long context and supports a 128k token context window.", - "format": "gguf", - "settings": { - "ctx_len": 4096, - "prompt_template": "{prompt}" - }, - "parameters": { - "temperature": 0.7, - "top_p": 0.95, - "stream": true, - "max_tokens": 4096, - "stop": [], - "frequency_penalty": 0, - "presence_penalty": 0 - }, - "metadata": { - "author": "NousResearch, The Bloke", - "tags": ["7B","Finetuned"], - "size": 4370000000 - }, - "engine": "nitro" - } - \ No newline at end of file + "sources": [ + { + "url": "https://huggingface.co/TheBloke/Yarn-Mistral-7B-128k-GGUF/resolve/main/yarn-mistral-7b-128k.Q4_K_M.gguf" + } + ], + "id": "yarn-mistral-7b", + "object": "model", + "name": "Yarn Mistral 7B Q4", + "version": "1.0", + "description": "Yarn Mistral 7B is a language model for long context and supports a 128k token context window.", + "format": "gguf", + "settings": { + "ctx_len": 4096, + "prompt_template": "{prompt}" + }, + "parameters": { + "temperature": 0.7, + "top_p": 0.95, + "stream": true, + "max_tokens": 4096, + "frequency_penalty": 0, + "presence_penalty": 0 + }, + "metadata": { + "author": "NousResearch, The Bloke", + "tags": ["7B", "Finetuned"], + "size": 4370000000 + }, + "engine": "nitro" +} diff --git a/models/yi-34b/model.json b/models/yi-34b/model.json index 8ff23aaa0..3697a9e22 100644 --- a/models/yi-34b/model.json +++ b/models/yi-34b/model.json @@ -1,29 +1,34 @@ { - "source_url": "https://huggingface.co/TheBloke/Yi-34B-Chat-GGUF/resolve/main/yi-34b-chat.Q5_K_M.gguf", - "id": "yi-34b", 
- "object": "model", - "name": "Yi 34B Q5", - "version": "1.0", - "description": "Yi-34B, a specialized chat model, is known for its diverse and creative responses and excels across various NLP tasks and benchmarks.", - "format": "gguf", - "settings": { - "ctx_len": 4096, - "prompt_template": "<|im_start|>system\n{system_message}<|im_end|>\n<|im_start|>user\n{prompt}<|im_end|>\n<|im_start|>assistant" - }, - "parameters": { - "temperature": 0.7, - "top_p": 0.95, - "stream": true, - "max_tokens": 4096, - "stop": [], - "frequency_penalty": 0, - "presence_penalty": 0 - }, - "metadata": { - "author": "01-ai, The Bloke", - "tags": ["34B", "Foundational Model"], - "size": 20660000000 - }, - "engine": "nitro" - } - \ No newline at end of file + "sources": [ + { + "filename": "yi-34b-chat.Q5_K_M.gguf", + "url": "https://huggingface.co/TheBloke/Yi-34B-Chat-GGUF/resolve/main/yi-34b-chat.Q5_K_M.gguf" + } + ], + "id": "yi-34b", + "object": "model", + "name": "Yi 34B Q5", + "version": "1.0", + "description": "Yi-34B, a specialized chat model, is known for its diverse and creative responses and excels across various NLP tasks and benchmarks.", + "format": "gguf", + "settings": { + "ctx_len": 4096, + "prompt_template": "<|im_start|>system\n{system_message}<|im_end|>\n<|im_start|>user\n{prompt}<|im_end|>\n<|im_start|>assistant", + "llama_model_path": "yi-34b-chat.Q5_K_M.gguf" + }, + "parameters": { + "temperature": 0.7, + "top_p": 0.95, + "stream": true, + "max_tokens": 4096, + "stop": [], + "frequency_penalty": 0, + "presence_penalty": 0 + }, + "metadata": { + "author": "01-ai, The Bloke", + "tags": ["34B", "Foundational Model"], + "size": 20660000000 + }, + "engine": "nitro" +} diff --git a/web/containers/Providers/EventListener.tsx b/web/containers/Providers/EventListener.tsx index d91a877d6..2816c88e2 100644 --- a/web/containers/Providers/EventListener.tsx +++ b/web/containers/Providers/EventListener.tsx @@ -105,6 +105,7 @@ export default function EventListenerWrapper({ children }: PropsWithChildren) { }) } return () => {} + // eslint-disable-next-line react-hooks/exhaustive-deps }, []) return ( diff --git a/web/hooks/useDownloadModel.ts b/web/hooks/useDownloadModel.ts index 49dbe1d5b..528108d18 100644 --- a/web/hooks/useDownloadModel.ts +++ b/web/hooks/useDownloadModel.ts @@ -6,6 +6,7 @@ import { ModelExtension, abortDownload, joinPath, + ModelArtifact, } from '@janhq/core' import { useSetAtom } from 'jotai' @@ -25,6 +26,23 @@ export default function useDownloadModel() { const addNewDownloadingModel = useSetAtom(addNewDownloadingModelAtom) const downloadModel = async (model: Model) => { + const childrenDownloadProgress: DownloadState[] = [] + model.sources.forEach((source: ModelArtifact) => { + childrenDownloadProgress.push({ + modelId: source.filename, + time: { + elapsed: 0, + remaining: 0, + }, + speed: 0, + percent: 0, + size: { + total: 0, + transferred: 0, + }, + }) + }) + // set an initial download state setDownloadState({ modelId: model.id, @@ -38,6 +56,7 @@ export default function useDownloadModel() { total: 0, transferred: 0, }, + children: childrenDownloadProgress, }) addNewDownloadingModel(model) @@ -46,6 +65,7 @@ export default function useDownloadModel() { .get(ExtensionTypeEnum.Model) ?.downloadModel(model, { ignoreSSL, proxy }) } + const abortModelDownload = async (model: Model) => { await abortDownload( await joinPath(['models', model.id, modelBinFileName(model)]) diff --git a/web/hooks/useGetConfiguredModels.ts b/web/hooks/useGetConfiguredModels.ts index 5662d534e..919f43754 100644 
--- a/web/hooks/useGetConfiguredModels.ts +++ b/web/hooks/useGetConfiguredModels.ts @@ -1,7 +1,6 @@ import { useEffect, useState } from 'react' -import { ExtensionTypeEnum, ModelExtension } from '@janhq/core' -import { Model } from '@janhq/core' +import { ExtensionTypeEnum, ModelExtension, Model } from '@janhq/core' import { extensionManager } from '@/extension/ExtensionManager' @@ -25,6 +24,7 @@ export function useGetConfiguredModels() { useEffect(() => { fetchModels() + // eslint-disable-next-line react-hooks/exhaustive-deps }, []) return { loading, models } diff --git a/web/hooks/useGetDownloadedModels.ts b/web/hooks/useGetDownloadedModels.ts index f509fce63..bba420858 100644 --- a/web/hooks/useGetDownloadedModels.ts +++ b/web/hooks/useGetDownloadedModels.ts @@ -6,7 +6,7 @@ import { atom, useAtom } from 'jotai' import { extensionManager } from '@/extension/ExtensionManager' -const downloadedModelsAtom = atom([]) +export const downloadedModelsAtom = atom([]) export function useGetDownloadedModels() { const [downloadedModels, setDownloadedModels] = useAtom(downloadedModelsAtom) @@ -15,7 +15,8 @@ export function useGetDownloadedModels() { getDownloadedModels().then((downloadedModels) => { setDownloadedModels(downloadedModels) }) - }, [setDownloadedModels]) + // eslint-disable-next-line react-hooks/exhaustive-deps + }, []) return { downloadedModels, setDownloadedModels } } diff --git a/web/hooks/useRecommendedModel.ts b/web/hooks/useRecommendedModel.ts index dd474d0b5..2ee4c1a7f 100644 --- a/web/hooks/useRecommendedModel.ts +++ b/web/hooks/useRecommendedModel.ts @@ -110,6 +110,7 @@ export default function useRecommendedModel() { console.debug(`Using last used model ${lastUsedModel.id}`) setRecommendedModel(lastUsedModel) + // eslint-disable-next-line react-hooks/exhaustive-deps }, [getAndSortDownloadedModels, activeThread]) useEffect(() => { diff --git a/web/hooks/useSettings.ts b/web/hooks/useSettings.ts index 34d123359..ef4e08480 100644 --- a/web/hooks/useSettings.ts +++ b/web/hooks/useSettings.ts @@ -13,6 +13,7 @@ export const useSettings = () => { useEffect(() => { setTimeout(() => validateSettings, 3000) + // eslint-disable-next-line react-hooks/exhaustive-deps }, []) const validateSettings = async () => { diff --git a/web/package.json b/web/package.json index bba3dd48b..5293cf765 100644 --- a/web/package.json +++ b/web/package.json @@ -21,7 +21,7 @@ "class-variance-authority": "^0.7.0", "framer-motion": "^10.16.4", "highlight.js": "^11.9.0", - "jotai": "^2.4.0", + "jotai": "^2.6.0", "lodash": "^4.17.21", "lucide-react": "^0.291.0", "marked": "^9.1.2", diff --git a/web/screens/ExploreModels/ExploreModelItemHeader/index.tsx b/web/screens/ExploreModels/ExploreModelItemHeader/index.tsx index b56e20404..656a671c7 100644 --- a/web/screens/ExploreModels/ExploreModelItemHeader/index.tsx +++ b/web/screens/ExploreModels/ExploreModelItemHeader/index.tsx @@ -26,7 +26,7 @@ import { useCreateNewThread } from '@/hooks/useCreateNewThread' import useDownloadModel from '@/hooks/useDownloadModel' import { useDownloadState } from '@/hooks/useDownloadState' import { getAssistants } from '@/hooks/useGetAssistants' -import { useGetDownloadedModels } from '@/hooks/useGetDownloadedModels' +import { downloadedModelsAtom } from '@/hooks/useGetDownloadedModels' import { useMainViewState } from '@/hooks/useMainViewState' import { toGibibytes } from '@/utils/converter' @@ -43,8 +43,8 @@ type Props = { const ExploreModelItemHeader: React.FC = ({ model, onClick, open }) => { const { downloadModel } = 
useDownloadModel() - const { downloadedModels } = useGetDownloadedModels() - const { modelDownloadStateAtom, downloadStates } = useDownloadState() + const downloadedModels = useAtomValue(downloadedModelsAtom) + const { modelDownloadStateAtom } = useDownloadState() const { requestCreateNewThread } = useCreateNewThread() const totalRam = useAtomValue(totalRamAtom) const serverEnabled = useAtomValue(serverEnabledAtom) @@ -100,9 +100,7 @@ const ExploreModelItemHeader: React.FC = ({ model, onClick, open }) => { )} ) - } - - if (downloadState != null && downloadStates.length > 0) { + } else if (downloadState != null) { downloadButton = } diff --git a/web/types/downloadState.d.ts b/web/types/downloadState.d.ts index 3c3389b4f..cca526bf1 100644 --- a/web/types/downloadState.d.ts +++ b/web/types/downloadState.d.ts @@ -4,6 +4,8 @@ type DownloadState = { speed: number percent: number size: DownloadSize + isFinished?: boolean + children?: DownloadState[] error?: string } diff --git a/web/utils/model.ts b/web/utils/model.ts index 2dd6fbdd3..eab4076d8 100644 --- a/web/utils/model.ts +++ b/web/utils/model.ts @@ -2,7 +2,7 @@ import { Model } from '@janhq/core' export const modelBinFileName = (model: Model) => { const modelFormatExt = '.gguf' - const extractedFileName = model.source_url?.split('/').pop() ?? model.id + const extractedFileName = model.sources[0]?.url.split('/').pop() ?? model.id const fileName = extractedFileName.toLowerCase().endsWith(modelFormatExt) ? extractedFileName : model.id diff --git a/web/utils/modelParam.ts b/web/utils/modelParam.ts index 7d559c313..2deffce66 100644 --- a/web/utils/modelParam.ts +++ b/web/utils/modelParam.ts @@ -40,6 +40,8 @@ export const toSettingParams = ( n_parallel: undefined, cpu_threads: undefined, prompt_template: undefined, + llama_model_path: undefined, + mmproj: undefined, } const settingParams: ModelSettingParams = {} From dea35dad9e366e60afa3bb3f1bb8d586812ebe1d Mon Sep 17 00:00:00 2001 From: Service Account Date: Thu, 25 Jan 2024 09:18:42 +0000 Subject: [PATCH 06/65] janhq/jan: Update README.md with nightly build artifact URL --- README.md | 10 +++++----- 1 file changed, 5 insertions(+), 5 deletions(-) diff --git a/README.md b/README.md index 82c3ae79b..d69c9cde5 100644 --- a/README.md +++ b/README.md @@ -76,31 +76,31 @@ Jan is an open-source ChatGPT alternative that runs 100% offline on your compute Experimental (Nightly Build) - + jan.exe - + Intel - + M1/M2 - + jan.deb - + jan.AppImage From 01fcfb7097237c20c1ea93640e5753e0147a20fa Mon Sep 17 00:00:00 2001 From: Service Account Date: Thu, 25 Jan 2024 10:35:24 +0000 Subject: [PATCH 07/65] janhq/jan: Update README.md with nightly build artifact URL --- README.md | 10 +++++----- 1 file changed, 5 insertions(+), 5 deletions(-) diff --git a/README.md b/README.md index d69c9cde5..b45cd8413 100644 --- a/README.md +++ b/README.md @@ -76,31 +76,31 @@ Jan is an open-source ChatGPT alternative that runs 100% offline on your compute Experimental (Nightly Build) - + jan.exe - + Intel - + M1/M2 - + jan.deb - + jan.AppImage From 75f32614e7838e48ad37c3a42972720c1e1db4f1 Mon Sep 17 00:00:00 2001 From: Service Account Date: Thu, 25 Jan 2024 11:27:46 +0000 Subject: [PATCH 08/65] janhq/jan: Update README.md with nightly build artifact URL --- README.md | 10 +++++----- 1 file changed, 5 insertions(+), 5 deletions(-) diff --git a/README.md b/README.md index b45cd8413..6c1fc44a4 100644 --- a/README.md +++ b/README.md @@ -76,31 +76,31 @@ Jan is an open-source ChatGPT alternative that runs 100% offline on your compute 
Experimental (Nightly Build) - + jan.exe - + Intel - + M1/M2 - + jan.deb - + jan.AppImage From b291b3da7164252af5c25ba4a38ce285450e0852 Mon Sep 17 00:00:00 2001 From: Service Account Date: Thu, 25 Jan 2024 13:12:20 +0000 Subject: [PATCH 09/65] janhq/jan: Update README.md with nightly build artifact URL --- README.md | 10 +++++----- 1 file changed, 5 insertions(+), 5 deletions(-) diff --git a/README.md b/README.md index 6c1fc44a4..2722a2870 100644 --- a/README.md +++ b/README.md @@ -76,31 +76,31 @@ Jan is an open-source ChatGPT alternative that runs 100% offline on your compute Experimental (Nightly Build) - + jan.exe - + Intel - + M1/M2 - + jan.deb - + jan.AppImage From 837fa8a82dbb185050aaa2a39ef11823b188d08d Mon Sep 17 00:00:00 2001 From: hiento09 <136591877+hiento09@users.noreply.github.com> Date: Thu, 25 Jan 2024 21:18:45 +0700 Subject: [PATCH 10/65] Docs publish to github page trigger on push to docs branch (#1782) Co-authored-by: Hien To --- .github/workflows/jan-docs.yml | 6 ++++-- 1 file changed, 4 insertions(+), 2 deletions(-) diff --git a/.github/workflows/jan-docs.yml b/.github/workflows/jan-docs.yml index 8ce4e91ed..8135935bd 100644 --- a/.github/workflows/jan-docs.yml +++ b/.github/workflows/jan-docs.yml @@ -5,6 +5,7 @@ on: branches: - main - dev + - docs paths: - 'docs/**' - '.github/workflows/jan-docs.yml' @@ -12,6 +13,7 @@ on: branches: - main - dev + - docs paths: - 'docs/**' - '.github/workflows/jan-docs.yml' @@ -91,13 +93,13 @@ jobs: Preview URL: ${{ steps.deployCloudflarePages.outputs.url }} - name: Add Custome Domain file - if: github.event_name == 'push' && github.ref == 'refs/heads/main' && github.event.pull_request.head.repo.full_name != github.repository + if: github.event_name == 'push' && github.ref == 'refs/heads/docs' && github.event.pull_request.head.repo.full_name != github.repository run: echo "${{ vars.DOCUSAURUS_DOMAIN }}" > ./docs/build/CNAME # Popular action to deploy to GitHub Pages: # Docs: https://github.com/peaceiris/actions-gh-pages#%EF%B8%8F-docusaurus - name: Deploy to GitHub Pages - if: github.event_name == 'push' && github.ref == 'refs/heads/main' && github.event.pull_request.head.repo.full_name != github.repository + if: github.event_name == 'push' && github.ref == 'refs/heads/docs' && github.event.pull_request.head.repo.full_name != github.repository uses: peaceiris/actions-gh-pages@v3 with: github_token: ${{ secrets.GITHUB_TOKEN }} From b2b1479fc34a34a10129a765ac37906e86d7ee54 Mon Sep 17 00:00:00 2001 From: copyhold Date: Thu, 25 Jan 2024 16:38:32 +0200 Subject: [PATCH 11/65] Added focus --- web/screens/Chat/index.tsx | 4 ++++ 1 file changed, 4 insertions(+) diff --git a/web/screens/Chat/index.tsx b/web/screens/Chat/index.tsx index 684027e49..f86460f1c 100644 --- a/web/screens/Chat/index.tsx +++ b/web/screens/Chat/index.tsx @@ -74,6 +74,9 @@ const ChatScreen = () => { } useEffect(() => { + if (textareaRef.current) { + textareaRef.current.focus() + } if (isWaitingToSend && activeThreadId) { setIsWaitingToSend(false) sendChatMessage() @@ -85,6 +88,7 @@ const ChatScreen = () => { if (textareaRef.current) { textareaRef.current.style.height = '40px' textareaRef.current.style.height = textareaRef.current.scrollHeight + 'px' + textareaRef.current.focus() } }, [currentPrompt]) From a78e183eeb71825de3341fb11ac7719dd6bb1ac8 Mon Sep 17 00:00:00 2001 From: Service Account Date: Thu, 25 Jan 2024 15:36:30 +0000 Subject: [PATCH 12/65] janhq/jan: Update README.md with nightly build artifact URL --- README.md | 10 +++++----- 1 file changed, 5 insertions(+), 5 
deletions(-) diff --git a/README.md b/README.md index 2722a2870..fb11cfbde 100644 --- a/README.md +++ b/README.md @@ -76,31 +76,31 @@ Jan is an open-source ChatGPT alternative that runs 100% offline on your compute Experimental (Nightly Build) - + jan.exe - + Intel - + M1/M2 - + jan.deb - + jan.AppImage From e8796a7ad860536a91fb45f56a2cb181bbaa3b81 Mon Sep 17 00:00:00 2001 From: Service Account Date: Thu, 25 Jan 2024 15:43:16 +0000 Subject: [PATCH 13/65] janhq/jan: Update README.md with nightly build artifact URL --- README.md | 10 +++++----- 1 file changed, 5 insertions(+), 5 deletions(-) diff --git a/README.md b/README.md index fb11cfbde..53558185c 100644 --- a/README.md +++ b/README.md @@ -76,31 +76,31 @@ Jan is an open-source ChatGPT alternative that runs 100% offline on your compute Experimental (Nightly Build) - + jan.exe - + Intel - + M1/M2 - + jan.deb - + jan.AppImage From b0d63c988d6fff570130e5b4fcba471b7951c107 Mon Sep 17 00:00:00 2001 From: Service Account Date: Thu, 25 Jan 2024 16:30:09 +0000 Subject: [PATCH 14/65] janhq/jan: Update README.md with nightly build artifact URL --- README.md | 10 +++++----- 1 file changed, 5 insertions(+), 5 deletions(-) diff --git a/README.md b/README.md index 53558185c..8811dbe0c 100644 --- a/README.md +++ b/README.md @@ -76,31 +76,31 @@ Jan is an open-source ChatGPT alternative that runs 100% offline on your compute Experimental (Nightly Build) - + jan.exe - + Intel - + M1/M2 - + jan.deb - + jan.AppImage From a52d81c79a979b234882c468ad056049f7c8d757 Mon Sep 17 00:00:00 2001 From: Service Account Date: Thu, 25 Jan 2024 20:16:35 +0000 Subject: [PATCH 15/65] janhq/jan: Update README.md with nightly build artifact URL --- README.md | 10 +++++----- 1 file changed, 5 insertions(+), 5 deletions(-) diff --git a/README.md b/README.md index 8811dbe0c..9183b0652 100644 --- a/README.md +++ b/README.md @@ -76,31 +76,31 @@ Jan is an open-source ChatGPT alternative that runs 100% offline on your compute Experimental (Nightly Build) - + jan.exe - + Intel - + M1/M2 - + jan.deb - + jan.AppImage From 99025cb02f6affabd2c4786b6e5247e5177ffc37 Mon Sep 17 00:00:00 2001 From: hiento09 <136591877+hiento09@users.noreply.github.com> Date: Fri, 26 Jan 2024 09:24:09 +0700 Subject: [PATCH 16/65] CI nightly update trigger to 3AM UTC +7 Tuesday, Wednesday, and Thursday (#1798) Co-authored-by: Hien To --- .github/workflows/jan-electron-build-nightly.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/jan-electron-build-nightly.yml b/.github/workflows/jan-electron-build-nightly.yml index f961ccd6f..08b6ad476 100644 --- a/.github/workflows/jan-electron-build-nightly.yml +++ b/.github/workflows/jan-electron-build-nightly.yml @@ -2,7 +2,7 @@ name: Jan Build Electron App Nightly or Manual on: schedule: - - cron: '0 20 * * 2,3,4' # At 8 PM UTC on Tuesday, Wednesday, and Thursday, which is 3 AM UTC+7 + - cron: '0 20 * * 1,2,3' # At 8 PM UTC on Monday, Tuesday, and Wednesday which is 3 AM UTC+7 Tuesday, Wednesday, and Thursday workflow_dispatch: inputs: public_provider: From 85b58eb82400cb9d75af4f16ca6e1b4ef96c8224 Mon Sep 17 00:00:00 2001 From: Service Account Date: Fri, 26 Jan 2024 04:00:07 +0000 Subject: [PATCH 17/65] janhq/jan: Update README.md with nightly build artifact URL --- README.md | 10 +++++----- 1 file changed, 5 insertions(+), 5 deletions(-) diff --git a/README.md b/README.md index 9183b0652..770b88266 100644 --- a/README.md +++ b/README.md @@ -76,31 +76,31 @@ Jan is an open-source ChatGPT alternative that runs 100% offline on your 
compute Experimental (Nightly Build) - + jan.exe - + Intel - + M1/M2 - + jan.deb - + jan.AppImage From 143e76a0dedcf49fb3d32a9715fc3958aaad6907 Mon Sep 17 00:00:00 2001 From: NamH Date: Fri, 26 Jan 2024 12:19:02 +0700 Subject: [PATCH 18/65] chore: clean up code and remove some lint suppression (#1777) * chore: clean up code and remove some lint suppression Signed-off-by: James * Update .gitignore --------- Signed-off-by: James Co-authored-by: James Co-authored-by: Louis --- .gitignore | 3 + extensions/assistant-extension/src/index.ts | 3 +- extensions/monitoring-extension/src/index.ts | 3 +- web/containers/Layout/index.tsx | 2 +- web/containers/Providers/EventHandler.tsx | 118 +++++++++++-------- web/containers/Providers/EventListener.tsx | 16 +-- web/hooks/useGetConfiguredModels.ts | 23 ++-- web/screens/Chat/MessageToolbar/index.tsx | 2 +- 8 files changed, 96 insertions(+), 74 deletions(-) diff --git a/.gitignore b/.gitignore index e3e4635fc..4540e5c7a 100644 --- a/.gitignore +++ b/.gitignore @@ -12,6 +12,8 @@ build electron/renderer electron/models electron/docs +electron/engines +server/pre-install package-lock.json *.log @@ -26,3 +28,4 @@ extensions/inference-nitro-extension/bin/*/*.exp extensions/inference-nitro-extension/bin/*/*.lib extensions/inference-nitro-extension/bin/saved-* extensions/inference-nitro-extension/bin/*.tar.gz + diff --git a/extensions/assistant-extension/src/index.ts b/extensions/assistant-extension/src/index.ts index 96de33b7b..098ab1f54 100644 --- a/extensions/assistant-extension/src/index.ts +++ b/extensions/assistant-extension/src/index.ts @@ -1,5 +1,4 @@ -import { fs, Assistant } from "@janhq/core"; -import { AssistantExtension } from "@janhq/core"; +import { fs, Assistant, AssistantExtension } from "@janhq/core"; import { join } from "path"; export default class JanAssistantExtension extends AssistantExtension { diff --git a/extensions/monitoring-extension/src/index.ts b/extensions/monitoring-extension/src/index.ts index d3f20b437..9297a770f 100644 --- a/extensions/monitoring-extension/src/index.ts +++ b/extensions/monitoring-extension/src/index.ts @@ -1,5 +1,4 @@ -import { MonitoringExtension } from "@janhq/core"; -import { executeOnMain } from "@janhq/core"; +import { MonitoringExtension, executeOnMain } from "@janhq/core"; /** * JanMonitoringExtension is a extension that provides system monitoring functionality. diff --git a/web/containers/Layout/index.tsx b/web/containers/Layout/index.tsx index 54a7845a4..e7bde49c0 100644 --- a/web/containers/Layout/index.tsx +++ b/web/containers/Layout/index.tsx @@ -28,7 +28,7 @@ const BaseLayout = (props: PropsWithChildren) => { if (localStorage.getItem(SUCCESS_SET_NEW_DESTINATION) === 'true') { setMainViewState(MainViewState.Settings) } - }, []) + }, [setMainViewState]) return (
diff --git a/web/containers/Providers/EventHandler.tsx b/web/containers/Providers/EventHandler.tsx index 1f9d6d7af..114370359 100644 --- a/web/containers/Providers/EventHandler.tsx +++ b/web/containers/Providers/EventHandler.tsx @@ -1,5 +1,5 @@ /* eslint-disable @typescript-eslint/no-explicit-any */ -import { ReactNode, useEffect, useRef } from 'react' +import { ReactNode, useCallback, useEffect, useRef } from 'react' import { events, @@ -48,48 +48,61 @@ export default function EventHandler({ children }: { children: ReactNode }) { modelsRef.current = downloadedModels }, [downloadedModels]) - async function handleNewMessageResponse(message: ThreadMessage) { - addNewMessage(message) - } + const onNewMessageResponse = useCallback( + (message: ThreadMessage) => { + addNewMessage(message) + }, + [addNewMessage] + ) - async function handleModelReady(model: Model) { - setActiveModel(model) - toaster({ - title: 'Success!', - description: `Model ${model.id} has been started.`, - }) - setStateModel(() => ({ - state: 'stop', - loading: false, - model: model.id, - })) - } + const onModelReady = useCallback( + (model: Model) => { + setActiveModel(model) + toaster({ + title: 'Success!', + description: `Model ${model.id} has been started.`, + }) + setStateModel(() => ({ + state: 'stop', + loading: false, + model: model.id, + })) + }, + [setActiveModel, setStateModel] + ) - async function handleModelStopped() { - setTimeout(async () => { + const onModelStopped = useCallback(() => { + setTimeout(() => { setActiveModel(undefined) setStateModel({ state: 'start', loading: false, model: '' }) }, 500) - } + }, [setActiveModel, setStateModel]) - async function handleModelFail(res: any) { - const errorMessage = `${res.error}` - alert(errorMessage) - setStateModel(() => ({ - state: 'start', - loading: false, - model: res.modelId, - })) - } + const onModelInitFailed = useCallback( + (res: any) => { + const errorMessage = `${res.error}` + console.error('Failed to load model: ' + errorMessage) + setStateModel(() => ({ + state: 'start', + loading: false, + model: res.modelId, + })) + }, + [setStateModel] + ) + + const onMessageResponseUpdate = useCallback( + (message: ThreadMessage) => { + updateMessage( + message.id, + message.thread_id, + message.content, + message.status + ) + if (message.status === MessageStatus.Pending) { + return + } - async function handleMessageResponseUpdate(message: ThreadMessage) { - updateMessage( - message.id, - message.thread_id, - message.content, - message.status - ) - if (message.status !== MessageStatus.Pending) { // Mark the thread as not waiting for response updateThreadWaiting(message.thread_id, false) @@ -111,26 +124,33 @@ export default function EventHandler({ children }: { children: ReactNode }) { .get(ExtensionTypeEnum.Conversational) ?.addNewMessage(message) } - } - } + }, + [updateMessage, updateThreadWaiting] + ) useEffect(() => { + console.log('Registering events') if (window.core?.events) { - events.on(MessageEvent.OnMessageResponse, handleNewMessageResponse) - events.on(MessageEvent.OnMessageUpdate, handleMessageResponseUpdate) - events.on(ModelEvent.OnModelReady, handleModelReady) - events.on(ModelEvent.OnModelFail, handleModelFail) - events.on(ModelEvent.OnModelStopped, handleModelStopped) + events.on(MessageEvent.OnMessageResponse, onNewMessageResponse) + events.on(MessageEvent.OnMessageUpdate, onMessageResponseUpdate) + + events.on(ModelEvent.OnModelReady, onModelReady) + events.on(ModelEvent.OnModelFail, onModelInitFailed) + events.on(ModelEvent.OnModelStopped, 
onModelStopped) } - // eslint-disable-next-line react-hooks/exhaustive-deps - }, []) + }, [ + onNewMessageResponse, + onMessageResponseUpdate, + onModelReady, + onModelInitFailed, + onModelStopped, + ]) useEffect(() => { return () => { - events.off(MessageEvent.OnMessageResponse, handleNewMessageResponse) - events.off(MessageEvent.OnMessageUpdate, handleMessageResponseUpdate) + events.off(MessageEvent.OnMessageResponse, onNewMessageResponse) + events.off(MessageEvent.OnMessageUpdate, onMessageResponseUpdate) } - // eslint-disable-next-line react-hooks/exhaustive-deps - }, []) + }, [onNewMessageResponse, onMessageResponseUpdate]) return <>{children} } diff --git a/web/containers/Providers/EventListener.tsx b/web/containers/Providers/EventListener.tsx index 2816c88e2..62d4cacb6 100644 --- a/web/containers/Providers/EventListener.tsx +++ b/web/containers/Providers/EventListener.tsx @@ -105,12 +105,14 @@ export default function EventListenerWrapper({ children }: PropsWithChildren) { }) } return () => {} - // eslint-disable-next-line react-hooks/exhaustive-deps - }, []) + }, [ + setDownloadState, + setDownloadStateCancelled, + setDownloadStateFailed, + setDownloadStateSuccess, + setDownloadedModels, + setProgress, + ]) - return ( -
- {children} -
- ) + return {children} } diff --git a/web/hooks/useGetConfiguredModels.ts b/web/hooks/useGetConfiguredModels.ts index 919f43754..8be052ae2 100644 --- a/web/hooks/useGetConfiguredModels.ts +++ b/web/hooks/useGetConfiguredModels.ts @@ -1,4 +1,4 @@ -import { useEffect, useState } from 'react' +import { useCallback, useEffect, useState } from 'react' import { ExtensionTypeEnum, ModelExtension, Model } from '@janhq/core' @@ -8,24 +8,23 @@ export function useGetConfiguredModels() { const [loading, setLoading] = useState(false) const [models, setModels] = useState([]) - const getConfiguredModels = async (): Promise => { - const models = await extensionManager - .get(ExtensionTypeEnum.Model) - ?.getConfiguredModels() - return models ?? [] - } - - async function fetchModels() { + const fetchModels = useCallback(async () => { setLoading(true) const models = await getConfiguredModels() setLoading(false) setModels(models) - } + }, []) useEffect(() => { fetchModels() - // eslint-disable-next-line react-hooks/exhaustive-deps - }, []) + }, [fetchModels]) return { loading, models } } + +const getConfiguredModels = async (): Promise => { + const models = await extensionManager + .get(ExtensionTypeEnum.Model) + ?.getConfiguredModels() + return models ?? [] +} diff --git a/web/screens/Chat/MessageToolbar/index.tsx b/web/screens/Chat/MessageToolbar/index.tsx index 183eae814..dfa8d63c6 100644 --- a/web/screens/Chat/MessageToolbar/index.tsx +++ b/web/screens/Chat/MessageToolbar/index.tsx @@ -3,8 +3,8 @@ import { ExtensionTypeEnum, ThreadMessage, ChatCompletionRole, + ConversationalExtension, } from '@janhq/core' -import { ConversationalExtension } from '@janhq/core' import { useAtomValue, useSetAtom } from 'jotai' import { RefreshCcw, CopyIcon, Trash2Icon, CheckIcon } from 'lucide-react' From b15650269e406d9119bc10d24993bc5e7202c1cf Mon Sep 17 00:00:00 2001 From: Service Account Date: Fri, 26 Jan 2024 05:35:57 +0000 Subject: [PATCH 19/65] janhq/jan: Update README.md with nightly build artifact URL --- README.md | 10 +++++----- 1 file changed, 5 insertions(+), 5 deletions(-) diff --git a/README.md b/README.md index 770b88266..20f7e4f34 100644 --- a/README.md +++ b/README.md @@ -76,31 +76,31 @@ Jan is an open-source ChatGPT alternative that runs 100% offline on your compute Experimental (Nightly Build) - + jan.exe - + Intel - + M1/M2 - + jan.deb - + jan.AppImage From 2d96b69fdc47bdc11c10f237662671cf84f835d2 Mon Sep 17 00:00:00 2001 From: Service Account Date: Fri, 26 Jan 2024 06:02:39 +0000 Subject: [PATCH 20/65] janhq/jan: Update README.md with nightly build artifact URL --- README.md | 10 +++++----- 1 file changed, 5 insertions(+), 5 deletions(-) diff --git a/README.md b/README.md index 20f7e4f34..68035beca 100644 --- a/README.md +++ b/README.md @@ -76,31 +76,31 @@ Jan is an open-source ChatGPT alternative that runs 100% offline on your compute Experimental (Nightly Build) - + jan.exe - + Intel - + M1/M2 - + jan.deb - + jan.AppImage From c4d56362e2bc2e2157cc119268a15d79360e6647 Mon Sep 17 00:00:00 2001 From: Service Account Date: Fri, 26 Jan 2024 06:05:46 +0000 Subject: [PATCH 21/65] janhq/jan: Update README.md with nightly build artifact URL --- README.md | 10 +++++----- 1 file changed, 5 insertions(+), 5 deletions(-) diff --git a/README.md b/README.md index 68035beca..36e8a171f 100644 --- a/README.md +++ b/README.md @@ -76,31 +76,31 @@ Jan is an open-source ChatGPT alternative that runs 100% offline on your compute Experimental (Nightly Build) - + jan.exe - + Intel - + M1/M2 - + jan.deb - + jan.AppImage From 
ba07f92636f39ef82646d19a638c605d47c85246 Mon Sep 17 00:00:00 2001 From: Service Account Date: Fri, 26 Jan 2024 07:58:45 +0000 Subject: [PATCH 22/65] janhq/jan: Update README.md with nightly build artifact URL --- README.md | 10 +++++----- 1 file changed, 5 insertions(+), 5 deletions(-) diff --git a/README.md b/README.md index 36e8a171f..d7397a8da 100644 --- a/README.md +++ b/README.md @@ -76,31 +76,31 @@ Jan is an open-source ChatGPT alternative that runs 100% offline on your compute Experimental (Nightly Build) - + jan.exe - + Intel - + M1/M2 - + jan.deb - + jan.AppImage From 8bd539aac518277e8bf07e3dda20e76ff5e25736 Mon Sep 17 00:00:00 2001 From: Service Account Date: Fri, 26 Jan 2024 12:13:58 +0000 Subject: [PATCH 23/65] janhq/jan: Update README.md with nightly build artifact URL --- README.md | 10 +++++----- 1 file changed, 5 insertions(+), 5 deletions(-) diff --git a/README.md b/README.md index d7397a8da..e20fb5dbe 100644 --- a/README.md +++ b/README.md @@ -76,31 +76,31 @@ Jan is an open-source ChatGPT alternative that runs 100% offline on your compute Experimental (Nightly Build) - + jan.exe - + Intel - + M1/M2 - + jan.deb - + jan.AppImage From 38f757dd4d8a3463f0a53f8dcd5437681b16a7b9 Mon Sep 17 00:00:00 2001 From: Service Account Date: Fri, 26 Jan 2024 13:26:21 +0000 Subject: [PATCH 24/65] janhq/jan: Update README.md with nightly build artifact URL --- README.md | 10 +++++----- 1 file changed, 5 insertions(+), 5 deletions(-) diff --git a/README.md b/README.md index e20fb5dbe..f5ce84e70 100644 --- a/README.md +++ b/README.md @@ -76,31 +76,31 @@ Jan is an open-source ChatGPT alternative that runs 100% offline on your compute Experimental (Nightly Build) - + jan.exe - + Intel - + M1/M2 - + jan.deb - + jan.AppImage From 28e4405498c5de9558b1e39d890b17aa6689c42a Mon Sep 17 00:00:00 2001 From: hiro Date: Tue, 19 Dec 2023 23:33:27 +0700 Subject: [PATCH 25/65] feat: support RAG chore: Update new model.json with multiple binaries feat: Add updates for handling multiple model binaries chore: jan can see Update Model.json (#1005) * add(mixtral): add model.json for mixtral * archived some models + update the model.json * add(model): add pandora 10.7b * fix(model): update description * fix(model): pump vers and change the featured model to trinity * fix(model): archive neuralchat * fix(model): decapriated all old models * fix(trinity): add cover image and change description * fix(trinity): update cover png * add(pandora): cover image * fix(pandora): cover image * add(mixtral): add model.json for mixtral * archived some models + update the model.json * add(model): add pandora 10.7b * fix(model): update description * fix(model): pump vers and change the featured model to trinity * fix(model): archive neuralchat * fix(model): decapriated all old models * fix(trinity): add cover image and change description * fix(trinity): update cover png * add(pandora): cover image * fix(pandora): cover image * chore: model desc nits * fix(models): adjust the size for solars and pandoras * add(mixtral): description --------- Co-authored-by: 0xSage chore: reformat model.json and use new template fix(Model): download/abort model (#1163) * fix(Model): download/abort model * fix: image preview Signed-off-by: James --------- Signed-off-by: James Co-authored-by: James Co-authored-by: Louis add preview and reduce time re-render all chat screen Signed-off-by: James store files under thread_id/files Signed-off-by: James fix: Update llava 1.5 size fix: Nitro extension path resolver feat: Add upload preview clearance chore: 
Update FileType to multiple targets fix: delete file preview once new thread created chore: Add langchain import support storing pdf file Signed-off-by: James feat: add retrieval tool in node runtime fix: import module done Co-authored-by: Louis feat: Add type assistant tool chore: Add tool_retrieval_enabled to InferenceEngine chore: Add AssistantTool to thread entity chore: refactor tool retrieval base class feat: Add handler for assistant with rag enabled chore: Update inferenceEngine type properly chore: Update inferenceEngine type properly fix: Update retrieval tool chore: main entry correction refactor: tsconfig files chore: Update ModelRuntimeParams type refactor: Remove unused files fix: wip chore: remove unused console.log for FileUploadPreview fix: Update mapping correctly for engine and proxyEngine feat: Add proxyEngine to type ModelInfo fix: WIP with test route fix: Add bundleDependencies to package.json chore: remove conversational history memory fix: refactor data passing reafactor: remove unused code fix: Update module chore: export import correction fix conflict Signed-off-by: James fix: resolve after rebased fix: Update llava 1.5 model json feat: Add bakllava 1 model json refactor: node module export, ES syntax and langchain import fix: WIP fix: WIP fix: WIP fix: external module import fix: WIP Add UI attachment fot file upload Prepare Thumbnail UI image chore: rebase model folder to dev branch chore: remove multiple binaries related commits fix: remove multiple binaries related commits part 2 fix: Remove transformer.js related deps Fix truncate file name attachment remove unused code image preview attachment fix: remove multi binaries error chore: remove commented code for ModelArtifacts type Dropzone for drag and drop attachment Avoid conditional showing 0 using length fix symbol windows avoid undefined tools fix: add tool retrieval to true by default and disable the change chore: remove unused code fix: Enable nitro embedding by default fix: Update code WIP with nitro embedding chore: remove unused running function fix: assistant extension missing module feat: Retrieval ingest, query and reforward fix: Update hnswlib version conflict fix: Add tool settings fix: Update path to thread_id/memory fix: Add support for nitro embedding usage fix: RAG does not work with plain content message fix(Model): #1662 imported model does not use gpu (#1723) Signed-off-by: James Co-authored-by: James feat: allow users to update retrieval settings chore: pass thread assistant settings to assistant extensions chore: eslint fix fix bug border right panel showing in thread while not have active thread Update setting layout retrieval assistant Renaming file settingcomponent change default value in core extention add fake loader generate response fix conditional fake loader remove unused import Proper error message on file typr fix: loading indicator fix: chunk size and overlap constraint conditional drag and drop when retrieval off fix: enable retrieval middleware as soon as its tool is enabled fix: configure embedding engine according to request fix: Retrieval false by default fix: engine json chore: migrate assistant disabled collapse panel when retrieval or children null chore: remove unused log chore: Bump nitro version to 0.2.14 for batch embedding chore: remove unused console.log --- core/src/api/index.ts | 1 + core/src/fs.ts | 16 +- core/src/node/api/routes/fs.ts | 9 +- core/src/types/assistant/assistantEntity.ts | 9 +- core/src/types/inference/inferenceEntity.ts | 29 +- 
core/src/types/message/messageEntity.ts | 15 +- core/src/types/model/modelEntity.ts | 12 +- core/src/types/thread/index.ts | 1 + core/src/types/thread/threadEntity.ts | 2 + core/src/types/thread/threadEvent.ts | 4 + electron/handlers/fileManager.ts | 16 + electron/handlers/fs.ts | 8 +- extensions/assistant-extension/package.json | 28 +- .../assistant-extension/rollup.config.ts | 81 +++++ .../src/@types/global.d.ts | 4 +- extensions/assistant-extension/src/index.ts | 197 +++++++++++- .../assistant-extension/src/node/engine.ts | 13 + .../assistant-extension/src/node/index.ts | 39 +++ .../src/node/tools/retrieval/index.ts | 78 +++++ extensions/assistant-extension/tsconfig.json | 22 +- .../assistant-extension/webpack.config.js | 38 --- .../conversational-extension/src/index.ts | 56 +++- .../inference-nitro-extension/bin/version.txt | 2 +- .../inference-nitro-extension/package.json | 1 + .../inference-nitro-extension/src/index.ts | 14 +- .../src/node/index.ts | 23 +- .../inference-openai-extension/src/index.ts | 15 +- .../inference-openai-extension/tsconfig.json | 5 +- .../tsconfig.json | 5 +- web/containers/CardSidebar/index.tsx | 44 +-- web/containers/Checkbox/index.tsx | 50 +-- web/containers/Layout/TopBar/index.tsx | 18 +- web/containers/Loader/GenerateResponse.tsx | 39 +++ web/containers/ModelConfigInput/index.tsx | 51 +--- web/containers/Providers/EventHandler.tsx | 5 +- web/containers/Providers/Jotai.tsx | 8 + web/containers/Shortcut/index.tsx | 2 +- web/containers/SliderRightPanel/index.tsx | 58 +--- web/helpers/atoms/ChatMessage.atom.ts | 2 + web/hooks/useCreateNewThread.ts | 10 +- web/hooks/usePath.ts | 17 ++ web/hooks/useSendChatMessage.ts | 100 +++++- web/hooks/useSetActiveThread.ts | 2 + web/next.config.js | 3 - web/package.json | 2 + web/screens/Chat/AssistantSetting/index.tsx | 78 +++++ web/screens/Chat/ChatBody/index.tsx | 24 +- web/screens/Chat/ChatInput/index.tsx | 254 ++++++++++++++++ web/screens/Chat/EngineSetting/index.tsx | 17 +- web/screens/Chat/FileUploadPreview/Icon.tsx | 95 ++++++ web/screens/Chat/FileUploadPreview/index.tsx | 47 +++ web/screens/Chat/ImageUploadPreview/index.tsx | 54 ++++ .../Chat/MessageQueuedBanner/index.tsx | 19 ++ ...ponentBuilder.tsx => SettingComponent.tsx} | 73 ++++- web/screens/Chat/ModelSetting/index.tsx | 7 +- .../Chat/ModelSetting/predefinedComponent.ts | 50 ++- .../Chat/RequestDownloadModel/index.tsx | 42 +++ web/screens/Chat/Sidebar/index.tsx | 108 +++++-- web/screens/Chat/SimpleTextMessage/index.tsx | 114 +++++-- web/screens/Chat/ThreadList/index.tsx | 1 + web/screens/Chat/index.tsx | 286 +++++++++--------- .../ExploreModelItemHeader/index.tsx | 2 + web/screens/LocalServer/index.tsx | 10 +- web/tsconfig.json | 10 +- web/types/index.d.ts | 1 - web/utils/base64.ts | 9 + web/utils/componentSettings.ts | 25 +- web/utils/modelParam.ts | 4 +- 68 files changed, 1959 insertions(+), 525 deletions(-) create mode 100644 core/src/types/thread/threadEvent.ts create mode 100644 extensions/assistant-extension/rollup.config.ts create mode 100644 extensions/assistant-extension/src/node/engine.ts create mode 100644 extensions/assistant-extension/src/node/index.ts create mode 100644 extensions/assistant-extension/src/node/tools/retrieval/index.ts delete mode 100644 extensions/assistant-extension/webpack.config.js create mode 100644 web/containers/Loader/GenerateResponse.tsx create mode 100644 web/screens/Chat/AssistantSetting/index.tsx create mode 100644 web/screens/Chat/ChatInput/index.tsx create mode 100644 web/screens/Chat/FileUploadPreview/Icon.tsx 
create mode 100644 web/screens/Chat/FileUploadPreview/index.tsx create mode 100644 web/screens/Chat/ImageUploadPreview/index.tsx create mode 100644 web/screens/Chat/MessageQueuedBanner/index.tsx rename web/screens/Chat/ModelSetting/{settingComponentBuilder.tsx => SettingComponent.tsx} (50%) create mode 100644 web/screens/Chat/RequestDownloadModel/index.tsx create mode 100644 web/utils/base64.ts diff --git a/core/src/api/index.ts b/core/src/api/index.ts index a3d0361e7..a232c4090 100644 --- a/core/src/api/index.ts +++ b/core/src/api/index.ts @@ -62,6 +62,7 @@ export enum FileManagerRoute { getJanDataFolderPath = 'getJanDataFolderPath', getResourcePath = 'getResourcePath', fileStat = 'fileStat', + writeBlob = 'writeBlob', } export type ApiFunction = (...args: any[]) => any diff --git a/core/src/fs.ts b/core/src/fs.ts index ea636977a..0e570d1f5 100644 --- a/core/src/fs.ts +++ b/core/src/fs.ts @@ -1,4 +1,4 @@ -import { FileStat } from "./types" +import { FileStat } from './types' /** * Writes data to a file at the specified path. @@ -6,6 +6,15 @@ import { FileStat } from "./types" */ const writeFileSync = (...args: any[]) => global.core.api?.writeFileSync(...args) +/** + * Writes blob data to a file at the specified path. + * @param path - The path to file. + * @param data - The blob data. + * @returns + */ +const writeBlob: (path: string, data: string) => Promise = (path, data) => + global.core.api?.writeBlob(path, data) + /** * Reads the contents of a file at the specified path. * @returns {Promise} A Promise that resolves with the contents of the file. @@ -60,7 +69,6 @@ const syncFile: (src: string, dest: string) => Promise = (src, dest) => */ const copyFileSync = (...args: any[]) => global.core.api?.copyFileSync(...args) - /** * Gets the file's stats. * @@ -70,7 +78,6 @@ const copyFileSync = (...args: any[]) => global.core.api?.copyFileSync(...args) const fileStat: (path: string) => Promise = (path) => global.core.api?.fileStat(path) - // TODO: Export `dummy` fs functions automatically // Currently adding these manually export const fs = { @@ -84,5 +91,6 @@ export const fs = { appendFileSync, copyFileSync, syncFile, - fileStat + fileStat, + writeBlob, } diff --git a/core/src/node/api/routes/fs.ts b/core/src/node/api/routes/fs.ts index 5f511af27..c5404ccce 100644 --- a/core/src/node/api/routes/fs.ts +++ b/core/src/node/api/routes/fs.ts @@ -2,6 +2,7 @@ import { FileSystemRoute } from '../../../api' import { join } from 'path' import { HttpServer } from '../HttpServer' import { getJanDataFolderPath } from '../../utils' +import { normalizeFilePath } from '../../path' export const fsRouter = async (app: HttpServer) => { const moduleName = 'fs' @@ -13,10 +14,10 @@ export const fsRouter = async (app: HttpServer) => { const result = await import(moduleName).then((mdl) => { return mdl[route]( ...body.map((arg: any) => - typeof arg === 'string' && arg.includes('file:/') - ? join(getJanDataFolderPath(), arg.replace('file:/', '')) - : arg, - ), + typeof arg === 'string' && (arg.startsWith(`file:/`) || arg.startsWith(`file:\\`)) + ? join(getJanDataFolderPath(), normalizeFilePath(arg)) + : arg + ) ) }) res.status(200).send(result) diff --git a/core/src/types/assistant/assistantEntity.ts b/core/src/types/assistant/assistantEntity.ts index 91bb2bb22..733dbea8d 100644 --- a/core/src/types/assistant/assistantEntity.ts +++ b/core/src/types/assistant/assistantEntity.ts @@ -2,6 +2,13 @@ * Assistant type defines the shape of an assistant object. 
* @stored */ + +export type AssistantTool = { + type: string + enabled: boolean + settings: any +} + export type Assistant = { /** Represents the avatar of the user. */ avatar: string @@ -22,7 +29,7 @@ export type Assistant = { /** Represents the instructions for the object. */ instructions?: string /** Represents the tools associated with the object. */ - tools?: any + tools?: AssistantTool[] /** Represents the file identifiers associated with the object. */ file_ids: string[] /** Represents the metadata of the object. */ diff --git a/core/src/types/inference/inferenceEntity.ts b/core/src/types/inference/inferenceEntity.ts index 58b838ae7..c37e3b079 100644 --- a/core/src/types/inference/inferenceEntity.ts +++ b/core/src/types/inference/inferenceEntity.ts @@ -1,3 +1,5 @@ +import { ContentType, ContentValue } from '../message' + /** * The role of the author of this message. */ @@ -13,7 +15,32 @@ export enum ChatCompletionRole { */ export type ChatCompletionMessage = { /** The contents of the message. **/ - content?: string + content?: ChatCompletionMessageContent /** The role of the author of this message. **/ role: ChatCompletionRole } + +export type ChatCompletionMessageContent = + | string + | (ChatCompletionMessageContentText & + ChatCompletionMessageContentImage & + ChatCompletionMessageContentDoc)[] + +export enum ChatCompletionMessageContentType { + Text = 'text', + Image = 'image_url', + Doc = 'doc_url', +} + +export type ChatCompletionMessageContentText = { + type: ChatCompletionMessageContentType + text: string +} +export type ChatCompletionMessageContentImage = { + type: ChatCompletionMessageContentType + image_url: { url: string } +} +export type ChatCompletionMessageContentDoc = { + type: ChatCompletionMessageContentType + doc_url: { url: string } +} diff --git a/core/src/types/message/messageEntity.ts b/core/src/types/message/messageEntity.ts index 199743796..87e4b1997 100644 --- a/core/src/types/message/messageEntity.ts +++ b/core/src/types/message/messageEntity.ts @@ -1,5 +1,6 @@ import { ChatCompletionMessage, ChatCompletionRole } from '../inference' import { ModelInfo } from '../model' +import { Thread } from '../thread' /** * The `ThreadMessage` type defines the shape of a thread's message object. @@ -35,7 +36,10 @@ export type ThreadMessage = { export type MessageRequest = { id?: string - /** The thread id of the message request. **/ + /** + * @deprecated Use thread object instead + * The thread id of the message request. + */ threadId: string /** @@ -48,6 +52,10 @@ export type MessageRequest = { /** Settings for constructing a chat completion request **/ model?: ModelInfo + + /** The thread of this message is belong to. **/ + // TODO: deprecate threadId field + thread?: Thread } /** @@ -62,7 +70,7 @@ export enum MessageStatus { /** Message loaded with error. 
**/ Error = 'error', /** Message is cancelled streaming */ - Stopped = "stopped" + Stopped = 'stopped', } /** @@ -71,6 +79,7 @@ export enum MessageStatus { export enum ContentType { Text = 'text', Image = 'image', + Pdf = 'pdf', } /** @@ -80,6 +89,8 @@ export enum ContentType { export type ContentValue = { value: string annotations: string[] + name?: string + size?: number } /** diff --git a/core/src/types/model/modelEntity.ts b/core/src/types/model/modelEntity.ts index c60ab7650..727ff085f 100644 --- a/core/src/types/model/modelEntity.ts +++ b/core/src/types/model/modelEntity.ts @@ -7,6 +7,7 @@ export type ModelInfo = { settings: ModelSettingParams parameters: ModelRuntimeParams engine?: InferenceEngine + proxyEngine?: InferenceEngine } /** @@ -18,7 +19,8 @@ export enum InferenceEngine { nitro = 'nitro', openai = 'openai', triton_trtllm = 'triton_trtllm', - hf_endpoint = 'hf_endpoint', + + tool_retrieval_enabled = 'tool_retrieval_enabled', } export type ModelArtifact = { @@ -90,6 +92,13 @@ export type Model = { * The model engine. */ engine: InferenceEngine + + proxyEngine?: InferenceEngine + + /** + * Is multimodal or not. + */ + visionModel?: boolean } export type ModelMetadata = { @@ -129,4 +138,5 @@ export type ModelRuntimeParams = { stop?: string[] frequency_penalty?: number presence_penalty?: number + engine?: string } diff --git a/core/src/types/thread/index.ts b/core/src/types/thread/index.ts index c6ff6204a..32155e1cd 100644 --- a/core/src/types/thread/index.ts +++ b/core/src/types/thread/index.ts @@ -1,2 +1,3 @@ export * from './threadEntity' export * from './threadInterface' +export * from './threadEvent' diff --git a/core/src/types/thread/threadEntity.ts b/core/src/types/thread/threadEntity.ts index 4ff3aa1fc..37136eae6 100644 --- a/core/src/types/thread/threadEntity.ts +++ b/core/src/types/thread/threadEntity.ts @@ -1,3 +1,4 @@ +import { AssistantTool } from '../assistant' import { ModelInfo } from '../model' /** @@ -30,6 +31,7 @@ export type ThreadAssistantInfo = { assistant_name: string model: ModelInfo instructions?: string + tools?: AssistantTool[] } /** diff --git a/core/src/types/thread/threadEvent.ts b/core/src/types/thread/threadEvent.ts new file mode 100644 index 000000000..4b19b09c1 --- /dev/null +++ b/core/src/types/thread/threadEvent.ts @@ -0,0 +1,4 @@ +export enum ThreadEvent { + /** The `OnThreadStarted` event is emitted when a thread is started. 
*/ + OnThreadStarted = 'OnThreadStarted', +} diff --git a/electron/handlers/fileManager.ts b/electron/handlers/fileManager.ts index f41286934..2528aef71 100644 --- a/electron/handlers/fileManager.ts +++ b/electron/handlers/fileManager.ts @@ -59,4 +59,20 @@ export function handleFileMangerIPCs() { return fileStat } ) + + ipcMain.handle( + FileManagerRoute.writeBlob, + async (_event, path: string, data: string): Promise => { + try { + const normalizedPath = normalizeFilePath(path) + const dataBuffer = Buffer.from(data, 'base64') + fs.writeFileSync( + join(getJanDataFolderPath(), normalizedPath), + dataBuffer + ) + } catch (err) { + console.error(`writeFile ${path} result: ${err}`) + } + } + ) } diff --git a/electron/handlers/fs.ts b/electron/handlers/fs.ts index 408a5fd10..34026b940 100644 --- a/electron/handlers/fs.ts +++ b/electron/handlers/fs.ts @@ -1,9 +1,9 @@ import { ipcMain } from 'electron' -import { FileSystemRoute } from '@janhq/core' -import { join } from 'path' import { getJanDataFolderPath, normalizeFilePath } from '@janhq/core/node' - +import fs from 'fs' +import { FileManagerRoute, FileSystemRoute } from '@janhq/core' +import { join } from 'path' /** * Handles file system operations. */ @@ -15,7 +15,7 @@ export function handleFsIPCs() { mdl[route]( ...args.map((arg) => typeof arg === 'string' && - (arg.includes(`file:/`) || arg.includes(`file:\\`)) + (arg.startsWith(`file:/`) || arg.startsWith(`file:\\`)) ? join(getJanDataFolderPath(), normalizeFilePath(arg)) : arg ) diff --git a/extensions/assistant-extension/package.json b/extensions/assistant-extension/package.json index 4e84aa573..f4e4dd825 100644 --- a/extensions/assistant-extension/package.json +++ b/extensions/assistant-extension/package.json @@ -3,26 +3,46 @@ "version": "1.0.0", "description": "This extension enables assistants, including Jan, a default assistant that can call all downloaded models", "main": "dist/index.js", - "module": "dist/module.js", + "node": "dist/node/index.js", "author": "Jan ", "license": "AGPL-3.0", "scripts": { - "build": "tsc -b . 
&& webpack --config webpack.config.js", + "build": "tsc --module commonjs && rollup -c rollup.config.ts", "build:publish": "rimraf *.tgz --glob && npm run build && npm pack && cpx *.tgz ../../electron/pre-install" }, "devDependencies": { + "@rollup/plugin-commonjs": "^25.0.7", + "@rollup/plugin-json": "^6.1.0", + "@rollup/plugin-node-resolve": "^15.2.3", + "@rollup/plugin-replace": "^5.0.5", + "@types/pdf-parse": "^1.1.4", + "cpx": "^1.5.0", "rimraf": "^3.0.2", - "webpack": "^5.88.2", - "webpack-cli": "^5.1.4" + "rollup": "^2.38.5", + "rollup-plugin-define": "^1.0.1", + "rollup-plugin-sourcemaps": "^0.6.3", + "rollup-plugin-typescript2": "^0.36.0", + "typescript": "^5.3.3" }, "dependencies": { "@janhq/core": "file:../../core", + "@langchain/community": "0.0.13", + "hnswlib-node": "^1.4.2", + "langchain": "^0.0.214", "path-browserify": "^1.0.1", + "pdf-parse": "^1.1.1", "ts-loader": "^9.5.0" }, "files": [ "dist/*", "package.json", "README.md" + ], + "bundleDependencies": [ + "@janhq/core", + "@langchain/community", + "hnswlib-node", + "langchain", + "pdf-parse" ] } diff --git a/extensions/assistant-extension/rollup.config.ts b/extensions/assistant-extension/rollup.config.ts new file mode 100644 index 000000000..7916ef9c8 --- /dev/null +++ b/extensions/assistant-extension/rollup.config.ts @@ -0,0 +1,81 @@ +import resolve from "@rollup/plugin-node-resolve"; +import commonjs from "@rollup/plugin-commonjs"; +import sourceMaps from "rollup-plugin-sourcemaps"; +import typescript from "rollup-plugin-typescript2"; +import json from "@rollup/plugin-json"; +import replace from "@rollup/plugin-replace"; + +const packageJson = require("./package.json"); + +const pkg = require("./package.json"); + +export default [ + { + input: `src/index.ts`, + output: [{ file: pkg.main, format: "es", sourcemap: true }], + // Indicate here external modules you don't wanna include in your bundle (i.e.: 'lodash') + external: [], + watch: { + include: "src/**", + }, + plugins: [ + replace({ + NODE: JSON.stringify(`${packageJson.name}/${packageJson.node}`), + EXTENSION_NAME: JSON.stringify(packageJson.name), + VERSION: JSON.stringify(packageJson.version), + }), + // Allow json resolution + json(), + // Compile TypeScript files + typescript({ useTsconfigDeclarationDir: true }), + // Compile TypeScript files + // Allow bundling cjs modules (unlike webpack, rollup doesn't understand cjs) + commonjs(), + // Allow node_modules resolution, so you can use 'external' to control + // which external modules to include in the bundle + // https://github.com/rollup/rollup-plugin-node-resolve#usage + resolve({ + extensions: [".js", ".ts", ".svelte"], + }), + + // Resolve source maps to the original source + sourceMaps(), + ], + }, + { + input: `src/node/index.ts`, + output: [{ dir: "dist/node", format: "cjs", sourcemap: false }], + // Indicate here external modules you don't wanna include in your bundle (i.e.: 'lodash') + external: [ + "@janhq/core/node", + "@langchain/community", + "langchain", + "langsmith", + "path", + "hnswlib-node", + ], + watch: { + include: "src/node/**", + }, + // inlineDynamicImports: true, + plugins: [ + // Allow json resolution + json(), + // Compile TypeScript files + typescript({ useTsconfigDeclarationDir: true }), + // Allow bundling cjs modules (unlike webpack, rollup doesn't understand cjs) + commonjs({ + ignoreDynamicRequires: true, + }), + // Allow node_modules resolution, so you can use 'external' to control + // which external modules to include in the bundle + // 
https://github.com/rollup/rollup-plugin-node-resolve#usage + resolve({ + extensions: [".ts", ".js", ".json"], + }), + + // Resolve source maps to the original source + // sourceMaps(), + ], + }, +]; diff --git a/extensions/assistant-extension/src/@types/global.d.ts b/extensions/assistant-extension/src/@types/global.d.ts index 3b45ccc5a..dc11709a4 100644 --- a/extensions/assistant-extension/src/@types/global.d.ts +++ b/extensions/assistant-extension/src/@types/global.d.ts @@ -1 +1,3 @@ -declare const MODULE: string; +declare const NODE: string; +declare const EXTENSION_NAME: string; +declare const VERSION: string; diff --git a/extensions/assistant-extension/src/index.ts b/extensions/assistant-extension/src/index.ts index 098ab1f54..6495ea786 100644 --- a/extensions/assistant-extension/src/index.ts +++ b/extensions/assistant-extension/src/index.ts @@ -1,15 +1,151 @@ -import { fs, Assistant, AssistantExtension } from "@janhq/core"; -import { join } from "path"; +import { + fs, + Assistant, + MessageRequest, + events, + InferenceEngine, + MessageEvent, + InferenceEvent, + joinPath, + executeOnMain, + AssistantExtension, +} from "@janhq/core"; export default class JanAssistantExtension extends AssistantExtension { private static readonly _homeDir = "file://assistants"; + controller = new AbortController(); + isCancelled = false; + retrievalThreadId: string | undefined = undefined; + async onLoad() { // making the assistant directory - if (!(await fs.existsSync(JanAssistantExtension._homeDir))) - fs.mkdirSync(JanAssistantExtension._homeDir).then(() => { - this.createJanAssistant(); - }); + const assistantDirExist = await fs.existsSync( + JanAssistantExtension._homeDir, + ); + if ( + localStorage.getItem(`${EXTENSION_NAME}-version`) !== VERSION || + !assistantDirExist + ) { + if (!assistantDirExist) + await fs.mkdirSync(JanAssistantExtension._homeDir); + + // Write assistant metadata + this.createJanAssistant(); + // Finished migration + localStorage.setItem(`${EXTENSION_NAME}-version`, VERSION); + } + + // Events subscription + events.on(MessageEvent.OnMessageSent, (data: MessageRequest) => + JanAssistantExtension.handleMessageRequest(data, this), + ); + + events.on(InferenceEvent.OnInferenceStopped, () => { + JanAssistantExtension.handleInferenceStopped(this); + }); + } + + private static async handleInferenceStopped(instance: JanAssistantExtension) { + instance.isCancelled = true; + instance.controller?.abort(); + } + + private static async handleMessageRequest( + data: MessageRequest, + instance: JanAssistantExtension, + ) { + instance.isCancelled = false; + instance.controller = new AbortController(); + + if ( + data.model?.engine !== InferenceEngine.tool_retrieval_enabled || + !data.messages || + !data.thread?.assistants[0]?.tools + ) { + return; + } + + const latestMessage = data.messages[data.messages.length - 1]; + + // Ingest the document if needed + if ( + latestMessage && + latestMessage.content && + typeof latestMessage.content !== "string" + ) { + const docFile = latestMessage.content[1]?.doc_url?.url; + if (docFile) { + await executeOnMain( + NODE, + "toolRetrievalIngestNewDocument", + docFile, + data.model?.proxyEngine, + ); + } + } + + // Load agent on thread changed + if (instance.retrievalThreadId !== data.threadId) { + await executeOnMain(NODE, "toolRetrievalLoadThreadMemory", data.threadId); + + instance.retrievalThreadId = data.threadId; + + // Update the text splitter + await executeOnMain( + NODE, + "toolRetrievalUpdateTextSplitter", + 
data.thread.assistants[0].tools[0]?.settings?.chunk_size ?? 4000, + data.thread.assistants[0].tools[0]?.settings?.chunk_overlap ?? 200, + ); + } + + if (latestMessage.content) { + const prompt = + typeof latestMessage.content === "string" + ? latestMessage.content + : latestMessage.content[0].text; + // Retrieve the result + console.debug("toolRetrievalQuery", latestMessage.content); + const retrievalResult = await executeOnMain( + NODE, + "toolRetrievalQueryResult", + prompt, + ); + + // Update the message content + // Using the retrieval template with the result and query + if (data.thread?.assistants[0].tools) + data.messages[data.messages.length - 1].content = + data.thread.assistants[0].tools[0].settings?.retrieval_template + ?.replace("{CONTEXT}", retrievalResult) + .replace("{QUESTION}", prompt); + } + + // Filter out all the messages that are not text + data.messages = data.messages.map((message) => { + if ( + message.content && + typeof message.content !== "string" && + (message.content.length ?? 0) > 0 + ) { + return { + ...message, + content: [message.content[0]], + }; + } + return message; + }); + + // Reroute the result to inference engine + const output = { + ...data, + model: { + ...data.model, + engine: data.model.proxyEngine, + }, + }; + events.emit(MessageEvent.OnMessageSent, output); } /** @@ -18,15 +154,21 @@ export default class JanAssistantExtension extends AssistantExtension { onUnload(): void {} async createAssistant(assistant: Assistant): Promise { - const assistantDir = join(JanAssistantExtension._homeDir, assistant.id); + const assistantDir = await joinPath([ + JanAssistantExtension._homeDir, + assistant.id, + ]); if (!(await fs.existsSync(assistantDir))) await fs.mkdirSync(assistantDir); // store the assistant metadata json - const assistantMetadataPath = join(assistantDir, "assistant.json"); + const assistantMetadataPath = await joinPath([ + assistantDir, + "assistant.json", + ]); try { await fs.writeFileSync( assistantMetadataPath, - JSON.stringify(assistant, null, 2) + JSON.stringify(assistant, null, 2), ); } catch (err) { console.error(err); @@ -38,14 +180,17 @@ export default class JanAssistantExtension extends AssistantExtension { // get all the assistant metadata json const results: Assistant[] = []; const allFileName: string[] = await fs.readdirSync( - JanAssistantExtension._homeDir + JanAssistantExtension._homeDir, ); for (const fileName of allFileName) { - const filePath = join(JanAssistantExtension._homeDir, fileName); + const filePath = await joinPath([ + JanAssistantExtension._homeDir, + fileName, + ]); if (filePath.includes(".DS_Store")) continue; const jsonFiles: string[] = (await fs.readdirSync(filePath)).filter( - (file: string) => file === "assistant.json" + (file: string) => file === "assistant.json", ); if (jsonFiles.length !== 1) { @@ -54,8 +199,8 @@ export default class JanAssistantExtension extends AssistantExtension { } const content = await fs.readFileSync( - join(filePath, jsonFiles[0]), - "utf-8" + await joinPath([filePath, jsonFiles[0]]), + "utf-8", ); const assistant: Assistant = typeof content === "object" ? 
content : JSON.parse(content); @@ -72,7 +217,10 @@ export default class JanAssistantExtension extends AssistantExtension { } // remove the directory - const assistantDir = join(JanAssistantExtension._homeDir, assistant.id); + const assistantDir = await joinPath([ + JanAssistantExtension._homeDir, + assistant.id, + ]); await fs.rmdirSync(assistantDir); return Promise.resolve(); } @@ -88,7 +236,24 @@ export default class JanAssistantExtension extends AssistantExtension { description: "A default assistant that can use all downloaded models", model: "*", instructions: "", - tools: undefined, + tools: [ + { + type: "retrieval", + enabled: false, + settings: { + top_k: 2, + chunk_size: 1024, + chunk_overlap: 64, + retrieval_template: `Use the following pieces of context to answer the question at the end. If you don't know the answer, just say that you don't know, don't try to make up an answer. + ---------------- + CONTEXT: {CONTEXT} + ---------------- + QUESTION: {QUESTION} + ---------------- + Helpful Answer:`, + }, + }, + ], file_ids: [], metadata: undefined, }; diff --git a/extensions/assistant-extension/src/node/engine.ts b/extensions/assistant-extension/src/node/engine.ts new file mode 100644 index 000000000..54b2a6ba1 --- /dev/null +++ b/extensions/assistant-extension/src/node/engine.ts @@ -0,0 +1,13 @@ +import fs from "fs"; +import path from "path"; +import { getJanDataFolderPath } from "@janhq/core/node"; + +// Sec: Do not send engine settings over requests +// Read it manually instead +export const readEmbeddingEngine = (engineName: string) => { + const engineSettings = fs.readFileSync( + path.join(getJanDataFolderPath(), "engines", `${engineName}.json`), + "utf-8", + ); + return JSON.parse(engineSettings); +}; diff --git a/extensions/assistant-extension/src/node/index.ts b/extensions/assistant-extension/src/node/index.ts new file mode 100644 index 000000000..95a7243a4 --- /dev/null +++ b/extensions/assistant-extension/src/node/index.ts @@ -0,0 +1,39 @@ +import { getJanDataFolderPath, normalizeFilePath } from "@janhq/core/node"; +import { Retrieval } from "./tools/retrieval"; +import path from "path"; + +const retrieval = new Retrieval(); + +export async function toolRetrievalUpdateTextSplitter( + chunkSize: number, + chunkOverlap: number, +) { + retrieval.updateTextSplitter(chunkSize, chunkOverlap); + return Promise.resolve(); +} +export async function toolRetrievalIngestNewDocument( + file: string, + engine: string, +) { + const filePath = path.join(getJanDataFolderPath(), normalizeFilePath(file)); + const threadPath = path.dirname(filePath.replace("files", "")); + retrieval.updateEmbeddingEngine(engine); + await retrieval.ingestAgentKnowledge(filePath, `${threadPath}/memory`); + return Promise.resolve(); +} + +export async function toolRetrievalLoadThreadMemory(threadId: string) { + try { + await retrieval.loadRetrievalAgent( + path.join(getJanDataFolderPath(), "threads", threadId, "memory"), + ); + return Promise.resolve(); + } catch (err) { + console.debug(err); + } +} + +export async function toolRetrievalQueryResult(query: string) { + const res = await retrieval.generateResult(query); + return Promise.resolve(res); +} diff --git a/extensions/assistant-extension/src/node/tools/retrieval/index.ts b/extensions/assistant-extension/src/node/tools/retrieval/index.ts new file mode 100644 index 000000000..f9d5c4029 --- /dev/null +++ b/extensions/assistant-extension/src/node/tools/retrieval/index.ts @@ -0,0 +1,78 @@ +import { RecursiveCharacterTextSplitter } from 
"langchain/text_splitter"; +import { formatDocumentsAsString } from "langchain/util/document"; +import { PDFLoader } from "langchain/document_loaders/fs/pdf"; + +import { HNSWLib } from "langchain/vectorstores/hnswlib"; + +import { OpenAIEmbeddings } from "langchain/embeddings/openai"; +import { readEmbeddingEngine } from "../../engine"; + +export class Retrieval { + public chunkSize: number = 100; + public chunkOverlap?: number = 0; + private retriever: any; + + private embeddingModel: any = undefined; + private textSplitter?: RecursiveCharacterTextSplitter; + + constructor(chunkSize: number = 4000, chunkOverlap: number = 200) { + this.updateTextSplitter(chunkSize, chunkOverlap); + this.embeddingModel = new OpenAIEmbeddings({}); + } + + public updateTextSplitter(chunkSize: number, chunkOverlap: number): void { + this.chunkSize = chunkSize; + this.chunkOverlap = chunkOverlap; + this.textSplitter = new RecursiveCharacterTextSplitter({ + chunkSize: chunkSize, + chunkOverlap: chunkOverlap, + }); + } + + public updateEmbeddingEngine(engine: string): void { + // Engine settings are not compatible with the current embedding model params + // Switch case manually for now + const settings = readEmbeddingEngine(engine); + if (engine === "nitro") { + this.embeddingModel = new OpenAIEmbeddings( + { openAIApiKey: "nitro-embedding" }, + { basePath: "http://127.0.0.1:3928/v1" }, + ); + } else { + // Fallback to OpenAI Settings + this.embeddingModel = new OpenAIEmbeddings({ + configuration: { + apiKey: settings.api_key, + }, + }); + } + } + + public ingestAgentKnowledge = async ( + filePath: string, + memoryPath: string, + ): Promise => { + const loader = new PDFLoader(filePath, { + splitPages: true, + }); + const doc = await loader.load(); + const docs = await this.textSplitter!.splitDocuments(doc); + const vectorStore = await HNSWLib.fromDocuments(docs, this.embeddingModel); + return vectorStore.save(memoryPath); + }; + + public loadRetrievalAgent = async (memoryPath: string): Promise => { + const vectorStore = await HNSWLib.load(memoryPath, this.embeddingModel); + this.retriever = vectorStore.asRetriever(2); + return Promise.resolve(); + }; + + public generateResult = async (query: string): Promise => { + if (!this.retriever) { + return Promise.resolve(" "); + } + const relevantDocs = await this.retriever.getRelevantDocuments(query); + const serializedDoc = formatDocumentsAsString(relevantDocs); + return Promise.resolve(serializedDoc); + }; +} diff --git a/extensions/assistant-extension/tsconfig.json b/extensions/assistant-extension/tsconfig.json index 2477d58ce..d3794cace 100644 --- a/extensions/assistant-extension/tsconfig.json +++ b/extensions/assistant-extension/tsconfig.json @@ -1,14 +1,20 @@ { "compilerOptions": { - "target": "es2016", - "module": "ES6", "moduleResolution": "node", - "outDir": "./dist", - "esModuleInterop": true, - "forceConsistentCasingInFileNames": true, - "strict": false, + "target": "es5", + "module": "ES2020", + "lib": ["es2015", "es2016", "es2017", "dom"], + "strict": true, + "sourceMap": true, + "declaration": true, + "allowSyntheticDefaultImports": true, + "experimentalDecorators": true, + "emitDecoratorMetadata": true, + "declarationDir": "dist/types", + "outDir": "dist", + "importHelpers": true, + "typeRoots": ["node_modules/@types"], "skipLibCheck": true, - "rootDir": "./src" }, - "include": ["./src"] + "include": ["src"], } diff --git a/extensions/assistant-extension/webpack.config.js b/extensions/assistant-extension/webpack.config.js deleted file mode 100644 index 
74d16fc8e..000000000 --- a/extensions/assistant-extension/webpack.config.js +++ /dev/null @@ -1,38 +0,0 @@ -const path = require("path"); -const webpack = require("webpack"); -const packageJson = require("./package.json"); - -module.exports = { - experiments: { outputModule: true }, - entry: "./src/index.ts", // Adjust the entry point to match your project's main file - mode: "production", - module: { - rules: [ - { - test: /\.tsx?$/, - use: "ts-loader", - exclude: /node_modules/, - }, - ], - }, - output: { - filename: "index.js", // Adjust the output file name as needed - path: path.resolve(__dirname, "dist"), - library: { type: "module" }, // Specify ESM output format - }, - plugins: [ - new webpack.DefinePlugin({ - MODULE: JSON.stringify(`${packageJson.name}/${packageJson.module}`), - }), - ], - resolve: { - extensions: [".ts", ".js"], - fallback: { - path: require.resolve("path-browserify"), - }, - }, - optimization: { - minimize: false, - }, - // Add loaders and other configuration as needed for your project -}; diff --git a/extensions/conversational-extension/src/index.ts b/extensions/conversational-extension/src/index.ts index 66becb748..61f0fd0e9 100644 --- a/extensions/conversational-extension/src/index.ts +++ b/extensions/conversational-extension/src/index.ts @@ -4,15 +4,14 @@ import { ConversationalExtension, Thread, ThreadMessage, + events, } from '@janhq/core' /** * JSONConversationalExtension is a ConversationalExtension implementation that provides * functionality for managing threads. */ -export default class JSONConversationalExtension - extends ConversationalExtension -{ +export default class JSONConversationalExtension extends ConversationalExtension { private static readonly _homeDir = 'file://threads' private static readonly _threadInfoFileName = 'thread.json' private static readonly _threadMessagesFileName = 'messages.jsonl' @@ -119,6 +118,32 @@ export default class JSONConversationalExtension ]) if (!(await fs.existsSync(threadDirPath))) await fs.mkdirSync(threadDirPath) + + if (message.content[0].type === 'image') { + const filesPath = await joinPath([threadDirPath, 'files']) + if (!(await fs.existsSync(filesPath))) await fs.mkdirSync(filesPath) + + const imagePath = await joinPath([filesPath, `${message.id}.png`]) + const base64 = message.content[0].text.annotations[0] + await this.storeImage(base64, imagePath) + // if (fs.existsSync(imagePath)) { + // message.content[0].text.annotations[0] = imagePath + // } + } + + if (message.content[0].type === 'pdf') { + const filesPath = await joinPath([threadDirPath, 'files']) + if (!(await fs.existsSync(filesPath))) await fs.mkdirSync(filesPath) + + const filePath = await joinPath([filesPath, `${message.id}.pdf`]) + const blob = message.content[0].text.annotations[0] + await this.storeFile(blob, filePath) + + if (await fs.existsSync(filePath)) { + // Use file path instead of blob + message.content[0].text.annotations[0] = `threads/${message.thread_id}/files/${message.id}.pdf` + } + } await fs.appendFileSync(threadMessagePath, JSON.stringify(message) + '\n') Promise.resolve() } catch (err) { @@ -126,6 +151,25 @@ export default class JSONConversationalExtension } } + async storeImage(base64: string, filePath: string): Promise { + const base64Data = base64.replace(/^data:image\/\w+;base64,/, '') + + try { + await fs.writeBlob(filePath, base64Data) + } catch (err) { + console.error(err) + } + } + + async storeFile(base64: string, filePath: string): Promise { + const base64Data = base64.replace(/^data:application\/pdf;base64,/, 
'') + try { + await fs.writeBlob(filePath, base64Data) + } catch (err) { + console.error(err) + } + } + async writeMessages( threadId: string, messages: ThreadMessage[] @@ -229,7 +273,11 @@ export default class JSONConversationalExtension const messages: ThreadMessage[] = [] result.forEach((line: string) => { - messages.push(JSON.parse(line) as ThreadMessage) + try { + messages.push(JSON.parse(line) as ThreadMessage) + } catch (err) { + console.error(err) + } }) return messages } catch (err) { diff --git a/extensions/inference-nitro-extension/bin/version.txt b/extensions/inference-nitro-extension/bin/version.txt index f2722b133..769ed6ae7 100644 --- a/extensions/inference-nitro-extension/bin/version.txt +++ b/extensions/inference-nitro-extension/bin/version.txt @@ -1 +1 @@ -0.2.12 +0.2.14 diff --git a/extensions/inference-nitro-extension/package.json b/extensions/inference-nitro-extension/package.json index 9379e194b..44727eb70 100644 --- a/extensions/inference-nitro-extension/package.json +++ b/extensions/inference-nitro-extension/package.json @@ -40,6 +40,7 @@ "dependencies": { "@janhq/core": "file:../../core", "@rollup/plugin-replace": "^5.0.5", + "@types/os-utils": "^0.0.4", "fetch-retry": "^5.0.6", "path-browserify": "^1.0.1", "rxjs": "^7.8.1", diff --git a/extensions/inference-nitro-extension/src/index.ts b/extensions/inference-nitro-extension/src/index.ts index 735383a61..0e6edb992 100644 --- a/extensions/inference-nitro-extension/src/index.ts +++ b/extensions/inference-nitro-extension/src/index.ts @@ -50,7 +50,7 @@ export default class JanInferenceNitroExtension extends InferenceExtension { ngl: 100, cpu_threads: 1, cont_batching: false, - embedding: false, + embedding: true, }; controller = new AbortController(); @@ -83,19 +83,19 @@ export default class JanInferenceNitroExtension extends InferenceExtension { // Events subscription events.on(MessageEvent.OnMessageSent, (data: MessageRequest) => - this.onMessageRequest(data) + this.onMessageRequest(data), ); events.on(ModelEvent.OnModelInit, (model: Model) => - this.onModelInit(model) + this.onModelInit(model), ); events.on(ModelEvent.OnModelStop, (model: Model) => - this.onModelStop(model) + this.onModelStop(model), ); events.on(InferenceEvent.OnInferenceStopped, () => - this.onInferenceStopped() + this.onInferenceStopped(), ); // Attempt to fetch nvidia info @@ -120,7 +120,7 @@ export default class JanInferenceNitroExtension extends InferenceExtension { } else { await fs.writeFileSync( engineFile, - JSON.stringify(this._engineSettings, null, 2) + JSON.stringify(this._engineSettings, null, 2), ); } } catch (err) { @@ -148,7 +148,7 @@ export default class JanInferenceNitroExtension extends InferenceExtension { this.getNitroProcesHealthIntervalId = setInterval( () => this.periodicallyGetNitroHealth(), - JanInferenceNitroExtension._intervalHealthCheck + JanInferenceNitroExtension._intervalHealthCheck, ); } diff --git a/extensions/inference-nitro-extension/src/node/index.ts b/extensions/inference-nitro-extension/src/node/index.ts index a75f33df2..77060e414 100644 --- a/extensions/inference-nitro-extension/src/node/index.ts +++ b/extensions/inference-nitro-extension/src/node/index.ts @@ -78,7 +78,7 @@ function stopModel(): Promise { * TODO: Should pass absolute of the model file instead of just the name - So we can modurize the module.ts to npm package */ async function runModel( - wrapper: ModelInitOptions + wrapper: ModelInitOptions, ): Promise { if (wrapper.model.engine !== InferenceEngine.nitro) { // Not a nitro model @@ -96,7 +96,7 
@@ async function runModel( const ggufBinFile = files.find( (file) => file === path.basename(currentModelFile) || - file.toLowerCase().includes(SUPPORTED_MODEL_FORMAT) + file.toLowerCase().includes(SUPPORTED_MODEL_FORMAT), ); if (!ggufBinFile) return Promise.reject("No GGUF model file found"); @@ -133,7 +133,6 @@ async function runModel( mmproj: path.join(modelFolderPath, wrapper.model.settings.mmproj), }), }; - console.log(currentSettings); return runNitroAndLoadModel(); } } @@ -192,10 +191,10 @@ function promptTemplateConverter(promptTemplate: string): PromptTemplate { const system_prompt = promptTemplate.substring(0, systemIndex); const user_prompt = promptTemplate.substring( systemIndex + systemMarker.length, - promptIndex + promptIndex, ); const ai_prompt = promptTemplate.substring( - promptIndex + promptMarker.length + promptIndex + promptMarker.length, ); // Return the split parts @@ -205,7 +204,7 @@ function promptTemplateConverter(promptTemplate: string): PromptTemplate { const promptIndex = promptTemplate.indexOf(promptMarker); const user_prompt = promptTemplate.substring(0, promptIndex); const ai_prompt = promptTemplate.substring( - promptIndex + promptMarker.length + promptIndex + promptMarker.length, ); // Return the split parts @@ -234,8 +233,8 @@ function loadLLMModel(settings: any): Promise { .then((res) => { log( `[NITRO]::Debug: Load model success with response ${JSON.stringify( - res - )}` + res, + )}`, ); return Promise.resolve(res); }) @@ -264,8 +263,8 @@ async function validateModelStatus(): Promise { }).then(async (res: Response) => { log( `[NITRO]::Debug: Validate model state success with response ${JSON.stringify( - res - )}` + res, + )}`, ); // If the response is OK, check model_loaded status. if (res.ok) { @@ -316,7 +315,7 @@ function spawnNitroProcess(): Promise { const args: string[] = ["1", LOCAL_HOST, PORT.toString()]; // Execute the binary log( - `[NITRO]::Debug: Spawn nitro at path: ${executableOptions.executablePath}, and args: ${args}` + `[NITRO]::Debug: Spawn nitro at path: ${executableOptions.executablePath}, and args: ${args}`, ); subprocess = spawn( executableOptions.executablePath, @@ -327,7 +326,7 @@ function spawnNitroProcess(): Promise { ...process.env, CUDA_VISIBLE_DEVICES: executableOptions.cudaVisibleDevices, }, - } + }, ); // Handle subprocess output diff --git a/extensions/inference-openai-extension/src/index.ts b/extensions/inference-openai-extension/src/index.ts index 54572041d..44525b631 100644 --- a/extensions/inference-openai-extension/src/index.ts +++ b/extensions/inference-openai-extension/src/index.ts @@ -15,6 +15,7 @@ import { ThreadMessage, events, fs, + InferenceEngine, BaseExtension, MessageEvent, ModelEvent, @@ -57,7 +58,7 @@ export default class JanInferenceOpenAIExtension extends BaseExtension { // Events subscription events.on(MessageEvent.OnMessageSent, (data) => - JanInferenceOpenAIExtension.handleMessageRequest(data, this) + JanInferenceOpenAIExtension.handleMessageRequest(data, this), ); events.on(ModelEvent.OnModelInit, (model: OpenAIModel) => { @@ -81,7 +82,7 @@ export default class JanInferenceOpenAIExtension extends BaseExtension { try { const engineFile = join( JanInferenceOpenAIExtension._homeDir, - JanInferenceOpenAIExtension._engineMetadataFileName + JanInferenceOpenAIExtension._engineMetadataFileName, ); if (await fs.existsSync(engineFile)) { const engine = await fs.readFileSync(engineFile, "utf-8"); @@ -90,7 +91,7 @@ export default class JanInferenceOpenAIExtension extends BaseExtension { } else { await 
fs.writeFileSync( engineFile, - JSON.stringify(JanInferenceOpenAIExtension._engineSettings, null, 2) + JSON.stringify(JanInferenceOpenAIExtension._engineSettings, null, 2), ); } } catch (err) { @@ -98,7 +99,7 @@ export default class JanInferenceOpenAIExtension extends BaseExtension { } } private static async handleModelInit(model: OpenAIModel) { - if (model.engine !== "openai") { + if (model.engine !== InferenceEngine.openai) { return; } else { JanInferenceOpenAIExtension._currentModel = model; @@ -116,7 +117,7 @@ export default class JanInferenceOpenAIExtension extends BaseExtension { } private static async handleInferenceStopped( - instance: JanInferenceOpenAIExtension + instance: JanInferenceOpenAIExtension, ) { instance.isCancelled = true; instance.controller?.abort(); @@ -130,7 +131,7 @@ export default class JanInferenceOpenAIExtension extends BaseExtension { */ private static async handleMessageRequest( data: MessageRequest, - instance: JanInferenceOpenAIExtension + instance: JanInferenceOpenAIExtension, ) { if (data.model.engine !== "openai") { return; @@ -160,7 +161,7 @@ export default class JanInferenceOpenAIExtension extends BaseExtension { ...JanInferenceOpenAIExtension._currentModel, parameters: data.model.parameters, }, - instance.controller + instance.controller, ).subscribe({ next: (content) => { const messageContent: ThreadContent = { diff --git a/extensions/inference-openai-extension/tsconfig.json b/extensions/inference-openai-extension/tsconfig.json index b48175a16..7bfdd9009 100644 --- a/extensions/inference-openai-extension/tsconfig.json +++ b/extensions/inference-openai-extension/tsconfig.json @@ -3,13 +3,12 @@ "target": "es2016", "module": "ES6", "moduleResolution": "node", - "outDir": "./dist", "esModuleInterop": true, "forceConsistentCasingInFileNames": true, "strict": false, "skipLibCheck": true, - "rootDir": "./src" + "rootDir": "./src", }, - "include": ["./src"] + "include": ["./src"], } diff --git a/extensions/inference-triton-trtllm-extension/tsconfig.json b/extensions/inference-triton-trtllm-extension/tsconfig.json index b48175a16..7bfdd9009 100644 --- a/extensions/inference-triton-trtllm-extension/tsconfig.json +++ b/extensions/inference-triton-trtllm-extension/tsconfig.json @@ -3,13 +3,12 @@ "target": "es2016", "module": "ES6", "moduleResolution": "node", - "outDir": "./dist", "esModuleInterop": true, "forceConsistentCasingInFileNames": true, "strict": false, "skipLibCheck": true, - "rootDir": "./src" + "rootDir": "./src", }, - "include": ["./src"] + "include": ["./src"], } diff --git a/web/containers/CardSidebar/index.tsx b/web/containers/CardSidebar/index.tsx index bc5047497..c0dd19ba5 100644 --- a/web/containers/CardSidebar/index.tsx +++ b/web/containers/CardSidebar/index.tsx @@ -17,6 +17,7 @@ import { activeThreadAtom } from '@/helpers/atoms/Thread.atom' interface Props { children: ReactNode + rightAction?: ReactNode title: string asChild?: boolean hideMoreVerticalAction?: boolean @@ -25,6 +26,7 @@ export default function CardSidebar({ children, title, asChild, + rightAction, hideMoreVerticalAction, }: Props) { const [show, setShow] = useState(true) @@ -53,27 +55,16 @@ export default function CardSidebar({
- {title} -
- {!asChild && ( - <> - {!hideMoreVerticalAction && ( -
setMore(!more)} - > - -
- )} - - )} +
+ {title} +
+
+ {rightAction && rightAction} + {!asChild && ( + <> + {!hideMoreVerticalAction && ( +
setMore(!more)} + > + +
+ )} + + )}
{more && ( diff --git a/web/containers/Checkbox/index.tsx b/web/containers/Checkbox/index.tsx index e8f916d98..a545771b6 100644 --- a/web/containers/Checkbox/index.tsx +++ b/web/containers/Checkbox/index.tsx @@ -9,54 +9,26 @@ import { TooltipTrigger, } from '@janhq/uikit' -import { useAtomValue, useSetAtom } from 'jotai' import { InfoIcon } from 'lucide-react' -import { useActiveModel } from '@/hooks/useActiveModel' -import useUpdateModelParameters from '@/hooks/useUpdateModelParameters' - -import { getConfigurationsData } from '@/utils/componentSettings' -import { toSettingParams } from '@/utils/modelParam' - -import { serverEnabledAtom } from '@/helpers/atoms/LocalServer.atom' -import { - engineParamsUpdateAtom, - getActiveThreadIdAtom, - getActiveThreadModelParamsAtom, -} from '@/helpers/atoms/Thread.atom' - type Props = { name: string title: string + enabled?: boolean description: string checked: boolean + onValueChanged?: (e: string | number | boolean) => void } -const Checkbox: React.FC = ({ name, title, checked, description }) => { - const { updateModelParameter } = useUpdateModelParameters() - const threadId = useAtomValue(getActiveThreadIdAtom) - - const activeModelParams = useAtomValue(getActiveThreadModelParamsAtom) - - const modelSettingParams = toSettingParams(activeModelParams) - - const engineParams = getConfigurationsData(modelSettingParams) - - const setEngineParamsUpdate = useSetAtom(engineParamsUpdateAtom) - - const serverEnabled = useAtomValue(serverEnabledAtom) - - const { stopModel } = useActiveModel() - +const Checkbox: React.FC = ({ + title, + checked, + enabled = true, + description, + onValueChanged, +}) => { const onCheckedChange = (checked: boolean) => { - if (!threadId) return - if (engineParams.some((x) => x.name.includes(name))) { - setEngineParamsUpdate(true) - stopModel() - } else { - setEngineParamsUpdate(false) - } - updateModelParameter(threadId, name, checked) + onValueChanged?.(checked) } return ( @@ -80,7 +52,7 @@ const Checkbox: React.FC = ({ name, title, checked, description }) => {
) diff --git a/web/containers/Layout/TopBar/index.tsx b/web/containers/Layout/TopBar/index.tsx index ac05e4e1a..ab67cb3b7 100644 --- a/web/containers/Layout/TopBar/index.tsx +++ b/web/containers/Layout/TopBar/index.tsx @@ -120,13 +120,13 @@ const TopBar = () => {
-
- {activeThread && ( + {activeThread && ( +
{showing && (
@@ -227,8 +227,8 @@ const TopBar = () => { />
- )} -
+
+ )} )}
diff --git a/web/containers/Loader/GenerateResponse.tsx b/web/containers/Loader/GenerateResponse.tsx
new file mode 100644
index 000000000..457c44987
--- /dev/null
+++ b/web/containers/Loader/GenerateResponse.tsx
@@ -0,0 +1,39 @@
+import React, { useEffect, useState } from 'react'
+
+export default function GenerateResponse() {
+  const [loader, setLoader] = useState(0)
+
+  // This is a fake loader; replace it once model loading reports a realtime percentage
+  useEffect(() => {
+    if (loader === 24) {
+      setTimeout(() => {
+        setLoader(loader + 1)
+      }, 250)
+    } else if (loader === 50) {
+      setTimeout(() => {
+        setLoader(loader + 1)
+      }, 250)
+    } else if (loader === 78) {
+      setTimeout(() => {
+        setLoader(loader + 1)
+      }, 250)
+    } else if (loader === 85) {
+      setLoader(85)
+    } else {
+      setLoader(loader + 1)
+    }
+    // eslint-disable-next-line react-hooks/exhaustive-deps
+  }, [loader])
+
+  return (
+
+
+
+ Generating response... +
+
+ ) +} diff --git a/web/containers/ModelConfigInput/index.tsx b/web/containers/ModelConfigInput/index.tsx index e409fd424..d573a0bf9 100644 --- a/web/containers/ModelConfigInput/index.tsx +++ b/web/containers/ModelConfigInput/index.tsx @@ -7,65 +7,26 @@ import { TooltipTrigger, } from '@janhq/uikit' -import { useAtomValue, useSetAtom } from 'jotai' - import { InfoIcon } from 'lucide-react' -import { useActiveModel } from '@/hooks/useActiveModel' -import useUpdateModelParameters from '@/hooks/useUpdateModelParameters' - -import { getConfigurationsData } from '@/utils/componentSettings' - -import { toSettingParams } from '@/utils/modelParam' - -import { serverEnabledAtom } from '@/helpers/atoms/LocalServer.atom' -import { - engineParamsUpdateAtom, - getActiveThreadIdAtom, - getActiveThreadModelParamsAtom, -} from '@/helpers/atoms/Thread.atom' - type Props = { title: string + enabled?: boolean name: string description: string placeholder: string value: string + onValueChanged?: (e: string | number | boolean) => void } const ModelConfigInput: React.FC = ({ title, - name, + enabled = true, value, description, placeholder, + onValueChanged, }) => { - const { updateModelParameter } = useUpdateModelParameters() - const threadId = useAtomValue(getActiveThreadIdAtom) - - const activeModelParams = useAtomValue(getActiveThreadModelParamsAtom) - - const modelSettingParams = toSettingParams(activeModelParams) - - const engineParams = getConfigurationsData(modelSettingParams) - - const setEngineParamsUpdate = useSetAtom(engineParamsUpdateAtom) - - const { stopModel } = useActiveModel() - - const serverEnabled = useAtomValue(serverEnabledAtom) - - const onValueChanged = (e: React.ChangeEvent) => { - if (!threadId) return - if (engineParams.some((x) => x.name.includes(name))) { - setEngineParamsUpdate(true) - stopModel() - } else { - setEngineParamsUpdate(false) - } - updateModelParameter(threadId, name, e.target.value) - } - return (
@@ -86,9 +47,9 @@ const ModelConfigInput: React.FC = ({