diff --git a/.devcontainer/devcontainer.json b/.devcontainer/devcontainer.json index f980b9df7..db1eed38d 100644 --- a/.devcontainer/devcontainer.json +++ b/.devcontainer/devcontainer.json @@ -1,4 +1,4 @@ { - "name": "jan", - "image": "node:20" -} \ No newline at end of file + "name": "jan", + "image": "node:20" +} diff --git a/.github/workflows/jan-electron-linter-and-test.yml b/.github/workflows/jan-electron-linter-and-test.yml index 6d5aaf150..40085391f 100644 --- a/.github/workflows/jan-electron-linter-and-test.yml +++ b/.github/workflows/jan-electron-linter-and-test.yml @@ -1,5 +1,6 @@ name: Jan Electron Linter & Test on: + workflow_dispatch: push: branches: - main diff --git a/.github/workflows/jan-server-build-nightly.yml b/.github/workflows/jan-server-build-nightly.yml new file mode 100644 index 000000000..0d1bc3ca8 --- /dev/null +++ b/.github/workflows/jan-server-build-nightly.yml @@ -0,0 +1,40 @@ +name: Jan Build Docker Nightly or Manual + +on: + push: + branches: + - main + - feature/helmchart-and-ci-jan-server + paths-ignore: + - 'README.md' + - 'docs/**' + schedule: + - cron: '0 20 * * 1,2,3' # At 8 PM UTC on Monday, Tuesday, and Wednesday which is 3 AM UTC+7 Tuesday, Wednesday, and Thursday + workflow_dispatch: + +jobs: + # Job create Update app version based on latest release tag with build number and save to output + get-update-version: + uses: ./.github/workflows/template-get-update-version.yml + + build-cpu: + uses: ./.github/workflows/template-build-jan-server.yml + permissions: + packages: write + secrets: inherit + needs: [get-update-version] + with: + dockerfile_path: ./Dockerfile + docker_image_tag: "ghcr.io/janhq/jan-server:dev-cpu-latest,ghcr.io/janhq/jan-server:dev-cpu-${{ needs.get-update-version.outputs.new_version }}" + + build-gpu: + uses: ./.github/workflows/template-build-jan-server.yml + permissions: + packages: write + secrets: inherit + needs: [get-update-version] + with: + dockerfile_path: ./Dockerfile.gpu + docker_image_tag: 
"ghcr.io/janhq/jan-server:dev-cuda-12.2-latest,ghcr.io/janhq/jan-server:dev-cuda-12.2-${{ needs.get-update-version.outputs.new_version }}" + + diff --git a/.github/workflows/jan-server-build.yml b/.github/workflows/jan-server-build.yml new file mode 100644 index 000000000..0665838d6 --- /dev/null +++ b/.github/workflows/jan-server-build.yml @@ -0,0 +1,30 @@ +name: Jan Build Docker + +on: + push: + tags: ["v[0-9]+.[0-9]+.[0-9]+"] + +jobs: + # Job create Update app version based on latest release tag with build number and save to output + get-update-version: + uses: ./.github/workflows/template-get-update-version.yml + + build-cpu: + permissions: + packages: write + uses: ./.github/workflows/template-build-jan-server.yml + secrets: inherit + needs: [get-update-version] + with: + dockerfile_path: ./Dockerfile + docker_image_tag: "ghcr.io/janhq/jan-server:cpu-latest,ghcr.io/janhq/jan-server:cpu-${{ needs.get-update-version.outputs.new_version }}" + + build-gpu: + permissions: + packages: write + uses: ./.github/workflows/template-build-jan-server.yml + secrets: inherit + needs: [get-update-version] + with: + dockerfile_path: ./Dockerfile.gpu + docker_image_tag: "ghcr.io/janhq/jan-server:cuda-12.2-latest,ghcr.io/janhq/jan-server:cuda-12.2-${{ needs.get-update-version.outputs.new_version }}" diff --git a/.github/workflows/template-build-jan-server.yml b/.github/workflows/template-build-jan-server.yml new file mode 100644 index 000000000..9bb772605 --- /dev/null +++ b/.github/workflows/template-build-jan-server.yml @@ -0,0 +1,39 @@ +name: build-jan-server +on: + workflow_call: + inputs: + dockerfile_path: + required: false + type: string + default: './Dockerfile' + docker_image_tag: + required: true + type: string + default: 'ghcr.io/janhq/jan-server:dev-latest' + +jobs: + build: + runs-on: ubuntu-latest + env: + REGISTRY: ghcr.io + IMAGE_NAME: janhq/jan-server + permissions: + packages: write + steps: + - name: Checkout + uses: actions/checkout@v4 + + - name: Log in to 
the Container registry + uses: docker/login-action@v3 + with: + registry: ${{ env.REGISTRY }} + username: ${{ github.actor }} + password: ${{ secrets.GITHUB_TOKEN }} + + - name: Build and push Docker image + uses: docker/build-push-action@v3 + with: + context: . + file: ${{ inputs.dockerfile_path }} + push: true + tags: ${{ inputs.docker_image_tag }} \ No newline at end of file diff --git a/.gitignore b/.gitignore index 4540e5c7a..62878011e 100644 --- a/.gitignore +++ b/.gitignore @@ -5,6 +5,7 @@ error.log node_modules *.tgz +!charts/server/charts/*.tgz yarn.lock dist build @@ -28,4 +29,5 @@ extensions/inference-nitro-extension/bin/*/*.exp extensions/inference-nitro-extension/bin/*/*.lib extensions/inference-nitro-extension/bin/saved-* extensions/inference-nitro-extension/bin/*.tar.gz - +extensions/inference-nitro-extension/bin/vulkaninfoSDK.exe +extensions/inference-nitro-extension/bin/vulkaninfo diff --git a/core/.prettierignore b/.prettierignore similarity index 100% rename from core/.prettierignore rename to .prettierignore diff --git a/core/.prettierrc b/.prettierrc similarity index 100% rename from core/.prettierrc rename to .prettierrc diff --git a/Dockerfile b/Dockerfile index 949a92673..48b2d254f 100644 --- a/Dockerfile +++ b/Dockerfile @@ -1,39 +1,61 @@ -FROM node:20-bullseye AS base +FROM node:20-bookworm AS base # 1. Install dependencies only when needed -FROM base AS deps +FROM base AS builder + +# Install g++ 11 +RUN apt update && apt install -y gcc-11 g++-11 cpp-11 jq xsel && rm -rf /var/lib/apt/lists/* + WORKDIR /app # Install dependencies based on the preferred package manager -COPY package.json yarn.lock* package-lock.json* pnpm-lock.yaml* ./ -RUN yarn install +COPY . 
./ + +RUN export NITRO_VERSION=$(cat extensions/inference-nitro-extension/bin/version.txt) && \ + jq --arg nitroVersion $NITRO_VERSION '(.scripts."downloadnitro:linux" | gsub("\\${NITRO_VERSION}"; $nitroVersion)) | gsub("\r"; "")' extensions/inference-nitro-extension/package.json > /tmp/newcommand.txt && export NEW_COMMAND=$(sed 's/^"//;s/"$//' /tmp/newcommand.txt) && jq --arg newCommand "$NEW_COMMAND" '.scripts."downloadnitro:linux" = $newCommand' extensions/inference-nitro-extension/package.json > /tmp/package.json && mv /tmp/package.json extensions/inference-nitro-extension/package.json +RUN make install-and-build # # 2. Rebuild the source code only when needed -FROM base AS builder -WORKDIR /app -COPY --from=deps /app/node_modules ./node_modules -COPY . . -# This will do the trick, use the corresponding env file for each environment. -RUN yarn workspace server install -RUN yarn server:prod - -# 3. Production image, copy all the files and run next FROM base AS runner + +# Install g++ 11 +RUN apt update && apt install -y gcc-11 g++-11 cpp-11 jq xsel && rm -rf /var/lib/apt/lists/* + WORKDIR /app -ENV NODE_ENV=production +# Copy the package.json and yarn.lock of root yarn space to leverage Docker cache +COPY --from=builder /app/package.json ./package.json +COPY --from=builder /app/node_modules ./node_modules/ +COPY --from=builder /app/yarn.lock ./yarn.lock -# RUN addgroup -g 1001 -S nodejs; -COPY --from=builder /app/server/build ./ +# Copy the package.json, yarn.lock, and build output of server yarn space to leverage Docker cache +COPY --from=builder /app/core ./core/ +COPY --from=builder /app/server ./server/ +RUN cd core && yarn install && yarn run build +RUN yarn workspace @janhq/server install && yarn workspace @janhq/server build +COPY --from=builder /app/docs/openapi ./docs/openapi/ -# Automatically leverage output traces to reduce image size -# https://nextjs.org/docs/advanced-features/output-file-tracing -COPY --from=builder /app/server/node_modules 
./node_modules -COPY --from=builder /app/server/package.json ./package.json +# Copy pre-install dependencies +COPY --from=builder /app/pre-install ./pre-install/ -EXPOSE 4000 3928 +# Copy the package.json, yarn.lock, and output of web yarn space to leverage Docker cache +COPY --from=builder /app/uikit ./uikit/ +COPY --from=builder /app/web ./web/ +COPY --from=builder /app/models ./models/ -ENV PORT 4000 -ENV APPDATA /app/data +RUN yarn workspace @janhq/uikit install && yarn workspace @janhq/uikit build +RUN yarn workspace jan-web install -CMD ["node", "main.js"] \ No newline at end of file +RUN npm install -g serve@latest + +EXPOSE 1337 3000 3928 + +ENV JAN_API_HOST 0.0.0.0 +ENV JAN_API_PORT 1337 + +ENV API_BASE_URL http://localhost:1337 + +CMD ["sh", "-c", "export NODE_ENV=production && yarn workspace jan-web build && cd web && npx serve out & cd server && node build/main.js"] + +# docker build -t jan . +# docker run -p 1337:1337 -p 3000:3000 -p 3928:3928 jan diff --git a/Dockerfile.gpu b/Dockerfile.gpu new file mode 100644 index 000000000..832e2c18c --- /dev/null +++ b/Dockerfile.gpu @@ -0,0 +1,88 @@ +# Please change the base image to the appropriate CUDA version base on NVIDIA Driver Compatibility +# Run nvidia-smi to check the CUDA version and the corresponding driver version +# Then update the base image to the appropriate CUDA version refer https://catalog.ngc.nvidia.com/orgs/nvidia/containers/cuda/tags + +FROM nvidia/cuda:12.2.0-runtime-ubuntu22.04 AS base + +# 1. 
Install dependencies only when needed +FROM base AS builder + +# Install g++ 11 +RUN apt update && apt install -y gcc-11 g++-11 cpp-11 jq xsel curl gnupg make python3-dev && curl -sL https://deb.nodesource.com/setup_20.x | bash - && apt install nodejs -y && rm -rf /var/lib/apt/lists/* + +# Update alternatives for GCC and related tools +RUN update-alternatives --install /usr/bin/gcc gcc /usr/bin/gcc-11 110 \ + --slave /usr/bin/g++ g++ /usr/bin/g++-11 \ + --slave /usr/bin/gcov gcov /usr/bin/gcov-11 \ + --slave /usr/bin/gcc-ar gcc-ar /usr/bin/gcc-ar-11 \ + --slave /usr/bin/gcc-ranlib gcc-ranlib /usr/bin/gcc-ranlib-11 && \ + update-alternatives --install /usr/bin/cpp cpp /usr/bin/cpp-11 110 + +RUN npm install -g yarn + +WORKDIR /app + +# Install dependencies based on the preferred package manager +COPY . ./ + +RUN export NITRO_VERSION=$(cat extensions/inference-nitro-extension/bin/version.txt) && \ + jq --arg nitroVersion $NITRO_VERSION '(.scripts."downloadnitro:linux" | gsub("\\${NITRO_VERSION}"; $nitroVersion)) | gsub("\r"; "")' extensions/inference-nitro-extension/package.json > /tmp/newcommand.txt && export NEW_COMMAND=$(sed 's/^"//;s/"$//' /tmp/newcommand.txt) && jq --arg newCommand "$NEW_COMMAND" '.scripts."downloadnitro:linux" = $newCommand' extensions/inference-nitro-extension/package.json > /tmp/package.json && mv /tmp/package.json extensions/inference-nitro-extension/package.json +RUN make install-and-build + +# # 2. 
Rebuild the source code only when needed +FROM base AS runner + +# Install g++ 11 +RUN apt update && apt install -y gcc-11 g++-11 cpp-11 jq xsel curl gnupg make python3-dev && curl -sL https://deb.nodesource.com/setup_20.x | bash - && apt-get install nodejs -y && rm -rf /var/lib/apt/lists/* + +# Update alternatives for GCC and related tools +RUN update-alternatives --install /usr/bin/gcc gcc /usr/bin/gcc-11 110 \ + --slave /usr/bin/g++ g++ /usr/bin/g++-11 \ + --slave /usr/bin/gcov gcov /usr/bin/gcov-11 \ + --slave /usr/bin/gcc-ar gcc-ar /usr/bin/gcc-ar-11 \ + --slave /usr/bin/gcc-ranlib gcc-ranlib /usr/bin/gcc-ranlib-11 && \ + update-alternatives --install /usr/bin/cpp cpp /usr/bin/cpp-11 110 + +RUN npm install -g yarn + +WORKDIR /app + +# Copy the package.json and yarn.lock of root yarn space to leverage Docker cache +COPY --from=builder /app/package.json ./package.json +COPY --from=builder /app/node_modules ./node_modules/ +COPY --from=builder /app/yarn.lock ./yarn.lock + +# Copy the package.json, yarn.lock, and build output of server yarn space to leverage Docker cache +COPY --from=builder /app/core ./core/ +COPY --from=builder /app/server ./server/ +RUN cd core && yarn install && yarn run build +RUN yarn workspace @janhq/server install && yarn workspace @janhq/server build +COPY --from=builder /app/docs/openapi ./docs/openapi/ + +# Copy pre-install dependencies +COPY --from=builder /app/pre-install ./pre-install/ + +# Copy the package.json, yarn.lock, and output of web yarn space to leverage Docker cache +COPY --from=builder /app/uikit ./uikit/ +COPY --from=builder /app/web ./web/ +COPY --from=builder /app/models ./models/ + +RUN yarn workspace @janhq/uikit install && yarn workspace @janhq/uikit build +RUN yarn workspace jan-web install + +RUN npm install -g serve@latest + +EXPOSE 1337 3000 3928 + +ENV LD_LIBRARY_PATH=/usr/local/cuda/targets/x86_64-linux/lib:/usr/local/cuda-12.0/compat${LD_LIBRARY_PATH:+:${LD_LIBRARY_PATH}} + +ENV JAN_API_HOST 0.0.0.0 +ENV 
JAN_API_PORT 1337 + +ENV API_BASE_URL http://localhost:1337 + +CMD ["sh", "-c", "export NODE_ENV=production && yarn workspace jan-web build && cd web && npx serve out & cd server && node build/main.js"] + +# pre-requisites: nvidia-docker +# docker build -t jan-gpu . -f Dockerfile.gpu +# docker run -p 1337:1337 -p 3000:3000 -p 3928:3928 --gpus all jan-gpu diff --git a/Makefile b/Makefile index 905a68321..a45477b29 100644 --- a/Makefile +++ b/Makefile @@ -24,9 +24,9 @@ endif check-file-counts: install-and-build ifeq ($(OS),Windows_NT) - powershell -Command "if ((Get-ChildItem -Path electron/pre-install -Filter *.tgz | Measure-Object | Select-Object -ExpandProperty Count) -ne (Get-ChildItem -Path extensions -Directory | Measure-Object | Select-Object -ExpandProperty Count)) { Write-Host 'Number of .tgz files in electron/pre-install does not match the number of subdirectories in extension'; exit 1 } else { Write-Host 'Extension build successful' }" + powershell -Command "if ((Get-ChildItem -Path pre-install -Filter *.tgz | Measure-Object | Select-Object -ExpandProperty Count) -ne (Get-ChildItem -Path extensions -Directory | Measure-Object | Select-Object -ExpandProperty Count)) { Write-Host 'Number of .tgz files in pre-install does not match the number of subdirectories in extension'; exit 1 } else { Write-Host 'Extension build successful' }" else - @tgz_count=$$(find electron/pre-install -type f -name "*.tgz" | wc -l); dir_count=$$(find extensions -mindepth 1 -maxdepth 1 -type d | wc -l); if [ $$tgz_count -ne $$dir_count ]; then echo "Number of .tgz files in electron/pre-install ($$tgz_count) does not match the number of subdirectories in extension ($$dir_count)"; exit 1; else echo "Extension build successful"; fi + @tgz_count=$$(find pre-install -type f -name "*.tgz" | wc -l); dir_count=$$(find extensions -mindepth 1 -maxdepth 1 -type d | wc -l); if [ $$tgz_count -ne $$dir_count ]; then echo "Number of .tgz files in pre-install ($$tgz_count) does not match the number 
of subdirectories in extension ($$dir_count)"; exit 1; else echo "Extension build successful"; fi endif dev: check-file-counts @@ -52,18 +52,28 @@ build: check-file-counts clean: ifeq ($(OS),Windows_NT) - powershell -Command "Get-ChildItem -Path . -Include node_modules, .next, dist -Recurse -Directory | Remove-Item -Recurse -Force" + powershell -Command "Get-ChildItem -Path . -Include node_modules, .next, dist, build, out -Recurse -Directory | Remove-Item -Recurse -Force" + powershell -Command "Remove-Item -Recurse -Force ./pre-install/*.tgz" + powershell -Command "Remove-Item -Recurse -Force ./electron/pre-install/*.tgz" rmdir /s /q "%USERPROFILE%\jan\extensions" else ifeq ($(shell uname -s),Linux) find . -name "node_modules" -type d -prune -exec rm -rf '{}' + find . -name ".next" -type d -exec rm -rf '{}' + find . -name "dist" -type d -exec rm -rf '{}' + + find . -name "build" -type d -exec rm -rf '{}' + + find . -name "out" -type d -exec rm -rf '{}' + + rm -rf ./pre-install/*.tgz + rm -rf ./electron/pre-install/*.tgz rm -rf "~/jan/extensions" rm -rf "~/.cache/jan*" else find . -name "node_modules" -type d -prune -exec rm -rf '{}' + find . -name ".next" -type d -exec rm -rf '{}' + find . -name "dist" -type d -exec rm -rf '{}' + + find . -name "build" -type d -exec rm -rf '{}' + + find . 
-name "out" -type d -exec rm -rf '{}' + + rm -rf ./pre-install/*.tgz + rm -rf ./electron/pre-install/*.tgz rm -rf ~/jan/extensions rm -rf ~/Library/Caches/jan* endif diff --git a/README.md b/README.md index e1f74ef23..425ea69be 100644 --- a/README.md +++ b/README.md @@ -76,31 +76,31 @@ Jan is an open-source ChatGPT alternative that runs 100% offline on your compute Experimental (Nightly Build) - + jan.exe - + Intel - + M1/M2 - + jan.deb - + jan.AppImage @@ -167,6 +167,7 @@ To reset your installation: - Clear Application cache in `~/Library/Caches/jan` ## Requirements for running Jan + - MacOS: 13 or higher - Windows: - Windows 10 or higher @@ -194,17 +195,17 @@ Contributions are welcome! Please read the [CONTRIBUTING.md](CONTRIBUTING.md) fi 1. **Clone the repository and prepare:** - ```bash - git clone https://github.com/janhq/jan - cd jan - git checkout -b DESIRED_BRANCH - ``` + ```bash + git clone https://github.com/janhq/jan + cd jan + git checkout -b DESIRED_BRANCH + ``` 2. **Run development and use Jan Desktop** - ```bash - make dev - ``` + ```bash + make dev + ``` This will start the development server and open the desktop app. @@ -218,6 +219,101 @@ make build This will build the app MacOS m1/m2 for production (with code signing already done) and put the result in `dist` folder. +### Docker mode + +- Supported OS: Linux, WSL2 Docker +- Pre-requisites: + + - Docker Engine and Docker Compose are required to run Jan in Docker mode. Follow the [instructions](https://docs.docker.com/engine/install/ubuntu/) below to get started with Docker Engine on Ubuntu. + + ```bash + curl -fsSL https://get.docker.com -o get-docker.sh + sudo sh ./get-docker.sh --dry-run + ``` + + - If you intend to run Jan in GPU mode, you need to install `nvidia-driver` and `nvidia-docker2`. Follow the instruction [here](https://docs.nvidia.com/datacenter/cloud-native/container-toolkit/latest/install-guide.html) for installation. 
+ +- Run Jan in Docker mode + +| Docker compose Profile | Description | +| ---------------------- | -------------------------------------------- | +| `cpu-fs` | Run Jan in CPU mode with default file system | +| `cpu-s3fs` | Run Jan in CPU mode with S3 file system | +| `gpu-fs` | Run Jan in GPU mode with default file system | +| `gpu-s3fs` | Run Jan in GPU mode with S3 file system | + +| Environment Variable | Description | +| ----------------------- | ------------------------------------------------------------------------------------------------------- | +| `S3_BUCKET_NAME` | S3 bucket name - leave blank for default file system | +| `AWS_ACCESS_KEY_ID` | AWS access key ID - leave blank for default file system | +| `AWS_SECRET_ACCESS_KEY` | AWS secret access key - leave blank for default file system | +| `AWS_ENDPOINT` | AWS endpoint URL - leave blank for default file system | +| `AWS_REGION` | AWS region - leave blank for default file system | +| `API_BASE_URL` | Jan Server URL, please modify it as your public ip address or domain name default http://localhost:1337 | + +- **Option 1**: Run Jan in CPU mode + + ```bash + # cpu mode with default file system + docker compose --profile cpu-fs up -d + + # cpu mode with S3 file system + docker compose --profile cpu-s3fs up -d + ``` + +- **Option 2**: Run Jan in GPU mode + + - **Step 1**: Check CUDA compatibility with your NVIDIA driver by running `nvidia-smi` and check the CUDA version in the output + + ```bash + nvidia-smi + + # Output + +---------------------------------------------------------------------------------------+ + | NVIDIA-SMI 531.18 Driver Version: 531.18 CUDA Version: 12.1 | + |-----------------------------------------+----------------------+----------------------+ + | GPU Name TCC/WDDM | Bus-Id Disp.A | Volatile Uncorr. ECC | + | Fan Temp Perf Pwr:Usage/Cap| Memory-Usage | GPU-Util Compute M. | + | | | MIG M. 
| + |=========================================+======================+======================| + | 0 NVIDIA GeForce RTX 4070 Ti WDDM | 00000000:01:00.0 On | N/A | + | 0% 44C P8 16W / 285W| 1481MiB / 12282MiB | 2% Default | + | | | N/A | + +-----------------------------------------+----------------------+----------------------+ + | 1 NVIDIA GeForce GTX 1660 Ti WDDM | 00000000:02:00.0 Off | N/A | + | 0% 49C P8 14W / 120W| 0MiB / 6144MiB | 0% Default | + | | | N/A | + +-----------------------------------------+----------------------+----------------------+ + | 2 NVIDIA GeForce GTX 1660 Ti WDDM | 00000000:05:00.0 Off | N/A | + | 29% 38C P8 11W / 120W| 0MiB / 6144MiB | 0% Default | + | | | N/A | + +-----------------------------------------+----------------------+----------------------+ + + +---------------------------------------------------------------------------------------+ + | Processes: | + | GPU GI CI PID Type Process name GPU Memory | + | ID ID Usage | + |=======================================================================================| + ``` + + - **Step 2**: Visit [NVIDIA NGC Catalog ](https://catalog.ngc.nvidia.com/orgs/nvidia/containers/cuda/tags) and find the smallest minor version of image tag that matches your CUDA version (e.g., 12.1 -> 12.1.0) + + - **Step 3**: Update the `Dockerfile.gpu` line number 5 with the latest minor version of the image tag from step 2 (e.g. change `FROM nvidia/cuda:12.2.0-runtime-ubuntu22.04 AS base` to `FROM nvidia/cuda:12.1.0-runtime-ubuntu22.04 AS base`) + + - **Step 4**: Run command to start Jan in GPU mode + + ```bash + # GPU mode with default file system + docker compose --profile gpu up -d + + # GPU mode with S3 file system + docker compose --profile gpu-s3fs up -d + ``` + +This will start the web server and you can access Jan at `http://localhost:3000`. + +> Note: RAG feature is not supported in Docker mode with s3fs yet. 
+ ## Acknowledgements Jan builds on top of other open-source projects: diff --git a/charts/server/Chart.lock b/charts/server/Chart.lock new file mode 100644 index 000000000..915788d61 --- /dev/null +++ b/charts/server/Chart.lock @@ -0,0 +1,6 @@ +dependencies: +- name: common + repository: oci://ghcr.io/janhq/charts + version: 0.1.2 +digest: sha256:35e98bde174130787755b0f8ea2359b7b6790d965a7157c2f7cabf1bc8c04471 +generated: "2024-02-20T16:20:37.6530108+07:00" diff --git a/charts/server/Chart.yaml b/charts/server/Chart.yaml new file mode 100644 index 000000000..fb2e1c91b --- /dev/null +++ b/charts/server/Chart.yaml @@ -0,0 +1,10 @@ +apiVersion: v2 +name: jan-server +description: A Helm chart for Kubernetes +type: application +version: 0.1.0 +appVersion: '1.0.0' +dependencies: + - name: common + version: 0.1.2 # common-chart-version + repository: oci://ghcr.io/janhq/charts diff --git a/charts/server/charts/common-0.1.2.tgz b/charts/server/charts/common-0.1.2.tgz new file mode 100644 index 000000000..946617eab Binary files /dev/null and b/charts/server/charts/common-0.1.2.tgz differ diff --git a/charts/server/config.json b/charts/server/config.json new file mode 100644 index 000000000..62e9682fa --- /dev/null +++ b/charts/server/config.json @@ -0,0 +1,4 @@ +{ + "image-list": "server=ghcr.io/janhq/jan-server", + "platforms": "linux/amd64" +} \ No newline at end of file diff --git a/charts/server/values.yaml b/charts/server/values.yaml new file mode 100644 index 000000000..70f463174 --- /dev/null +++ b/charts/server/values.yaml @@ -0,0 +1,256 @@ +common: + imageTag: v0.4.6-cpu + # DO NOT CHANGE THE LINE ABOVE. 
MAKE ALL CHANGES BELOW + + # Global pvc for all workload + pvc: + enabled: false + name: 'janroot' + accessModes: 'ReadWriteOnce' + storageClassName: '' + capacity: '50Gi' + + # Global image pull secret + imagePullSecrets: [] + + externalSecret: + create: false + name: '' + annotations: {} + + nameOverride: 'jan-server' + fullnameOverride: 'jan-server' + + serviceAccount: + create: true + annotations: {} + name: 'jan-server-service-account' + + podDisruptionBudget: + create: false + minAvailable: 1 + + workloads: + - name: server + image: + repository: ghcr.io/janhq/jan-server + pullPolicy: Always + + command: ['/bin/sh', '-c'] + args: ['cd server && node build/main.js'] + + replicaCount: 1 + ports: + containerPort: 1337 + + strategy: + canary: + steps: + - setWeight: 50 + - pause: { duration: 1m } + + ingress: + enabled: true + className: 'nginx' + annotations: + nginx.ingress.kubernetes.io/proxy-body-size: '100m' + nginx.ingress.kubernetes.io/proxy-read-timeout: '1800' + nginx.ingress.kubernetes.io/proxy-send-timeout: '1800' + # cert-manager.io/cluster-issuer: 'jan-ai-dns01-cluster-issuer' + # nginx.ingress.kubernetes.io/force-ssl-redirect: 'true' + nginx.ingress.kubernetes.io/backend-protocol: HTTP + hosts: + - host: server.local + paths: + - path: / + pathType: Prefix + tls: + [] + # - hosts: + # - server-dev.jan.ai + # secretName: jan-server-prod-tls-v2 + + instrumentation: + enabled: false + podAnnotations: {} + + podSecurityContext: {} + + securityContext: {} + + service: + extenalLabel: {} + type: ClusterIP + port: 1337 + targetPort: 1337 + + # If you want to use GPU, please uncomment the following lines and change imageTag to the one with GPU support + resources: + # limits: + # nvidia.com/gpu: 1 + requests: + cpu: 2000m + memory: 8192M + + # If you want to use pv, please uncomment the following lines and enable pvc.enabled + volumes: + [] + # - name: janroot + # persistentVolumeClaim: + # claimName: janroot + + volumeMounts: + [] + # - name: janroot + # 
mountPath: /app/server/build/jan + + # AWS_ACCESS_KEY_ID, AWS_SECRET_ACCESS_KEY, S3_BUCKET_NAME, AWS_ENDPOINT, AWS_REGION should mount as a secret env instead of plain text here + # Change API_BASE_URL to your server's public domain + env: + - name: API_BASE_URL + value: 'http://server.local' + + lifecycle: {} + autoscaling: + enabled: false + minReplicas: 2 + maxReplicas: 3 + targetCPUUtilizationPercentage: 95 + targetMemoryUtilizationPercentage: 95 + + kedaScaling: + enabled: false # ignore if autoscaling.enable = true + cooldownPeriod: 30 + pollingInterval: 2 + minReplicas: 1 + maxReplicas: 5 + metricName: celery_queue_length + query: celery_queue_length{queue_name="myqueue"} # change queue_name here + serverAddress: http://prometheus-prod-kube-prome-prometheus.monitoring.svc:9090 + threshold: '3' + + nodeSelector: {} + + tolerations: [] + + podSecurityGroup: + enabled: false + securitygroupid: [] + + # Reloader Option + reloader: 'false' + vpa: + enabled: false + + - name: web + image: + repository: ghcr.io/janhq/jan-server + pullPolicy: Always + + command: ['/bin/sh', '-c'] + args: + [ + 'export NODE_ENV=production && yarn workspace jan-web build && cd web && npx serve out', + ] + + replicaCount: 1 + ports: + containerPort: 3000 + + strategy: + canary: + steps: + - setWeight: 50 + - pause: { duration: 1m } + + ingress: + enabled: true + className: 'nginx' + annotations: + nginx.ingress.kubernetes.io/proxy-body-size: '100m' + nginx.ingress.kubernetes.io/proxy-read-timeout: '1800' + nginx.ingress.kubernetes.io/proxy-send-timeout: '1800' + # cert-manager.io/cluster-issuer: 'jan-ai-dns01-cluster-issuer' + # nginx.ingress.kubernetes.io/force-ssl-redirect: 'true' + nginx.ingress.kubernetes.io/backend-protocol: HTTP + hosts: + - host: web.local + paths: + - path: / + pathType: Prefix + tls: + [] + # - hosts: + # - server-dev.jan.ai + # secretName: jan-server-prod-tls-v2 + + instrumentation: + enabled: false + podAnnotations: {} + + podSecurityContext: {} + + 
securityContext: {} + + service: + extenalLabel: {} + type: ClusterIP + port: 3000 + targetPort: 3000 + + resources: + limits: + cpu: 1000m + memory: 2048M + requests: + cpu: 50m + memory: 500M + + volumes: + [] + # - name: janroot + # persistentVolumeClaim: + # claimName: janroot + + volumeMounts: + [] + # - name: janroot + # mountPath: /app/server/build/jan + + # AWS_ACCESS_KEY_ID, AWS_SECRET_ACCESS_KEY, S3_BUCKET_NAME, AWS_ENDPOINT, AWS_REGION should mount as a secret env instead of plain text here + # Change API_BASE_URL to your server's public domain + env: + - name: API_BASE_URL + value: 'http://server.local' + + lifecycle: {} + autoscaling: + enabled: true + minReplicas: 1 + maxReplicas: 3 + targetCPUUtilizationPercentage: 95 + targetMemoryUtilizationPercentage: 95 + + kedaScaling: + enabled: false # ignore if autoscaling.enable = true + cooldownPeriod: 30 + pollingInterval: 2 + minReplicas: 1 + maxReplicas: 5 + metricName: celery_queue_length + query: celery_queue_length{queue_name="myqueue"} # change queue_name here + serverAddress: http://prometheus-prod-kube-prome-prometheus.monitoring.svc:9090 + threshold: '3' + + nodeSelector: {} + + tolerations: [] + + podSecurityGroup: + enabled: false + securitygroupid: [] + + # Reloader Option + reloader: 'false' + vpa: + enabled: false diff --git a/core/jest.config.js b/core/jest.config.js index fb03768fe..c18f55091 100644 --- a/core/jest.config.js +++ b/core/jest.config.js @@ -4,4 +4,4 @@ module.exports = { moduleNameMapper: { '@/(.*)': '/src/$1', }, -} \ No newline at end of file +} diff --git a/core/package.json b/core/package.json index 437e6d0a6..c3abe2d56 100644 --- a/core/package.json +++ b/core/package.json @@ -57,6 +57,7 @@ "rollup-plugin-typescript2": "^0.36.0", "ts-jest": "^26.1.1", "tslib": "^2.6.2", - "typescript": "^5.2.2" + "typescript": "^5.2.2", + "rimraf": "^3.0.2" } } diff --git a/core/rollup.config.ts b/core/rollup.config.ts index d78130a4d..ebea8e237 100644 --- a/core/rollup.config.ts +++ 
b/core/rollup.config.ts @@ -54,7 +54,8 @@ export default [ 'url', 'http', 'os', - 'util' + 'util', + 'child_process', ], watch: { include: 'src/node/**', diff --git a/core/src/api/index.ts b/core/src/api/index.ts index 0d7cc51f7..676020758 100644 --- a/core/src/api/index.ts +++ b/core/src/api/index.ts @@ -1,15 +1,22 @@ +/** + * Native Route APIs + * @description Enum of all the routes exposed by the app + */ +export enum NativeRoute { + openExternalUrl = 'openExternalUrl', + openAppDirectory = 'openAppDirectory', + openFileExplore = 'openFileExplorer', + selectDirectory = 'selectDirectory', + relaunch = 'relaunch', +} + /** * App Route APIs * @description Enum of all the routes exposed by the app */ export enum AppRoute { - openExternalUrl = 'openExternalUrl', - openAppDirectory = 'openAppDirectory', - openFileExplore = 'openFileExplorer', - selectDirectory = 'selectDirectory', getAppConfigurations = 'getAppConfigurations', updateAppConfiguration = 'updateAppConfiguration', - relaunch = 'relaunch', joinPath = 'joinPath', isSubdirectory = 'isSubdirectory', baseName = 'baseName', @@ -30,6 +37,7 @@ export enum DownloadRoute { downloadFile = 'downloadFile', pauseDownload = 'pauseDownload', resumeDownload = 'resumeDownload', + getDownloadProgress = 'getDownloadProgress', } export enum DownloadEvent { @@ -68,6 +76,10 @@ export enum FileManagerRoute { export type ApiFunction = (...args: any[]) => any +export type NativeRouteFunctions = { + [K in NativeRoute]: ApiFunction +} + export type AppRouteFunctions = { [K in AppRoute]: ApiFunction } @@ -96,7 +108,8 @@ export type FileManagerRouteFunctions = { [K in FileManagerRoute]: ApiFunction } -export type APIFunctions = AppRouteFunctions & +export type APIFunctions = NativeRouteFunctions & + AppRouteFunctions & AppEventFunctions & DownloadRouteFunctions & DownloadEventFunctions & @@ -104,11 +117,13 @@ export type APIFunctions = AppRouteFunctions & FileSystemRouteFunctions & FileManagerRoute -export const APIRoutes = [ +export 
const CoreRoutes = [ ...Object.values(AppRoute), ...Object.values(DownloadRoute), ...Object.values(ExtensionRoute), ...Object.values(FileSystemRoute), ...Object.values(FileManagerRoute), ] + +export const APIRoutes = [...CoreRoutes, ...Object.values(NativeRoute)] export const APIEvents = [...Object.values(AppEvent), ...Object.values(DownloadEvent)] diff --git a/core/src/extension.ts b/core/src/extension.ts index 0b7f9b7fc..3528f581c 100644 --- a/core/src/extension.ts +++ b/core/src/extension.ts @@ -1,13 +1,13 @@ export enum ExtensionTypeEnum { - Assistant = "assistant", - Conversational = "conversational", - Inference = "inference", - Model = "model", - SystemMonitoring = "systemMonitoring", + Assistant = 'assistant', + Conversational = 'conversational', + Inference = 'inference', + Model = 'model', + SystemMonitoring = 'systemMonitoring', } export interface ExtensionType { - type(): ExtensionTypeEnum | undefined; + type(): ExtensionTypeEnum | undefined } /** * Represents a base extension. @@ -20,16 +20,16 @@ export abstract class BaseExtension implements ExtensionType { * Undefined means its not extending any known extension by the application. */ type(): ExtensionTypeEnum | undefined { - return undefined; + return undefined } /** * Called when the extension is loaded. * Any initialization logic for the extension should be put here. */ - abstract onLoad(): void; + abstract onLoad(): void /** * Called when the extension is unloaded. * Any cleanup logic for the extension should be put here. 
*/ - abstract onUnload(): void; + abstract onUnload(): void } diff --git a/core/src/extensions/assistant.ts b/core/src/extensions/assistant.ts index ba345711a..5c3114f41 100644 --- a/core/src/extensions/assistant.ts +++ b/core/src/extensions/assistant.ts @@ -1,5 +1,5 @@ -import { Assistant, AssistantInterface } from "../index"; -import { BaseExtension, ExtensionTypeEnum } from "../extension"; +import { Assistant, AssistantInterface } from '../index' +import { BaseExtension, ExtensionTypeEnum } from '../extension' /** * Assistant extension for managing assistants. @@ -10,10 +10,10 @@ export abstract class AssistantExtension extends BaseExtension implements Assist * Assistant extension type. */ type(): ExtensionTypeEnum | undefined { - return ExtensionTypeEnum.Assistant; + return ExtensionTypeEnum.Assistant } - abstract createAssistant(assistant: Assistant): Promise; - abstract deleteAssistant(assistant: Assistant): Promise; - abstract getAssistants(): Promise; + abstract createAssistant(assistant: Assistant): Promise + abstract deleteAssistant(assistant: Assistant): Promise + abstract getAssistants(): Promise } diff --git a/core/src/extensions/conversational.ts b/core/src/extensions/conversational.ts index 4319784c3..a49a4e689 100644 --- a/core/src/extensions/conversational.ts +++ b/core/src/extensions/conversational.ts @@ -14,7 +14,7 @@ export abstract class ConversationalExtension * Conversation extension type. */ type(): ExtensionTypeEnum | undefined { - return ExtensionTypeEnum.Conversational; + return ExtensionTypeEnum.Conversational } abstract getThreads(): Promise diff --git a/core/src/extensions/index.ts b/core/src/extensions/index.ts index 1796c1618..522334548 100644 --- a/core/src/extensions/index.ts +++ b/core/src/extensions/index.ts @@ -2,24 +2,24 @@ * Conversational extension. Persists and retrieves conversations. 
* @module */ -export { ConversationalExtension } from "./conversational"; +export { ConversationalExtension } from './conversational' /** * Inference extension. Start, stop and inference models. */ -export { InferenceExtension } from "./inference"; +export { InferenceExtension } from './inference' /** * Monitoring extension for system monitoring. */ -export { MonitoringExtension } from "./monitoring"; +export { MonitoringExtension } from './monitoring' /** * Assistant extension for managing assistants. */ -export { AssistantExtension } from "./assistant"; +export { AssistantExtension } from './assistant' /** * Model extension for managing models. */ -export { ModelExtension } from "./model"; +export { ModelExtension } from './model' diff --git a/core/src/extensions/inference.ts b/core/src/extensions/inference.ts index c551d108f..e8e51f9eb 100644 --- a/core/src/extensions/inference.ts +++ b/core/src/extensions/inference.ts @@ -1,5 +1,5 @@ -import { InferenceInterface, MessageRequest, ThreadMessage } from "../index"; -import { BaseExtension, ExtensionTypeEnum } from "../extension"; +import { InferenceInterface, MessageRequest, ThreadMessage } from '../index' +import { BaseExtension, ExtensionTypeEnum } from '../extension' /** * Inference extension. Start, stop and inference models. @@ -9,8 +9,8 @@ export abstract class InferenceExtension extends BaseExtension implements Infere * Inference extension type. 
*/ type(): ExtensionTypeEnum | undefined { - return ExtensionTypeEnum.Inference; + return ExtensionTypeEnum.Inference } - abstract inference(data: MessageRequest): Promise; + abstract inference(data: MessageRequest): Promise } diff --git a/core/src/extensions/model.ts b/core/src/extensions/model.ts index 30aa5b6ba..df7d14f42 100644 --- a/core/src/extensions/model.ts +++ b/core/src/extensions/model.ts @@ -1,5 +1,5 @@ -import { BaseExtension, ExtensionTypeEnum } from "../extension"; -import { Model, ModelInterface } from "../index"; +import { BaseExtension, ExtensionTypeEnum } from '../extension' +import { Model, ModelInterface } from '../index' /** * Model extension for managing models. @@ -9,16 +9,16 @@ export abstract class ModelExtension extends BaseExtension implements ModelInter * Model extension type. */ type(): ExtensionTypeEnum | undefined { - return ExtensionTypeEnum.Model; + return ExtensionTypeEnum.Model } abstract downloadModel( model: Model, - network?: { proxy: string; ignoreSSL?: boolean }, - ): Promise; - abstract cancelModelDownload(modelId: string): Promise; - abstract deleteModel(modelId: string): Promise; - abstract saveModel(model: Model): Promise; - abstract getDownloadedModels(): Promise; - abstract getConfiguredModels(): Promise; + network?: { proxy: string; ignoreSSL?: boolean } + ): Promise + abstract cancelModelDownload(modelId: string): Promise + abstract deleteModel(modelId: string): Promise + abstract saveModel(model: Model): Promise + abstract getDownloadedModels(): Promise + abstract getConfiguredModels(): Promise } diff --git a/core/src/extensions/monitoring.ts b/core/src/extensions/monitoring.ts index 2de9b9ae5..ba193f0f4 100644 --- a/core/src/extensions/monitoring.ts +++ b/core/src/extensions/monitoring.ts @@ -1,5 +1,5 @@ -import { BaseExtension, ExtensionTypeEnum } from "../extension"; -import { MonitoringInterface } from "../index"; +import { BaseExtension, ExtensionTypeEnum } from '../extension' +import { MonitoringInterface } 
from '../index' /** * Monitoring extension for system monitoring. @@ -10,9 +10,9 @@ export abstract class MonitoringExtension extends BaseExtension implements Monit * Monitoring extension type. */ type(): ExtensionTypeEnum | undefined { - return ExtensionTypeEnum.SystemMonitoring; + return ExtensionTypeEnum.SystemMonitoring } - abstract getResourcesInfo(): Promise; - abstract getCurrentLoad(): Promise; + abstract getResourcesInfo(): Promise + abstract getCurrentLoad(): Promise } diff --git a/core/src/index.ts b/core/src/index.ts index a56b6f0e1..3505797b1 100644 --- a/core/src/index.ts +++ b/core/src/index.ts @@ -38,3 +38,10 @@ export * from './extension' * @module */ export * from './extensions/index' + +/** + * Declare global object + */ +declare global { + var core: any | undefined +} diff --git a/core/src/node/api/common/adapter.ts b/core/src/node/api/common/adapter.ts new file mode 100644 index 000000000..56f4cedb3 --- /dev/null +++ b/core/src/node/api/common/adapter.ts @@ -0,0 +1,43 @@ +import { + AppRoute, + DownloadRoute, + ExtensionRoute, + FileManagerRoute, + FileSystemRoute, +} from '../../../api' +import { Downloader } from '../processors/download' +import { FileSystem } from '../processors/fs' +import { Extension } from '../processors/extension' +import { FSExt } from '../processors/fsExt' +import { App } from '../processors/app' + +export class RequestAdapter { + downloader: Downloader + fileSystem: FileSystem + extension: Extension + fsExt: FSExt + app: App + + constructor(observer?: Function) { + this.downloader = new Downloader(observer) + this.fileSystem = new FileSystem() + this.extension = new Extension() + this.fsExt = new FSExt() + this.app = new App() + } + + // TODO: Clearer Factory pattern here + process(route: string, ...args: any) { + if (route in DownloadRoute) { + return this.downloader.process(route, ...args) + } else if (route in FileSystemRoute) { + return this.fileSystem.process(route, ...args) + } else if (route in ExtensionRoute) 
{ + return this.extension.process(route, ...args) + } else if (route in FileManagerRoute) { + return this.fsExt.process(route, ...args) + } else if (route in AppRoute) { + return this.app.process(route, ...args) + } + } +} diff --git a/core/src/node/api/common/handler.ts b/core/src/node/api/common/handler.ts new file mode 100644 index 000000000..4a39ae52a --- /dev/null +++ b/core/src/node/api/common/handler.ts @@ -0,0 +1,23 @@ +import { CoreRoutes } from '../../../api' +import { RequestAdapter } from './adapter' + +export type Handler = (route: string, args: any) => any + +export class RequestHandler { + handler: Handler + adataper: RequestAdapter + + constructor(handler: Handler, observer?: Function) { + this.handler = handler + this.adataper = new RequestAdapter(observer) + } + + handle() { + CoreRoutes.map((route) => { + this.handler(route, async (...args: any[]) => { + const values = await this.adataper.process(route, ...args) + return values + }) + }) + } +} diff --git a/core/src/node/api/index.ts b/core/src/node/api/index.ts index 4c3041ba3..ab0c51656 100644 --- a/core/src/node/api/index.ts +++ b/core/src/node/api/index.ts @@ -1,2 +1,3 @@ export * from './HttpServer' -export * from './routes' +export * from './restful/v1' +export * from './common/handler' diff --git a/core/src/node/api/processors/Processor.ts b/core/src/node/api/processors/Processor.ts new file mode 100644 index 000000000..8ef0c6e19 --- /dev/null +++ b/core/src/node/api/processors/Processor.ts @@ -0,0 +1,3 @@ +export abstract class Processor { + abstract process(key: string, ...args: any[]): any +} diff --git a/core/src/node/api/processors/app.ts b/core/src/node/api/processors/app.ts new file mode 100644 index 000000000..c62b5011d --- /dev/null +++ b/core/src/node/api/processors/app.ts @@ -0,0 +1,96 @@ +import { basename, isAbsolute, join, relative } from 'path' + +import { Processor } from './Processor' +import { getAppConfigurations as appConfiguration, updateAppConfiguration } from 
'../../helper' +import { log as writeLog, logServer as writeServerLog } from '../../helper/log' +import { appResourcePath } from '../../helper/path' + +export class App implements Processor { + observer?: Function + + constructor(observer?: Function) { + this.observer = observer + } + + process(key: string, ...args: any[]): any { + const instance = this as any + const func = instance[key] + return func(...args) + } + + /** + * Joins multiple paths together, respect to the current OS. + */ + joinPath(args: any[]) { + return join(...args) + } + + /** + * Checks if the given path is a subdirectory of the given directory. + * + * @param _event - The IPC event object. + * @param from - The path to check. + * @param to - The directory to check against. + * + * @returns {Promise} - A promise that resolves with the result. + */ + isSubdirectory(from: any, to: any) { + const rel = relative(from, to) + const isSubdir = rel && !rel.startsWith('..') && !isAbsolute(rel) + + if (isSubdir === '') return false + else return isSubdir + } + + /** + * Retrieve basename from given path, respect to the current OS. + */ + baseName(args: any) { + return basename(args) + } + + /** + * Log message to log file. + */ + log(args: any) { + writeLog(args) + } + + /** + * Log message to log file. + */ + logServer(args: any) { + writeServerLog(args) + } + + getAppConfigurations() { + return appConfiguration() + } + + async updateAppConfiguration(args: any) { + await updateAppConfiguration(args) + } + + /** + * Start Jan API Server. + */ + async startServer(args?: any) { + const { startServer } = require('@janhq/server') + return startServer({ + host: args?.host, + port: args?.port, + isCorsEnabled: args?.isCorsEnabled, + isVerboseEnabled: args?.isVerboseEnabled, + schemaPath: join(await appResourcePath(), 'docs', 'openapi', 'jan.yaml'), + baseDir: join(await appResourcePath(), 'docs', 'openapi'), + }) + } + + /** + * Stop Jan API Server. 
+ */ + stopServer() { + const { stopServer } = require('@janhq/server') + return stopServer() + } +} diff --git a/core/src/node/api/processors/download.ts b/core/src/node/api/processors/download.ts new file mode 100644 index 000000000..686ba58a1 --- /dev/null +++ b/core/src/node/api/processors/download.ts @@ -0,0 +1,106 @@ +import { resolve, sep } from 'path' +import { DownloadEvent } from '../../../api' +import { normalizeFilePath } from '../../helper/path' +import { getJanDataFolderPath } from '../../helper' +import { DownloadManager } from '../../helper/download' +import { createWriteStream, renameSync } from 'fs' +import { Processor } from './Processor' +import { DownloadState } from '../../../types' + +export class Downloader implements Processor { + observer?: Function + + constructor(observer?: Function) { + this.observer = observer + } + + process(key: string, ...args: any[]): any { + const instance = this as any + const func = instance[key] + return func(this.observer, ...args) + } + + downloadFile(observer: any, url: string, localPath: string, network: any) { + const request = require('request') + const progress = require('request-progress') + + const strictSSL = !network?.ignoreSSL + const proxy = network?.proxy?.startsWith('http') ? network.proxy : undefined + if (typeof localPath === 'string') { + localPath = normalizeFilePath(localPath) + } + const array = localPath.split(sep) + const fileName = array.pop() ?? '' + const modelId = array.pop() ?? 
'' + + const destination = resolve(getJanDataFolderPath(), localPath) + const rq = request({ url, strictSSL, proxy }) + + // Put request to download manager instance + DownloadManager.instance.setRequest(localPath, rq) + + // Downloading file to a temp file first + const downloadingTempFile = `${destination}.download` + + progress(rq, {}) + .on('progress', (state: any) => { + const downloadState: DownloadState = { + ...state, + modelId, + fileName, + downloadState: 'downloading', + } + console.log('progress: ', downloadState) + observer?.(DownloadEvent.onFileDownloadUpdate, downloadState) + DownloadManager.instance.downloadProgressMap[modelId] = downloadState + }) + .on('error', (error: Error) => { + const currentDownloadState = DownloadManager.instance.downloadProgressMap[modelId] + const downloadState: DownloadState = { + ...currentDownloadState, + error: error.message, + downloadState: 'error', + } + if (currentDownloadState) { + DownloadManager.instance.downloadProgressMap[modelId] = downloadState + } + + observer?.(DownloadEvent.onFileDownloadError, downloadState) + }) + .on('end', () => { + const currentDownloadState = DownloadManager.instance.downloadProgressMap[modelId] + if (currentDownloadState && DownloadManager.instance.networkRequests[localPath]) { + // Finished downloading, rename temp file to actual file + renameSync(downloadingTempFile, destination) + const downloadState: DownloadState = { + ...currentDownloadState, + downloadState: 'end', + } + observer?.(DownloadEvent.onFileDownloadSuccess, downloadState) + DownloadManager.instance.downloadProgressMap[modelId] = downloadState + } + }) + .pipe(createWriteStream(downloadingTempFile)) + } + + abortDownload(observer: any, fileName: string) { + const rq = DownloadManager.instance.networkRequests[fileName] + if (rq) { + DownloadManager.instance.networkRequests[fileName] = undefined + rq?.abort() + } else { + observer?.(DownloadEvent.onFileDownloadError, { + fileName, + error: 'aborted', + }) + } + } + + 
resumeDownload(observer: any, fileName: any) { + DownloadManager.instance.networkRequests[fileName]?.resume() + } + + pauseDownload(observer: any, fileName: any) { + DownloadManager.instance.networkRequests[fileName]?.pause() + } +} diff --git a/core/src/node/api/processors/extension.ts b/core/src/node/api/processors/extension.ts new file mode 100644 index 000000000..df5d2d945 --- /dev/null +++ b/core/src/node/api/processors/extension.ts @@ -0,0 +1,88 @@ +import { readdirSync } from 'fs' +import { join, extname } from 'path' + +import { Processor } from './Processor' +import { ModuleManager } from '../../helper/module' +import { getJanExtensionsPath as getPath } from '../../helper' +import { + getActiveExtensions as getExtensions, + getExtension, + removeExtension, + installExtensions, +} from '../../extension/store' +import { appResourcePath } from '../../helper/path' + +export class Extension implements Processor { + observer?: Function + + constructor(observer?: Function) { + this.observer = observer + } + + process(key: string, ...args: any[]): any { + const instance = this as any + const func = instance[key] + return func(...args) + } + + invokeExtensionFunc(modulePath: string, method: string, ...params: any[]) { + const module = require(join(getPath(), modulePath)) + ModuleManager.instance.setModule(modulePath, module) + + if (typeof module[method] === 'function') { + return module[method](...params) + } else { + console.debug(module[method]) + console.error(`Function "${method}" does not exist in the module.`) + } + } + + /** + * Returns the paths of the base extensions. + * @returns An array of paths to the base extensions. 
+ */ + async baseExtensions() { + const baseExtensionPath = join(await appResourcePath(), 'pre-install') + return readdirSync(baseExtensionPath) + .filter((file) => extname(file) === '.tgz') + .map((file) => join(baseExtensionPath, file)) + } + + /**MARK: Extension Manager handlers */ + async installExtension(extensions: any) { + // Install and activate all provided extensions + const installed = await installExtensions(extensions) + return JSON.parse(JSON.stringify(installed)) + } + + // Register IPC route to uninstall a extension + async uninstallExtension(extensions: any) { + // Uninstall all provided extensions + for (const ext of extensions) { + const extension = getExtension(ext) + await extension.uninstall() + if (extension.name) removeExtension(extension.name) + } + + // Reload all renderer pages if needed + return true + } + + // Register IPC route to update a extension + async updateExtension(extensions: any) { + // Update all provided extensions + const updated: any[] = [] + for (const ext of extensions) { + const extension = getExtension(ext) + const res = await extension.update() + if (res) updated.push(extension) + } + + // Reload all renderer pages if needed + return JSON.parse(JSON.stringify(updated)) + } + + getActiveExtensions() { + return JSON.parse(JSON.stringify(getExtensions())) + } +} diff --git a/core/src/node/api/processors/fs.ts b/core/src/node/api/processors/fs.ts new file mode 100644 index 000000000..93a5f1905 --- /dev/null +++ b/core/src/node/api/processors/fs.ts @@ -0,0 +1,25 @@ +import { join } from 'path' +import { normalizeFilePath } from '../../helper/path' +import { getJanDataFolderPath } from '../../helper' +import { Processor } from './Processor' + +export class FileSystem implements Processor { + observer?: Function + private static moduleName = 'fs' + + constructor(observer?: Function) { + this.observer = observer + } + + process(route: string, ...args: any[]): any { + return import(FileSystem.moduleName).then((mdl) => + 
mdl[route]( + ...args.map((arg: any) => + typeof arg === 'string' && (arg.startsWith(`file:/`) || arg.startsWith(`file:\\`)) + ? join(getJanDataFolderPath(), normalizeFilePath(arg)) + : arg + ) + ) + ) + } +} diff --git a/core/src/node/api/processors/fsExt.ts b/core/src/node/api/processors/fsExt.ts new file mode 100644 index 000000000..71e07ae57 --- /dev/null +++ b/core/src/node/api/processors/fsExt.ts @@ -0,0 +1,78 @@ +import { join } from 'path' +import fs from 'fs' +import { FileManagerRoute } from '../../../api' +import { appResourcePath, normalizeFilePath } from '../../helper/path' +import { getJanDataFolderPath, getJanDataFolderPath as getPath } from '../../helper' +import { Processor } from './Processor' +import { FileStat } from '../../../types' + +export class FSExt implements Processor { + observer?: Function + + constructor(observer?: Function) { + this.observer = observer + } + + process(key: string, ...args: any): any { + const instance = this as any + const func = instance[key] + return func(...args) + } + + // Handles the 'syncFile' IPC event. This event is triggered to synchronize a file from a source path to a destination path. + syncFile(src: string, dest: string) { + const reflect = require('@alumna/reflect') + return reflect({ + src, + dest, + recursive: true, + delete: false, + overwrite: true, + errorOnExist: false, + }) + } + + // Handles the 'getJanDataFolderPath' IPC event. This event is triggered to get the user space path. + getJanDataFolderPath() { + return Promise.resolve(getPath()) + } + + // Handles the 'getResourcePath' IPC event. This event is triggered to get the resource path. + getResourcePath() { + return appResourcePath() + } + + // Handles the 'getUserHomePath' IPC event. This event is triggered to get the user home path. + getUserHomePath() { + return process.env[process.platform == 'win32' ? 
'USERPROFILE' : 'HOME'] + } + + // handle fs is directory here + fileStat(path: string) { + const normalizedPath = normalizeFilePath(path) + + const fullPath = join(getJanDataFolderPath(), normalizedPath) + const isExist = fs.existsSync(fullPath) + if (!isExist) return undefined + + const isDirectory = fs.lstatSync(fullPath).isDirectory() + const size = fs.statSync(fullPath).size + + const fileStat: FileStat = { + isDirectory, + size, + } + + return fileStat + } + + writeBlob(path: string, data: any) { + try { + const normalizedPath = normalizeFilePath(path) + const dataBuffer = Buffer.from(data, 'base64') + fs.writeFileSync(join(getJanDataFolderPath(), normalizedPath), dataBuffer) + } catch (err) { + console.error(`writeFile ${path} result: ${err}`) + } + } +} diff --git a/core/src/node/api/restful/app/download.ts b/core/src/node/api/restful/app/download.ts new file mode 100644 index 000000000..b5919659b --- /dev/null +++ b/core/src/node/api/restful/app/download.ts @@ -0,0 +1,23 @@ +import { DownloadRoute } from '../../../../api' +import { DownloadManager } from '../../../helper/download' +import { HttpServer } from '../../HttpServer' + +export const downloadRouter = async (app: HttpServer) => { + app.get(`/download/${DownloadRoute.getDownloadProgress}/:modelId`, async (req, res) => { + const modelId = req.params.modelId + + console.debug(`Getting download progress for model ${modelId}`) + console.debug( + `All Download progress: ${JSON.stringify(DownloadManager.instance.downloadProgressMap)}` + ) + + // check if null DownloadManager.instance.downloadProgressMap + if (!DownloadManager.instance.downloadProgressMap[modelId]) { + return res.status(404).send({ + message: 'Download progress not found', + }) + } else { + return res.status(200).send(DownloadManager.instance.downloadProgressMap[modelId]) + } + }) +} diff --git a/core/src/node/api/restful/app/handlers.ts b/core/src/node/api/restful/app/handlers.ts new file mode 100644 index 000000000..43c3f7add --- 
/dev/null +++ b/core/src/node/api/restful/app/handlers.ts @@ -0,0 +1,13 @@ +import { HttpServer } from '../../HttpServer' +import { Handler, RequestHandler } from '../../common/handler' + +export function handleRequests(app: HttpServer) { + const restWrapper: Handler = (route: string, listener: (...args: any[]) => any) => { + app.post(`/app/${route}`, async (request: any, reply: any) => { + const args = JSON.parse(request.body) as any[] + reply.send(JSON.stringify(await listener(...args))) + }) + } + const handler = new RequestHandler(restWrapper) + handler.handle() +} diff --git a/core/src/node/api/routes/common.ts b/core/src/node/api/restful/common.ts similarity index 54% rename from core/src/node/api/routes/common.ts rename to core/src/node/api/restful/common.ts index 8887755fe..433632989 100644 --- a/core/src/node/api/routes/common.ts +++ b/core/src/node/api/restful/common.ts @@ -1,24 +1,34 @@ -import { AppRoute } from '../../../api' import { HttpServer } from '../HttpServer' -import { basename, join } from 'path' import { chatCompletions, deleteBuilder, downloadModel, getBuilder, retrieveBuilder, -} from '../common/builder' + createMessage, + createThread, + getMessages, + retrieveMessage, + updateThread, +} from './helper/builder' -import { JanApiRouteConfiguration } from '../common/configuration' -import { startModel, stopModel } from '../common/startStopModel' +import { JanApiRouteConfiguration } from './helper/configuration' +import { startModel, stopModel } from './helper/startStopModel' import { ModelSettingParams } from '../../../types' -import { getJanDataFolderPath } from '../../utils' -import { normalizeFilePath } from '../../path' export const commonRouter = async (app: HttpServer) => { + const normalizeData = (data: any) => { + return { + object: 'list', + data, + } + } // Common Routes + // Read & Delete :: Threads | Models | Assistants Object.keys(JanApiRouteConfiguration).forEach((key) => { - app.get(`/${key}`, async (_request) => 
getBuilder(JanApiRouteConfiguration[key])) + app.get(`/${key}`, async (_request) => + getBuilder(JanApiRouteConfiguration[key]).then(normalizeData) + ) app.get(`/${key}/:id`, async (request: any) => retrieveBuilder(JanApiRouteConfiguration[key], request.params.id) @@ -29,7 +39,26 @@ export const commonRouter = async (app: HttpServer) => { ) }) - // Download Model Routes + // Threads + app.post(`/threads/`, async (req, res) => createThread(req.body)) + + app.get(`/threads/:threadId/messages`, async (req, res) => + getMessages(req.params.threadId).then(normalizeData) + ) + + app.get(`/threads/:threadId/messages/:messageId`, async (req, res) => + retrieveMessage(req.params.threadId, req.params.messageId) + ) + + app.post(`/threads/:threadId/messages`, async (req, res) => + createMessage(req.params.threadId as any, req.body as any) + ) + + app.patch(`/threads/:threadId`, async (request: any) => + updateThread(request.params.threadId, request.body) + ) + + // Models app.get(`/models/download/:modelId`, async (request: any) => downloadModel(request.params.modelId, { ignoreSSL: request.query.ignoreSSL === 'true', @@ -48,24 +77,6 @@ export const commonRouter = async (app: HttpServer) => { app.put(`/models/:modelId/stop`, async (request: any) => stopModel(request.params.modelId)) - // Chat Completion Routes + // Chat Completion app.post(`/chat/completions`, async (request: any, reply: any) => chatCompletions(request, reply)) - - // App Routes - app.post(`/app/${AppRoute.joinPath}`, async (request: any, reply: any) => { - const args = JSON.parse(request.body) as any[] - - const paths = args[0].map((arg: string) => - typeof arg === 'string' && (arg.startsWith(`file:/`) || arg.startsWith(`file:\\`)) - ? 
join(getJanDataFolderPath(), normalizeFilePath(arg)) - : arg - ) - - reply.send(JSON.stringify(join(...paths))) - }) - - app.post(`/app/${AppRoute.baseName}`, async (request: any, reply: any) => { - const args = JSON.parse(request.body) as any[] - reply.send(JSON.stringify(basename(args[0]))) - }) } diff --git a/core/src/node/api/common/builder.ts b/core/src/node/api/restful/helper/builder.ts similarity index 96% rename from core/src/node/api/common/builder.ts rename to core/src/node/api/restful/helper/builder.ts index 5c99cf4d8..7001c0c76 100644 --- a/core/src/node/api/common/builder.ts +++ b/core/src/node/api/restful/helper/builder.ts @@ -1,10 +1,11 @@ import fs from 'fs' import { JanApiRouteConfiguration, RouteConfiguration } from './configuration' import { join } from 'path' -import { ContentType, MessageStatus, Model, ThreadMessage } from './../../../index' -import { getEngineConfiguration, getJanDataFolderPath } from '../../utils' +import { ContentType, MessageStatus, Model, ThreadMessage } from '../../../../index' +import { getEngineConfiguration, getJanDataFolderPath } from '../../../helper' import { DEFAULT_CHAT_COMPLETION_URL } from './consts' +// TODO: Refactor these export const getBuilder = async (configuration: RouteConfiguration) => { const directoryPath = join(getJanDataFolderPath(), configuration.dirName) try { @@ -124,7 +125,7 @@ export const getMessages = async (threadId: string): Promise => } } -export const retrieveMesasge = async (threadId: string, messageId: string) => { +export const retrieveMessage = async (threadId: string, messageId: string) => { const messages = await getMessages(threadId) const filteredMessages = messages.filter((m) => m.id === messageId) if (!filteredMessages || filteredMessages.length === 0) { @@ -317,13 +318,6 @@ export const chatCompletions = async (request: any, reply: any) => { apiUrl = engineConfiguration.full_url } - reply.raw.writeHead(200, { - 'Content-Type': 'text/event-stream', - 'Cache-Control': 'no-cache', 
- 'Connection': 'keep-alive', - 'Access-Control-Allow-Origin': '*', - }) - const headers: Record = { 'Content-Type': 'application/json', } @@ -342,8 +336,14 @@ export const chatCompletions = async (request: any, reply: any) => { }) if (response.status !== 200) { console.error(response) - return + reply.code(400).send(response) } else { + reply.raw.writeHead(200, { + 'Content-Type': 'text/event-stream', + 'Cache-Control': 'no-cache', + 'Connection': 'keep-alive', + 'Access-Control-Allow-Origin': '*', + }) response.body.pipe(reply.raw) } } diff --git a/core/src/node/api/common/configuration.ts b/core/src/node/api/restful/helper/configuration.ts similarity index 100% rename from core/src/node/api/common/configuration.ts rename to core/src/node/api/restful/helper/configuration.ts diff --git a/core/src/node/api/common/consts.ts b/core/src/node/api/restful/helper/consts.ts similarity index 100% rename from core/src/node/api/common/consts.ts rename to core/src/node/api/restful/helper/consts.ts diff --git a/core/src/node/api/common/startStopModel.ts b/core/src/node/api/restful/helper/startStopModel.ts similarity index 99% rename from core/src/node/api/common/startStopModel.ts rename to core/src/node/api/restful/helper/startStopModel.ts index 0d4934e1c..0e6972b0b 100644 --- a/core/src/node/api/common/startStopModel.ts +++ b/core/src/node/api/restful/helper/startStopModel.ts @@ -1,9 +1,9 @@ import fs from 'fs' import { join } from 'path' -import { getJanDataFolderPath, getJanExtensionsPath, getSystemResourceInfo } from '../../utils' -import { logServer } from '../../log' +import { getJanDataFolderPath, getJanExtensionsPath, getSystemResourceInfo } from '../../../helper' +import { logServer } from '../../../helper/log' import { ChildProcessWithoutNullStreams, spawn } from 'child_process' -import { Model, ModelSettingParams, PromptTemplate } from '../../../types' +import { Model, ModelSettingParams, PromptTemplate } from '../../../../types' import { LOCAL_HOST, 
NITRO_DEFAULT_PORT, diff --git a/core/src/node/api/restful/v1.ts b/core/src/node/api/restful/v1.ts new file mode 100644 index 000000000..5eb8f5067 --- /dev/null +++ b/core/src/node/api/restful/v1.ts @@ -0,0 +1,16 @@ +import { HttpServer } from '../HttpServer' +import { commonRouter } from './common' +import { downloadRouter } from './app/download' +import { handleRequests } from './app/handlers' + +export const v1Router = async (app: HttpServer) => { + // MARK: Public API Routes + app.register(commonRouter) + + // MARK: Internal Application Routes + handleRequests(app) + + // Expanded route for tracking download progress + // TODO: Replace by Observer Wrapper (ZeroMQ / Vanilla Websocket) + app.register(downloadRouter) +} diff --git a/core/src/node/api/routes/download.ts b/core/src/node/api/routes/download.ts deleted file mode 100644 index ab8c0bd37..000000000 --- a/core/src/node/api/routes/download.ts +++ /dev/null @@ -1,58 +0,0 @@ -import { DownloadRoute } from '../../../api' -import { join } from 'path' -import { DownloadManager } from '../../download' -import { HttpServer } from '../HttpServer' -import { createWriteStream } from 'fs' -import { getJanDataFolderPath } from '../../utils' -import { normalizeFilePath } from '../../path' - -export const downloadRouter = async (app: HttpServer) => { - app.post(`/${DownloadRoute.downloadFile}`, async (req, res) => { - const strictSSL = !(req.query.ignoreSSL === 'true') - const proxy = req.query.proxy?.startsWith('http') ? req.query.proxy : undefined - const body = JSON.parse(req.body as any) - const normalizedArgs = body.map((arg: any) => { - if (typeof arg === 'string' && arg.startsWith('file:')) { - return join(getJanDataFolderPath(), normalizeFilePath(arg)) - } - return arg - }) - - const localPath = normalizedArgs[1] - const fileName = localPath.split('/').pop() ?? 
'' - - const request = require('request') - const progress = require('request-progress') - - const rq = request({ url: normalizedArgs[0], strictSSL, proxy }) - progress(rq, {}) - .on('progress', function (state: any) { - console.log('download onProgress', state) - }) - .on('error', function (err: Error) { - console.log('download onError', err) - }) - .on('end', function () { - console.log('download onEnd') - }) - .pipe(createWriteStream(normalizedArgs[1])) - - DownloadManager.instance.setRequest(fileName, rq) - }) - - app.post(`/${DownloadRoute.abortDownload}`, async (req, res) => { - const body = JSON.parse(req.body as any) - const normalizedArgs = body.map((arg: any) => { - if (typeof arg === 'string' && arg.startsWith('file:')) { - return join(getJanDataFolderPath(), normalizeFilePath(arg)) - } - return arg - }) - - const localPath = normalizedArgs[0] - const fileName = localPath.split('/').pop() ?? '' - const rq = DownloadManager.instance.networkRequests[fileName] - DownloadManager.instance.networkRequests[fileName] = undefined - rq?.abort() - }) -} diff --git a/core/src/node/api/routes/extension.ts b/core/src/node/api/routes/extension.ts deleted file mode 100644 index 02bc54eb3..000000000 --- a/core/src/node/api/routes/extension.ts +++ /dev/null @@ -1,49 +0,0 @@ -import { join, extname } from 'path' -import { ExtensionRoute } from '../../../api/index' -import { ModuleManager } from '../../module' -import { getActiveExtensions, installExtensions } from '../../extension/store' -import { HttpServer } from '../HttpServer' - -import { readdirSync } from 'fs' -import { getJanExtensionsPath } from '../../utils' - -export const extensionRouter = async (app: HttpServer) => { - // TODO: Share code between node projects - app.post(`/${ExtensionRoute.getActiveExtensions}`, async (_req, res) => { - const activeExtensions = await getActiveExtensions() - res.status(200).send(activeExtensions) - }) - - app.post(`/${ExtensionRoute.baseExtensions}`, async (_req, res) => { - 
const baseExtensionPath = join(__dirname, '..', '..', '..', 'pre-install') - const extensions = readdirSync(baseExtensionPath) - .filter((file) => extname(file) === '.tgz') - .map((file) => join(baseExtensionPath, file)) - - res.status(200).send(extensions) - }) - - app.post(`/${ExtensionRoute.installExtension}`, async (req) => { - const extensions = req.body as any - const installed = await installExtensions(JSON.parse(extensions)[0]) - return JSON.parse(JSON.stringify(installed)) - }) - - app.post(`/${ExtensionRoute.invokeExtensionFunc}`, async (req, res) => { - const args = JSON.parse(req.body as any) - console.debug(args) - const module = await import(join(getJanExtensionsPath(), args[0])) - - ModuleManager.instance.setModule(args[0], module) - const method = args[1] - if (typeof module[method] === 'function') { - // remove first item from args - const newArgs = args.slice(2) - console.log(newArgs) - return module[method](...args.slice(2)) - } else { - console.debug(module[method]) - console.error(`Function "${method}" does not exist in the module.`) - } - }) -} diff --git a/core/src/node/api/routes/fileManager.ts b/core/src/node/api/routes/fileManager.ts deleted file mode 100644 index 66056444e..000000000 --- a/core/src/node/api/routes/fileManager.ts +++ /dev/null @@ -1,14 +0,0 @@ -import { FileManagerRoute } from '../../../api' -import { HttpServer } from '../../index' - -export const fsRouter = async (app: HttpServer) => { - app.post(`/app/${FileManagerRoute.syncFile}`, async (request: any, reply: any) => {}) - - app.post(`/app/${FileManagerRoute.getJanDataFolderPath}`, async (request: any, reply: any) => {}) - - app.post(`/app/${FileManagerRoute.getResourcePath}`, async (request: any, reply: any) => {}) - - app.post(`/app/${FileManagerRoute.getUserHomePath}`, async (request: any, reply: any) => {}) - - app.post(`/app/${FileManagerRoute.fileStat}`, async (request: any, reply: any) => {}) -} diff --git a/core/src/node/api/routes/fs.ts 
b/core/src/node/api/routes/fs.ts deleted file mode 100644 index c5404ccce..000000000 --- a/core/src/node/api/routes/fs.ts +++ /dev/null @@ -1,29 +0,0 @@ -import { FileSystemRoute } from '../../../api' -import { join } from 'path' -import { HttpServer } from '../HttpServer' -import { getJanDataFolderPath } from '../../utils' -import { normalizeFilePath } from '../../path' - -export const fsRouter = async (app: HttpServer) => { - const moduleName = 'fs' - // Generate handlers for each fs route - Object.values(FileSystemRoute).forEach((route) => { - app.post(`/${route}`, async (req, res) => { - const body = JSON.parse(req.body as any) - try { - const result = await import(moduleName).then((mdl) => { - return mdl[route]( - ...body.map((arg: any) => - typeof arg === 'string' && (arg.startsWith(`file:/`) || arg.startsWith(`file:\\`)) - ? join(getJanDataFolderPath(), normalizeFilePath(arg)) - : arg - ) - ) - }) - res.status(200).send(result) - } catch (ex) { - console.log(ex) - } - }) - }) -} diff --git a/core/src/node/api/routes/index.ts b/core/src/node/api/routes/index.ts deleted file mode 100644 index e6edc62f7..000000000 --- a/core/src/node/api/routes/index.ts +++ /dev/null @@ -1,6 +0,0 @@ -export * from './download' -export * from './extension' -export * from './fs' -export * from './thread' -export * from './common' -export * from './v1' diff --git a/core/src/node/api/routes/thread.ts b/core/src/node/api/routes/thread.ts deleted file mode 100644 index 4066d2716..000000000 --- a/core/src/node/api/routes/thread.ts +++ /dev/null @@ -1,30 +0,0 @@ -import { HttpServer } from '../HttpServer' -import { - createMessage, - createThread, - getMessages, - retrieveMesasge, - updateThread, -} from '../common/builder' - -export const threadRouter = async (app: HttpServer) => { - // create thread - app.post(`/`, async (req, res) => createThread(req.body)) - - app.get(`/:threadId/messages`, async (req, res) => getMessages(req.params.threadId)) - - // retrieve message - 
app.get(`/:threadId/messages/:messageId`, async (req, res) => - retrieveMesasge(req.params.threadId, req.params.messageId), - ) - - // create message - app.post(`/:threadId/messages`, async (req, res) => - createMessage(req.params.threadId as any, req.body as any), - ) - - // modify thread - app.patch(`/:threadId`, async (request: any) => - updateThread(request.params.threadId, request.body), - ) -} diff --git a/core/src/node/api/routes/v1.ts b/core/src/node/api/routes/v1.ts deleted file mode 100644 index a2a48cd8b..000000000 --- a/core/src/node/api/routes/v1.ts +++ /dev/null @@ -1,25 +0,0 @@ -import { HttpServer } from '../HttpServer' -import { commonRouter } from './common' -import { threadRouter } from './thread' -import { fsRouter } from './fs' -import { extensionRouter } from './extension' -import { downloadRouter } from './download' - -export const v1Router = async (app: HttpServer) => { - // MARK: External Routes - app.register(commonRouter) - app.register(threadRouter, { - prefix: '/threads', - }) - - // MARK: Internal Application Routes - app.register(fsRouter, { - prefix: '/fs', - }) - app.register(extensionRouter, { - prefix: '/extension', - }) - app.register(downloadRouter, { - prefix: '/download', - }) -} diff --git a/core/src/node/extension/extension.ts b/core/src/node/extension/extension.ts index aeb0277c0..1f8dfa3ec 100644 --- a/core/src/node/extension/extension.ts +++ b/core/src/node/extension/extension.ts @@ -104,7 +104,7 @@ export default class Extension { await pacote.extract( this.specifier, join(ExtensionManager.instance.getExtensionsPath() ?? '', this.name ?? 
''), - this.installOptions, + this.installOptions ) // Set the url using the custom extensions protocol diff --git a/core/src/node/extension/index.ts b/core/src/node/extension/index.ts index ed8544773..994fc97f2 100644 --- a/core/src/node/extension/index.ts +++ b/core/src/node/extension/index.ts @@ -41,8 +41,8 @@ async function registerExtensionProtocol() { console.error('Electron is not available') } const extensionPath = ExtensionManager.instance.getExtensionsPath() - if (electron) { - return electron.protocol.registerFileProtocol('extension', (request: any, callback: any) => { + if (electron && electron.protocol) { + return electron.protocol?.registerFileProtocol('extension', (request: any, callback: any) => { const entry = request.url.substr('extension://'.length - 1) const url = normalize(extensionPath + entry) @@ -69,7 +69,7 @@ export function useExtensions(extensionsPath: string) { // Read extension list from extensions folder const extensions = JSON.parse( - readFileSync(ExtensionManager.instance.getExtensionsFile(), 'utf-8'), + readFileSync(ExtensionManager.instance.getExtensionsFile(), 'utf-8') ) try { // Create and store a Extension instance for each extension in list @@ -82,7 +82,7 @@ export function useExtensions(extensionsPath: string) { throw new Error( 'Could not successfully rebuild list of installed extensions.\n' + error + - '\nPlease check the extensions.json file in the extensions folder.', + '\nPlease check the extensions.json file in the extensions folder.' ) } @@ -122,7 +122,7 @@ function loadExtension(ext: any) { export function getStore() { if (!ExtensionManager.instance.getExtensionsFile()) { throw new Error( - 'The extension path has not yet been set up. Please run useExtensions before accessing the store', + 'The extension path has not yet been set up. 
Please run useExtensions before accessing the store' ) } diff --git a/core/src/node/extension/store.ts b/core/src/node/extension/store.ts index 84b1f9caf..93b1aeb2b 100644 --- a/core/src/node/extension/store.ts +++ b/core/src/node/extension/store.ts @@ -1,6 +1,6 @@ -import { writeFileSync } from "fs"; -import Extension from "./extension"; -import { ExtensionManager } from "./manager"; +import { writeFileSync } from 'fs' +import Extension from './extension' +import { ExtensionManager } from './manager' /** * @module store @@ -11,7 +11,7 @@ import { ExtensionManager } from "./manager"; * Register of installed extensions * @type {Object.} extension - List of installed extensions */ -const extensions: Record = {}; +const extensions: Record = {} /** * Get a extension from the stored extensions. @@ -21,10 +21,10 @@ const extensions: Record = {}; */ export function getExtension(name: string) { if (!Object.prototype.hasOwnProperty.call(extensions, name)) { - throw new Error(`Extension ${name} does not exist`); + throw new Error(`Extension ${name} does not exist`) } - return extensions[name]; + return extensions[name] } /** @@ -33,7 +33,7 @@ export function getExtension(name: string) { * @alias extensionManager.getAllExtensions */ export function getAllExtensions() { - return Object.values(extensions); + return Object.values(extensions) } /** @@ -42,7 +42,7 @@ export function getAllExtensions() { * @alias extensionManager.getActiveExtensions */ export function getActiveExtensions() { - return Object.values(extensions).filter((extension) => extension.active); + return Object.values(extensions).filter((extension) => extension.active) } /** @@ -53,9 +53,9 @@ export function getActiveExtensions() { * @alias extensionManager.removeExtension */ export function removeExtension(name: string, persist = true) { - const del = delete extensions[name]; - if (persist) persistExtensions(); - return del; + const del = delete extensions[name] + if (persist) persistExtensions() + return del 
} /** @@ -65,10 +65,10 @@ export function removeExtension(name: string, persist = true) { * @returns {void} */ export function addExtension(extension: Extension, persist = true) { - if (extension.name) extensions[extension.name] = extension; + if (extension.name) extensions[extension.name] = extension if (persist) { - persistExtensions(); - extension.subscribe("pe-persist", persistExtensions); + persistExtensions() + extension.subscribe('pe-persist', persistExtensions) } } @@ -77,14 +77,11 @@ export function addExtension(extension: Extension, persist = true) { * @returns {void} */ export function persistExtensions() { - const persistData: Record = {}; + const persistData: Record = {} for (const name in extensions) { - persistData[name] = extensions[name]; + persistData[name] = extensions[name] } - writeFileSync( - ExtensionManager.instance.getExtensionsFile(), - JSON.stringify(persistData), - ); + writeFileSync(ExtensionManager.instance.getExtensionsFile(), JSON.stringify(persistData)) } /** @@ -94,26 +91,29 @@ export function persistExtensions() { * @returns {Promise.>} New extension * @alias extensionManager.installExtensions */ -export async function installExtensions(extensions: any, store = true) { - const installed: Extension[] = []; +export async function installExtensions(extensions: any) { + const installed: Extension[] = [] for (const ext of extensions) { // Set install options and activation based on input type - const isObject = typeof ext === "object"; - const spec = isObject ? [ext.specifier, ext] : [ext]; - const activate = isObject ? ext.activate !== false : true; + const isObject = typeof ext === 'object' + const spec = isObject ? [ext.specifier, ext] : [ext] + const activate = isObject ? 
ext.activate !== false : true // Install and possibly activate extension - const extension = new Extension(...spec); - await extension._install(); - if (activate) extension.setActive(true); + const extension = new Extension(...spec) + if (!extension.origin) { + continue + } + await extension._install() + if (activate) extension.setActive(true) // Add extension to store if needed - if (store) addExtension(extension); - installed.push(extension); + addExtension(extension) + installed.push(extension) } // Return list of all installed extensions - return installed; + return installed } /** diff --git a/core/src/node/utils/index.ts b/core/src/node/helper/config.ts similarity index 91% rename from core/src/node/utils/index.ts rename to core/src/node/helper/config.ts index 4bcbf13b1..71e721578 100644 --- a/core/src/node/utils/index.ts +++ b/core/src/node/helper/config.ts @@ -1,8 +1,7 @@ -import { AppConfiguration, SystemResourceInfo } from '../../types' +import { AppConfiguration } from '../../types' import { join } from 'path' import fs from 'fs' import os from 'os' -import { log, logServer } from '../log' import childProcess from 'child_process' // TODO: move this to core @@ -56,34 +55,6 @@ export const updateAppConfiguration = (configuration: AppConfiguration): Promise return Promise.resolve() } -/** - * Utility function to get server log path - * - * @returns {string} The log path. - */ -export const getServerLogPath = (): string => { - const appConfigurations = getAppConfigurations() - const logFolderPath = join(appConfigurations.data_folder, 'logs') - if (!fs.existsSync(logFolderPath)) { - fs.mkdirSync(logFolderPath, { recursive: true }) - } - return join(logFolderPath, 'server.log') -} - -/** - * Utility function to get app log path - * - * @returns {string} The log path. 
- */ -export const getAppLogPath = (): string => { - const appConfigurations = getAppConfigurations() - const logFolderPath = join(appConfigurations.data_folder, 'logs') - if (!fs.existsSync(logFolderPath)) { - fs.mkdirSync(logFolderPath, { recursive: true }) - } - return join(logFolderPath, 'app.log') -} - /** * Utility function to get data folder path * @@ -146,18 +117,6 @@ const exec = async (command: string): Promise => { }) } -export const getSystemResourceInfo = async (): Promise => { - const cpu = await physicalCpuCount() - const message = `[NITRO]::CPU informations - ${cpu}` - log(message) - logServer(message) - - return { - numCpuPhysicalCore: cpu, - memAvailable: 0, // TODO: this should not be 0 - } -} - export const getEngineConfiguration = async (engineId: string) => { if (engineId !== 'openai') { return undefined @@ -167,3 +126,31 @@ export const getEngineConfiguration = async (engineId: string) => { const data = fs.readFileSync(filePath, 'utf-8') return JSON.parse(data) } + +/** + * Utility function to get server log path + * + * @returns {string} The log path. + */ +export const getServerLogPath = (): string => { + const appConfigurations = getAppConfigurations() + const logFolderPath = join(appConfigurations.data_folder, 'logs') + if (!fs.existsSync(logFolderPath)) { + fs.mkdirSync(logFolderPath, { recursive: true }) + } + return join(logFolderPath, 'server.log') +} + +/** + * Utility function to get app log path + * + * @returns {string} The log path. 
+ */ +export const getAppLogPath = (): string => { + const appConfigurations = getAppConfigurations() + const logFolderPath = join(appConfigurations.data_folder, 'logs') + if (!fs.existsSync(logFolderPath)) { + fs.mkdirSync(logFolderPath, { recursive: true }) + } + return join(logFolderPath, 'app.log') +} diff --git a/core/src/node/download.ts b/core/src/node/helper/download.ts similarity index 67% rename from core/src/node/download.ts rename to core/src/node/helper/download.ts index 6d15fc344..b9fb88bb5 100644 --- a/core/src/node/download.ts +++ b/core/src/node/helper/download.ts @@ -1,15 +1,18 @@ +import { DownloadState } from '../../types' /** * Manages file downloads and network requests. */ export class DownloadManager { - public networkRequests: Record = {}; + public networkRequests: Record = {} - public static instance: DownloadManager = new DownloadManager(); + public static instance: DownloadManager = new DownloadManager() + + public downloadProgressMap: Record = {} constructor() { if (DownloadManager.instance) { - return DownloadManager.instance; + return DownloadManager.instance } } /** @@ -18,6 +21,6 @@ export class DownloadManager { * @param {Request | undefined} request - The network request to set, or undefined to clear the request. 
*/ setRequest(fileName: string, request: any | undefined) { - this.networkRequests[fileName] = request; + this.networkRequests[fileName] = request } } diff --git a/core/src/node/helper/index.ts b/core/src/node/helper/index.ts new file mode 100644 index 000000000..6fc54fc6b --- /dev/null +++ b/core/src/node/helper/index.ts @@ -0,0 +1,6 @@ +export * from './config' +export * from './download' +export * from './log' +export * from './module' +export * from './path' +export * from './resource' diff --git a/core/src/node/log.ts b/core/src/node/helper/log.ts similarity index 93% rename from core/src/node/log.ts rename to core/src/node/helper/log.ts index 6f2c2f80f..8ff196943 100644 --- a/core/src/node/log.ts +++ b/core/src/node/helper/log.ts @@ -1,6 +1,6 @@ import fs from 'fs' import util from 'util' -import { getAppLogPath, getServerLogPath } from './utils' +import { getAppLogPath, getServerLogPath } from './config' export const log = (message: string) => { const path = getAppLogPath() diff --git a/core/src/node/module.ts b/core/src/node/helper/module.ts similarity index 100% rename from core/src/node/module.ts rename to core/src/node/helper/module.ts diff --git a/core/src/node/helper/path.ts b/core/src/node/helper/path.ts new file mode 100644 index 000000000..c20889f4c --- /dev/null +++ b/core/src/node/helper/path.ts @@ -0,0 +1,35 @@ +import { join } from 'path' + +/** + * Normalize file path + * Remove all file protocol prefix + * @param path + * @returns + */ +export function normalizeFilePath(path: string): string { + return path.replace(/^(file:[\\/]+)([^:\s]+)$/, '$2') +} + +export async function appResourcePath(): Promise { + let electron: any = undefined + + try { + const moduleName = 'electron' + electron = await import(moduleName) + } catch (err) { + console.error('Electron is not available') + } + + // electron + if (electron && electron.protocol) { + let appPath = join(electron.app.getAppPath(), '..', 'app.asar.unpacked') + + if (!electron.app.isPackaged) { 
+      // for development mode + appPath = join(electron.app.getAppPath()) + } + return appPath + } + // server + return join(global.core.appPath(), '../../..') +} diff --git a/core/src/node/helper/resource.ts b/core/src/node/helper/resource.ts new file mode 100644 index 000000000..c79a63688 --- /dev/null +++ b/core/src/node/helper/resource.ts @@ -0,0 +1,14 @@ +import { SystemResourceInfo } from '../../types' +import { physicalCpuCount } from './config' +import { log, logServer } from './log' + +export const getSystemResourceInfo = async (): Promise => { + const cpu = await physicalCpuCount() + const message = `[NITRO]::CPU informations - ${cpu}` + log(message) + + return { + numCpuPhysicalCore: cpu, + memAvailable: 0, // TODO: this should not be 0 + } +} diff --git a/core/src/node/index.ts b/core/src/node/index.ts index 10385ecfc..31f2f076e 100644 --- a/core/src/node/index.ts +++ b/core/src/node/index.ts @@ -2,9 +2,5 @@ export * from './extension/index' export * from './extension/extension' export * from './extension/manager' export * from './extension/store' -export * from './download' -export * from './module' export * from './api' -export * from './log' -export * from './utils' -export * from './path' +export * from './helper' diff --git a/core/src/node/path.ts b/core/src/node/path.ts deleted file mode 100644 index adbc38c6c..000000000 --- a/core/src/node/path.ts +++ /dev/null @@ -1,9 +0,0 @@ -/** - * Normalize file path - * Remove all file protocol prefix - * @param path - * @returns - */ -export function normalizeFilePath(path: string): string { - return path.replace(/^(file:[\\/]+)([^:\s]+)$/, "$2"); -} diff --git a/core/src/types/assistant/assistantEvent.ts b/core/src/types/assistant/assistantEvent.ts new file mode 100644 index 000000000..8c32f5d37 --- /dev/null +++ b/core/src/types/assistant/assistantEvent.ts @@ -0,0 +1,7 @@ +/** + * The `AssistantEvent` enumeration contains the names of all the available events in the Jan platform.
+ */ +export enum AssistantEvent { + /** The `OnAssistantsUpdate` event is emitted when the assistant list is updated. */ + OnAssistantsUpdate = 'OnAssistantsUpdate', +} diff --git a/core/src/types/assistant/index.ts b/core/src/types/assistant/index.ts index 83ea73f85..e18589551 100644 --- a/core/src/types/assistant/index.ts +++ b/core/src/types/assistant/index.ts @@ -1,2 +1,3 @@ export * from './assistantEntity' +export * from './assistantEvent' export * from './assistantInterface' diff --git a/core/src/types/file/index.ts b/core/src/types/file/index.ts index 6526cfc6d..cc7274a28 100644 --- a/core/src/types/file/index.ts +++ b/core/src/types/file/index.ts @@ -2,3 +2,26 @@ export type FileStat = { isDirectory: boolean size: number } + +export type DownloadState = { + modelId: string + fileName: string + time: DownloadTime + speed: number + percent: number + + size: DownloadSize + children?: DownloadState[] + error?: string + downloadState: 'downloading' | 'error' | 'end' +} + +type DownloadTime = { + elapsed: number + remaining: number +} + +type DownloadSize = { + total: number + transferred: number +} diff --git a/core/src/types/message/index.ts b/core/src/types/message/index.ts index e8d78deda..ebb4c363d 100644 --- a/core/src/types/message/index.ts +++ b/core/src/types/message/index.ts @@ -1,3 +1,4 @@ export * from './messageEntity' export * from './messageInterface' export * from './messageEvent' +export * from './messageRequestType' diff --git a/core/src/types/message/messageEntity.ts b/core/src/types/message/messageEntity.ts index 87e4b1997..e9211d550 100644 --- a/core/src/types/message/messageEntity.ts +++ b/core/src/types/message/messageEntity.ts @@ -27,6 +27,8 @@ export type ThreadMessage = { updated: number /** The additional metadata of this message. **/ metadata?: Record + + type?: string } /** @@ -56,6 +58,8 @@ export type MessageRequest = { /** The thread of this message is belong to. 
**/ // TODO: deprecate threadId field thread?: Thread + + type?: string } /** diff --git a/core/src/types/message/messageRequestType.ts b/core/src/types/message/messageRequestType.ts new file mode 100644 index 000000000..cbb4cf421 --- /dev/null +++ b/core/src/types/message/messageRequestType.ts @@ -0,0 +1,5 @@ +export enum MessageRequestType { + Thread = 'Thread', + Assistant = 'Assistant', + Summary = 'Summary', +} diff --git a/core/src/types/model/modelEvent.ts b/core/src/types/model/modelEvent.ts index 978a48724..443f3a34f 100644 --- a/core/src/types/model/modelEvent.ts +++ b/core/src/types/model/modelEvent.ts @@ -12,4 +12,6 @@ export enum ModelEvent { OnModelStop = 'OnModelStop', /** The `OnModelStopped` event is emitted when a model stopped ok. */ OnModelStopped = 'OnModelStopped', + /** The `OnModelsUpdate` event is emitted when the model list is updated. */ + OnModelsUpdate = 'OnModelsUpdate', } diff --git a/core/src/types/model/modelInterface.ts b/core/src/types/model/modelInterface.ts index 74a479f3c..93d5867ee 100644 --- a/core/src/types/model/modelInterface.ts +++ b/core/src/types/model/modelInterface.ts @@ -10,7 +10,7 @@ export interface ModelInterface { * @param network - Optional object to specify proxy/whether to ignore SSL certificates. * @returns A Promise that resolves when the model has been downloaded. */ - downloadModel(model: Model, network?: { ignoreSSL?: boolean, proxy?: string }): Promise + downloadModel(model: Model, network?: { ignoreSSL?: boolean; proxy?: string }): Promise /** * Cancels the download of a specific model.
diff --git a/core/tests/node/path.test.ts b/core/tests/node/path.test.ts index 9f8a557bb..5390df119 100644 --- a/core/tests/node/path.test.ts +++ b/core/tests/node/path.test.ts @@ -1,4 +1,4 @@ -import { normalizeFilePath } from "../../src/node/path"; +import { normalizeFilePath } from "../../src/node/helper/path"; describe("Test file normalize", () => { test("returns no file protocol prefix on Unix", async () => { diff --git a/core/tslint.json b/core/tslint.json index 398a41670..6543a641a 100644 --- a/core/tslint.json +++ b/core/tslint.json @@ -1,6 +1,3 @@ { - "extends": [ - "tslint-config-standard", - "tslint-config-prettier" - ] -} \ No newline at end of file + "extends": ["tslint-config-standard", "tslint-config-prettier"] +} diff --git a/docker-compose.yml b/docker-compose.yml new file mode 100644 index 000000000..1691a841a --- /dev/null +++ b/docker-compose.yml @@ -0,0 +1,172 @@ +# Docker Compose file for setting up Minio, createbuckets, app_cpu, and app_gpu services + +version: '3.7' + +services: + # Minio service for object storage + minio: + image: minio/minio + volumes: + - minio_data:/data + ports: + - "9000:9000" + - "9001:9001" + environment: + # Set the root user and password for Minio + MINIO_ROOT_USER: minioadmin # This acts as AWS_ACCESS_KEY + MINIO_ROOT_PASSWORD: minioadmin # This acts as AWS_SECRET_ACCESS_KEY + command: server --console-address ":9001" /data + restart: always + healthcheck: + test: ["CMD", "curl", "-f", "http://localhost:9000/minio/health/live"] + interval: 30s + timeout: 20s + retries: 3 + networks: + vpcbr: + ipv4_address: 10.5.0.2 + + # createbuckets service to create a bucket and set its policy + createbuckets: + image: minio/mc + depends_on: + - minio + entrypoint: > + /bin/sh -c " + /usr/bin/mc alias set myminio http://minio:9000 minioadmin minioadmin; + /usr/bin/mc mb myminio/mybucket; + /usr/bin/mc policy set public myminio/mybucket; + exit 0; + " + networks: + vpcbr: + + # app_cpu service for running the CPU version of 
the application + app_cpu_s3fs: + image: jan:latest + volumes: + - app_data_cpu_s3fs:/app/server/build/jan + build: + context: . + dockerfile: Dockerfile + environment: + # Set the AWS access key, secret access key, bucket name, endpoint, and region for app_cpu + AWS_ACCESS_KEY_ID: minioadmin + AWS_SECRET_ACCESS_KEY: minioadmin + S3_BUCKET_NAME: mybucket + AWS_ENDPOINT: http://10.5.0.2:9000 + AWS_REGION: us-east-1 + API_BASE_URL: http://localhost:1337 + restart: always + profiles: + - cpu-s3fs + ports: + - "3000:3000" + - "1337:1337" + - "3928:3928" + networks: + vpcbr: + ipv4_address: 10.5.0.3 + + # app_gpu service for running the GPU version of the application + app_gpu_s3fs: + deploy: + resources: + reservations: + devices: + - driver: nvidia + count: all + capabilities: [gpu] + image: jan-gpu:latest + volumes: + - app_data_gpu_s3fs:/app/server/build/jan + build: + context: . + dockerfile: Dockerfile.gpu + restart: always + environment: + # Set the AWS access key, secret access key, bucket name, endpoint, and region for app_gpu + AWS_ACCESS_KEY_ID: minioadmin + AWS_SECRET_ACCESS_KEY: minioadmin + S3_BUCKET_NAME: mybucket + AWS_ENDPOINT: http://10.5.0.2:9000 + AWS_REGION: us-east-1 + API_BASE_URL: http://localhost:1337 + profiles: + - gpu-s3fs + ports: + - "3000:3000" + - "1337:1337" + - "3928:3928" + networks: + vpcbr: + ipv4_address: 10.5.0.4 + + app_cpu_fs: + image: jan:latest + volumes: + - app_data_cpu_fs:/app/server/build/jan + build: + context: . + dockerfile: Dockerfile + environment: + API_BASE_URL: http://localhost:1337 + restart: always + profiles: + - cpu-fs + ports: + - "3000:3000" + - "1337:1337" + - "3928:3928" + networks: + vpcbr: + ipv4_address: 10.5.0.5 + + # app_gpu service for running the GPU version of the application + app_gpu_fs: + deploy: + resources: + reservations: + devices: + - driver: nvidia + count: all + capabilities: [gpu] + image: jan-gpu:latest + volumes: + - app_data_gpu_fs:/app/server/build/jan + build: + context: . 
+ dockerfile: Dockerfile.gpu + restart: always + environment: + API_BASE_URL: http://localhost:1337 + profiles: + - gpu-fs + ports: + - "3000:3000" + - "1337:1337" + - "3928:3928" + networks: + vpcbr: + ipv4_address: 10.5.0.6 + +volumes: + minio_data: + app_data_cpu_s3fs: + app_data_gpu_s3fs: + app_data_cpu_fs: + app_data_gpu_fs: + +networks: + vpcbr: + driver: bridge + ipam: + config: + - subnet: 10.5.0.0/16 + gateway: 10.5.0.1 + +# Usage: +# - Run 'docker compose --profile cpu-s3fs up -d' to start the app_cpu service +# - Run 'docker compose --profile gpu-s3fs up -d' to start the app_gpu service +# - Run 'docker compose --profile cpu-fs up -d' to start the app_cpu service +# - Run 'docker compose --profile gpu-fs up -d' to start the app_gpu service diff --git a/docs/docs/about/03-engineering/05-postmortems/01-january-10-2024-bitdefender-false-positive-flag.mdx b/docs/blog/01-january-10-2024-bitdefender-false-positive-flag.mdx similarity index 96% rename from docs/docs/about/03-engineering/05-postmortems/01-january-10-2024-bitdefender-false-positive-flag.mdx rename to docs/blog/01-january-10-2024-bitdefender-false-positive-flag.mdx index 4d0189c60..ef418ff97 100644 --- a/docs/docs/about/03-engineering/05-postmortems/01-january-10-2024-bitdefender-false-positive-flag.mdx +++ b/docs/blog/01-january-10-2024-bitdefender-false-positive-flag.mdx @@ -1,22 +1,8 @@ --- -title: | - 10/1/24: Bitdefender False Positive Flag (Resolved) +title: "Post Mortem: Bitdefender False Positive Flag" +description: "10th January 2024, Jan's 0.4.4 Release on Windows triggered Bitdefender to incorrectly flag it as infected with Gen:Variant.Tedy.258323, leading to automatic quarantine warnings on users' computers." slug: /postmortems/january-10-2024-bitdefender-false-positive-flag -description: Jan is a ChatGPT-alternative that runs on your own computer, with a local API server. 
-keywords: - [ - Jan AI, - Jan, - ChatGPT alternative, - local AI, - private AI, - conversational AI, - no-subscription fee, - large language model, - postmortem, - incident, - flagging issue, - ] +tags: [Postmortem] --- Following the recent incident related to Jan version 0.4.4 triggering Bitdefender on Windows with Gen:Variant.Tedy.258323 on January 10, 2024, we wanted to provide a comprehensive postmortem and outline the necessary follow-up actions. diff --git a/docs/blog/README.md b/docs/blog/README.md deleted file mode 100644 index 464090415..000000000 --- a/docs/blog/README.md +++ /dev/null @@ -1 +0,0 @@ -# TODO diff --git a/docs/blog/authors.yml b/docs/blog/authors.yml index f30d4610d..ec58002e4 100644 --- a/docs/blog/authors.yml +++ b/docs/blog/authors.yml @@ -1,6 +1,76 @@ dan-jan: name: Daniel Onggunhao title: Co-Founder - url: https://github.com/dan-jan + url: https://github.com/dan-jan image_url: https://avatars.githubusercontent.com/u/101145494?v=4 - email: daniel@jan.ai \ No newline at end of file + email: daniel@jan.ai + +namchuai: + name: Nam Nguyen + title: Developer + url: https://github.com/namchuai + image_url: https://avatars.githubusercontent.com/u/10397206?v=4 + email: james@jan.ai + +hiro-v: + name: Hiro Vuong + title: MLE + url: https://github.com/hiro-v + image_url: https://avatars.githubusercontent.com/u/22463238?v=4 + email: hiro@jan.ai + +ashley-jan: + name: Ashley Tran + title: Product Designer + url: https://github.com/imtuyethan + image_url: https://avatars.githubusercontent.com/u/89722390?v=4 + email: ashley@jan.ai + +hientominh: + name: Hien To + title: DevOps Engineer + url: https://github.com/hientominh + image_url: https://avatars.githubusercontent.com/u/37921427?v=4 + email: hien@jan.ai + +Van-QA: + name: Van Pham + title: QA & Release Manager + url: https://github.com/Van-QA + image_url: https://avatars.githubusercontent.com/u/64197333?v=4 + email: van@jan.ai + +louis-jan: + name: Louis Le + title: Software Engineer + url: 
https://github.com/louis-jan + image_url: https://avatars.githubusercontent.com/u/133622055?v=4 + email: louis@jan.ai + +hahuyhoang411: + name: Rex Ha + title: LLM Researcher & Content Writer + url: https://github.com/hahuyhoang411 + image_url: https://avatars.githubusercontent.com/u/64120343?v=4 + email: rex@jan.ai + +automaticcat: + name: Alan Dao + title: AI Engineer + url: https://github.com/tikikun + image_url: https://avatars.githubusercontent.com/u/22268502?v=4 + email: alan@jan.ai + +hieu-jan: + name: Henry Ho + title: Software Engineer + url: https://github.com/hieu-jan + image_url: https://avatars.githubusercontent.com/u/150573299?v=4 + email: hieu@jan.ai + +0xsage: + name: Nicole Zhu + title: Co-Founder + url: https://github.com/0xsage + image_url: https://avatars.githubusercontent.com/u/69952136?v=4 + email: nicole@jan.ai diff --git a/docs/docs/about/01-README.md b/docs/docs/about/01-README.md deleted file mode 100644 index d5d3b8dc2..000000000 --- a/docs/docs/about/01-README.md +++ /dev/null @@ -1,139 +0,0 @@ ---- -title: About Jan -slug: /about -description: Jan is a ChatGPT-alternative that runs on your own computer, with a local API server. -keywords: - [ - Jan AI, - Jan, - ChatGPT alternative, - local AI, - private AI, - conversational AI, - no-subscription fee, - large language model, - ] ---- - -Jan believes in the need for an **open source AI ecosystem**. We are focused on building the infra and tooling to allow open source AIs to compete on a level playing field with proprietary ones. - -Jan's long-term technical endeavor is to build a cognitive framework for future robots, who are practical, useful assistants for humans and businesses in everyday life. - -## Quicklinks - -- Core product vision for [Jan Framework](../docs) -- R&D and model training efforts [Discord](https://discord.gg/9NfUSyzp3y) (via our small data-center which is `free & open to all researchers who lack GPUs`!) 
-- Current implementations of Jan Framework: [Jan Desktop](https://jan.ai/), [Nitro](https://nitro.jan.ai/) - -## Why does Jan Exist? - -### Mission - -Our current mission is to allow humans and businesses to **own their AI, with the right to tinker, repair and innovate**. - -:::tip -Our life-long mission is to **eliminate work - so human can focus on creation, invention, and moral governance over robots**. -::: - -### Ideal Customer - -Our ideal customer is an AI enthusiast or business who has experienced some limitations with current AI solutions and is keen to find open source alternatives. - -### Problems - -Our ideal customer would use Jan to solve one of these problems. - -_Control_ - -- Control (e.g. preventing vendor lock-in) -- Stability (e.g. runs predictably every time) -- Local-use (e.g. for speed, or for airgapped environments) - -_Privacy_ - -- Data protection (e.g. personal data or company data) -- Privacy (e.g. nsfw) - -_Customisability_ - -- Tinkerability (e.g. ability to change model, experiment) -- Niche Models (e.g. fine-tuned, domain-specific models that outperform OpenAI) - -Sources: [^1] [^2] [^3] [^4] - -[^1]: [What are you guys doing that can't be done with ChatGPT?](https://www.reddit.com/r/LocalLLaMA/comments/17mghqr/comment/k7ksti6/?utm_source=share&utm_medium=web2x&context=3) -[^2]: [What's your main interest in running a local LLM instead of an existing API?](https://www.reddit.com/r/LocalLLaMA/comments/1718a9o/whats_your_main_interest_in_running_a_local_llm/) -[^3]: [Ask HN: What's the best self-hosted/local alternative to GPT-4?](https://news.ycombinator.com/item?id=36138224) -[^4]: [LoRAs](https://www.reddit.com/r/LocalLLaMA/comments/17mghqr/comment/k7mdz1i/?utm_source=share&utm_medium=web2x&context=3) - -### Solution - -Jan is a seamless user experience that runs on your personal computer, that glues the different pieces of the open source AI ecosystem to provide an alternative to OpenAI's closed platform. 
- -- We build a comprehensive, seamless platform that takes care of the technical chores across the stack required to run open source AI -- We run on top of a local folder of non-proprietary files, that anyone can tinker with (yes, even other apps!) -- We provide open formats for packaging and distributing AI to run reproducibly across devices - -## How Jan Works - -### Open Source - -Jan is a startup with an open source business model. We believe in the need for an open source AI ecosystem, and are committed to building it. - -- [Jan Framework](https://github.com/janhq/jan) (AGPLv3) -- [Jan Desktop Client & Local server](https://jan.ai) (AGPLv3, built on Jan Framework) -- [Nitro: run Local AI](https://github.com/janhq/nitro) (AGPLv3) - -### Build in Public - -We use GitHub to build in public and welcome anyone to join in. - -- [Jan's Kanban](https://github.com/orgs/janhq/projects/5) -- [Jan's Roadmap](https://github.com/orgs/janhq/projects/5/views/29) -- [Jan's Newsletter](https://newsletter.jan.ai) - -### Remote Team - -Jan has a fully-remote team. We are mainly based in the APAC timezone. We use [Discord](https://discord.gg/af6SaTdzpx) and [Github](https://github.com/janhq) to work. - -### Bootstrapped - -Jan is currently a bootstrapped, founder funded startup. - -We balance technical invention with the search for a sustainable business model. Thus, we appreciate any business inquiries that can balance growth with cashflow. - -**We invite you to join us on our journey to find PMF**. Join our [Discord here](https://discord.gg/BnHRr3Q7Ms) - -### Analytics - -Adhering to Jan's privacy preserving philosophy, our analytics philosophy is to get `barely-enough-to-function`. - -#### What is tracked - -1. By default, Github tracks downloads and device metadata for all public GitHub repositories. This helps us troubleshoot & ensure cross-platform support. -2. 
We use [Umami](https://umami.is/) to collect, analyze, and understand application data while maintaining visitor privacy and data ownership. We are using the Umami Cloud in Europe to ensure GDPR compliance. Please see [Umami Privacy Policy](https://umami.is/privacy) for more details. -3. We use Umami to track a single `app.opened` event without additional user metadata, in order to understand retention. In addition, we track `app.event` to understand app version usage. -4. Additionally, we plan to enable a `Settings` feature for users to turn off all tracking. - -#### Request for help - -As a result, our feature prioritization can feel a bit black box at times. - -We'd appreciate high quality insights and volunteers for user interviews through [Discord](https://discord.gg/af6SaTdzpx) and [Github](https://github.com/janhq). - -## Contact - -### General Enquiries - -Drop us a message in our [Discord](https://discord.gg/af6SaTdzpx) and we'll get back to you. - -- `#general`: for general discussion -- `#jan-dev`: for Jan-related questions -- `#nitro-dev`: for Nitro-related questions -- '#bd-inquiries': for enterprise license queries - -### Careers - -Jan has a culture of ownership, independent thought, and lightning fast execution. If you'd like to join us, we have open positions on our [careers page](https://janai.bamboohr.com/careers). - -## Footnotes diff --git a/docs/docs/about/02-onboarding/README.md b/docs/docs/about/02-onboarding/README.md deleted file mode 100644 index bf232c07d..000000000 --- a/docs/docs/about/02-onboarding/README.md +++ /dev/null @@ -1,79 +0,0 @@ ---- -title: Onboarding -description: Jan is a ChatGPT-alternative that runs on your own computer, with a local API server. -slug: /onboarding -keywords: - [ - Jan AI, - Jan, - ChatGPT alternative, - local AI, - private AI, - conversational AI, - no-subscription fee, - large language model, - ] ---- - -# Onboarding - -Welcome to Jan! We’re really excited to bring you onboard. 
- -## Expectations - -- **Take Initiative** Take ownership of an area. If you see a problem, take it and own it to completion. Your work will often not be defined, or poorly defined. Take the initiative to figure out what needs to be done, seek others out for clarification, and then communicate what you will be doing to the team. - -- **Bias to Action** There are many problem-filled areas. There is no need to ask for permission or try to build consensus: just take action. - -- **Speak Up** We require clear, effective and timely communication, which enables others to coordinate with you to be effective. We are a fully distributed, remote team of people from different cultures and languages. If conflicts do arise, first assume Hanlon’s Razor: “Never attribute to malice that which is adequately explained by ~~stupidity~~ lack of communication or too much ambiguity”. Don’t take things personally, be a professional. - -- **Mastery** We are working in a frontier industry, where there are no playbooks, and expertise is developed by doing. Own your area, and build mastery. - -## Code of conduct - -- We operate on the basis of trust. -- We expect you to be available and communicative during scheduled meetings or work hours. -- Turning on video during meetings is encouraged. -- Casual dress during meetings is acceptable; however, use discretion (No nudity, pajamas, etc.) -- While it’s natural for people to disagree at times, disagreement is no excuse for poor behavior and poor manners. We cannot allow that frustration to turn into a personal attack. -- Respect other people's cultures. Especially since we are working in a diverse working culture. -- Sexual harassment is a specific type of prohibited conduct. Sexual harassment is any unwelcome conduct of a sexual nature that might reasonably be expected or be perceived to cause offense or humiliation. 
Sexual harassment may involve any conduct of a verbal, nonverbal, or physical nature, including written and electronic communications, and may occur between persons of the same or different genders. - -## Onboarding Checklist - -### HR - -- [ ] Service Agreement -- [ ] Equipment Loan Agreement -- [ ] Calendar events - - [ ] Add to Google Team - - [ ] Add to Standup & TGIF -- [ ] `#hr-*` channel -- [ ] BambooHr Log-in -- [ ] Add Emergency Contact in BambooHR - -### Apps you will need - -:::info - -💡 In order to feel connected in a remote workplace, we encourage you to add your profile photo to all the accounts. - -::: - -- Company-wide - - [ ] Google:`[first_name]@jan.ai` - - Recommended: setup on Mobile too (i.e. Calendar, Mail) - - We use Google Calendar for tracking meetings, etc. - - [ ] Discord: - - [Invite link](https://discord.gg/sZb6qxfgyx) to Jan’s Discord - - We use Discord for day-to-day Comms in the company (ala Slack) - - Recommended: setup on Mobile with Notifications - - Download the desktop app - - [ ] 1Password - - [ ] [Jan](https://jan.ai/) - Desktop App -- Engineering - - [ ] Code Editor (such as VSCode, Vim, ect) - - [ ] Github -- Communications - - [ ] Fill in your contact details [here](https://docs.google.com/spreadsheets/d/1KAxya29_wb1bEESiFJeCrOec4pCG3uA2D4_VPgAn89U/edit#gid=0) - - [ ] To make sure everyone in the remote working environment understands more about each other, we encourage you to share your `How to work with me` in the [Drive Tab](https://docs.google.com/spreadsheets/d/1KAxya29_wb1bEESiFJeCrOec4pCG3uA2D4_VPgAn89U/edit#gid=0) under your name and the Discord `Internal` channel. diff --git a/docs/docs/about/03-engineering/03-mlops.md b/docs/docs/about/03-engineering/03-mlops.md deleted file mode 100644 index d3e768a58..000000000 --- a/docs/docs/about/03-engineering/03-mlops.md +++ /dev/null @@ -1,149 +0,0 @@ ---- -title: MLOps -description: Jan is a ChatGPT-alternative that runs on your own computer, with a local API server. 
-slug: /engineering/mlops -keywords: - [ - Jan AI, - Jan, - ChatGPT alternative, - local AI, - private AI, - conversational AI, - no-subscription fee, - large language model, - ] ---- - -## Connecting to Rigs - -We have a small data rig you can remote into for R&D and CI. - -### Pritunl Setup - -1. **Install Pritunl**: [Download here](https://client.pritunl.com/#install) -2. **Import .ovpn file** -3. **VSCode**: Install the "Remote-SSH" extension for connection - -### Llama.cpp Setup - -1. **Clone Repo**: `git clone https://github.com/ggerganov/llama.cpp && cd llama.cpp` -2. **Build**: - -```bash -mkdir build && cd build -cmake .. -DLLAMA_CUBLAS=ON -DLLAMA_CUDA_F16=ON -DLLAMA_CUDA_MMV_Y=8 -cmake --build . --config Release -``` - -3. **Download Model:** - -```bash -cd ../models && wget https://huggingface.co/TheBloke/Llama-2-7B-GGUF/resolve/main/llama-2-7b.Q8_0.gguf -``` - -4. **Run:** - -```bash -cd ../build/bin/ -./main -m ./models/llama-2-7b.Q8_0.gguf -p "Writing a thesis proposal can be done in 10 simple steps:\nStep 1:" -n 2048 -e -ngl 100 -t 48 -``` - -For the llama.cpp CLI arguments you can see here: - -| Short Option | Long Option | Param Value | Description | -| --------------- | --------------------- | ----------- | ---------------------------------------------------------------- | -| `-h` | `--help` | | Show this help message and exit | -| `-i` | `--interactive` | | Run in interactive mode | -| | `--interactive-first` | | Run in interactive mode and wait for input right away | -| | `-ins`, `--instruct` | | Run in instruction mode (use with Alpaca models) | -| `-r` | `--reverse-prompt` | `PROMPT` | Run in interactive mode and poll user input upon seeing `PROMPT` | -| | `--color` | | Colorise output to distinguish prompt and user input from | -| **Generations** | -| `-s` | `--seed` | `SEED` | Seed for random number generator | -| `-t` | `--threads` | `N` | Number of threads to use during computation | -| `-p` | `--prompt` | `PROMPT` | Prompt to start 
generation with | -| | `--random-prompt` | | Start with a randomized prompt | -| | `--in-prefix` | `STRING` | String to prefix user inputs with | -| `-f` | `--file` | `FNAME` | Prompt file to start generation | -| `-n` | `--n_predict` | `N` | Number of tokens to predict | -| | `--top_k` | `N` | Top-k sampling | -| | `--top_p` | `N` | Top-p sampling | -| | `--repeat_last_n` | `N` | Last n tokens to consider for penalize | -| | `--repeat_penalty` | `N` | Penalize repeat sequence of tokens | -| `-c` | `--ctx_size` | `N` | Size of the prompt context | -| | `--ignore-eos` | | Ignore end of stream token and continue generating | -| | `--memory_f32` | | Use `f32` instead of `f16` for memory key+value | -| | `--temp` | `N` | Temperature | -| | `--n_parts` | `N` | Number of model parts | -| `-b` | `--batch_size` | `N` | Batch size for prompt processing | -| | `--perplexity` | | Compute perplexity over the prompt | -| | `--keep` | | Number of tokens to keep from the initial prompt | -| | `--mlock` | | Force system to keep model in RAM | -| | `--mtest` | | Determine the maximum memory usage | -| | `--verbose-prompt` | | Print prompt before generation | -| `-m` | `--model` | `FNAME` | Model path | - -### TensorRT-LLM Setup - -#### **Docker and TensorRT-LLM build** - -> Note: You should run with admin permission to make sure everything works fine - -1. **Docker Image:** - -```bash -sudo make -C docker build -``` - -2. **Run Container:** - -```bash -sudo make -C docker run -``` - -Once in the container, TensorRT-LLM can be built from the source using the following: - -3. **Build:** - -```bash -# To build the TensorRT-LLM code. -python3 ./scripts/build_wheel.py --trt_root /usr/local/tensorrt -# Deploy TensorRT-LLM in your environment. -pip install ./build/tensorrt_llm*.whl -``` - -> Note: You can specify the GPU architecture (e.g. for 4090 is ADA) for compilation time reduction -> The list of supported architectures can be found in the `CMakeLists.txt` file. 
- -```bash -python3 ./scripts/build_wheel.py --cuda_architectures "89-real;90-real" -``` - -#### Running TensorRT-LLM - -1. **Requirements:** - -```bash -pip install -r examples/bloom/requirements.txt && git lfs install -``` - -2. **Download Weights:** - -```bash -cd examples/llama && rm -rf ./llama/7B && mkdir -p ./llama/7B && git clone https://huggingface.co/NousResearch/Llama-2-7b-hf ./llama/7B -``` - -3. **Build Engine:** - -```bash -python build.py --model_dir ./llama/7B/ --dtype float16 --remove_input_padding --use_gpt_attention_plugin float16 --enable_context_fmha --use_gemm_plugin float16 --use_weight_only --output_dir ./llama/7B/trt_engines/weight_only/1-gpu/ -``` - -4. **Run Inference:** - -```bash -python3 run.py --max_output_len=2048 --tokenizer_dir ./llama/7B/ --engine_dir=./llama/7B/trt_engines/weight_only/1-gpu/ --input_text "Writing a thesis proposal can be done in 10 simple steps:\nStep 1:" -``` - -For the tensorRT-LLM CLI arguments, you can see in the `run.py`. diff --git a/docs/docs/about/03-engineering/04-rd.md b/docs/docs/about/03-engineering/04-rd.md deleted file mode 100644 index f173d27de..000000000 --- a/docs/docs/about/03-engineering/04-rd.md +++ /dev/null @@ -1,20 +0,0 @@ ---- -title: R&D -description: Jan is a ChatGPT-alternative that runs on your own computer, with a local API server. -slug: /engineering/research -keywords: - [ - Jan AI, - Jan, - ChatGPT alternative, - local AI, - private AI, - conversational AI, - no-subscription fee, - large language model, - ] ---- - -## Foundry Best Practices - -@alan/rex TODO diff --git a/docs/docs/about/03-engineering/05-postmortems/README.md b/docs/docs/about/03-engineering/05-postmortems/README.md deleted file mode 100644 index fda1e6c2f..000000000 --- a/docs/docs/about/03-engineering/05-postmortems/README.md +++ /dev/null @@ -1,20 +0,0 @@ ---- -title: Postmortems -description: Jan is a ChatGPT-alternative that runs on your own computer, with a local API server. 
-slug: /postmortems -keywords: - [ - Jan AI, - Jan, - ChatGPT alternative, - local AI, - private AI, - conversational AI, - no-subscription fee, - large language model, - ] ---- - -import DocCardList from "@theme/DocCardList"; - - diff --git a/docs/docs/about/04-product/README.md b/docs/docs/about/04-product/README.md deleted file mode 100644 index c07109800..000000000 --- a/docs/docs/about/04-product/README.md +++ /dev/null @@ -1,9 +0,0 @@ ---- -title: Product -slug: /product ---- - -## Prerequisites - -- [Figma](https://figma.com) -- [ScreenStudio](https://www.screen.studio/) diff --git a/docs/docs/about/05-community/events/README.mdx b/docs/docs/about/05-community/events/README.mdx deleted file mode 100644 index 92d9cd5f1..000000000 --- a/docs/docs/about/05-community/events/README.mdx +++ /dev/null @@ -1,20 +0,0 @@ ---- -title: Events -slug: /events -description: Jan is a ChatGPT-alternative that runs on your own computer, with a local API server. -keywords: - [ - Jan AI, - Jan, - ChatGPT alternative, - local AI, - private AI, - conversational AI, - no-subscription fee, - large language model, - ] ---- - -import DocCardList from "@theme/DocCardList"; - - \ No newline at end of file diff --git a/docs/docs/about/06-careers/README.md b/docs/docs/about/06-careers/README.md deleted file mode 100644 index a0a579e02..000000000 --- a/docs/docs/about/06-careers/README.md +++ /dev/null @@ -1,20 +0,0 @@ ---- -title: Careers -slug: /careers -description: Jan is a ChatGPT-alternative that runs on your own computer, with a local API server. 
-keywords: - [ - Jan AI, - Jan, - ChatGPT alternative, - local AI, - private AI, - conversational AI, - no-subscription fee, - large language model, - ] ---- - -## We're hiring - -[Careers on Bamboo](https://janai.bamboohr.com/careers) diff --git a/docs/docs/about/2035.mdx b/docs/docs/about/2035.mdx new file mode 100644 index 000000000..3af7a3197 --- /dev/null +++ b/docs/docs/about/2035.mdx @@ -0,0 +1,12 @@ +--- +title: Jan's Vision for 2035 +--- + +[Jan 2035: A Robotics Company](https://hackmd.io/QIWyYbNNQVWVbupuI3kjAA) + +We only have 2 planning parameters: + +- 10 year vision +- 2 week sprint + +And we measure our success on Quarterly OKRs \ No newline at end of file diff --git a/docs/docs/about/about.md b/docs/docs/about/about.md new file mode 100644 index 000000000..3066f3003 --- /dev/null +++ b/docs/docs/about/about.md @@ -0,0 +1,94 @@ +--- +title: About Jan +slug: /about +description: Jan is a productivity tool to customize AI to your needs and workflows. +keywords: + [ + Jan AI, + Jan, + ChatGPT alternative, + local AI, + private AI, + conversational AI, + no-subscription fee, + large language model, + ] +--- + +Jan is an [open-source](https://en.wikipedia.org/wiki/Open_source), [local-first](https://www.inkandswitch.com/local-first/) tool to [create, customize and use AI](https://www.gatesnotes.com/AI-agents) for everyday tasks. + +You can: + +- Run locally using [open-source LLMs](https://huggingface.co/models?pipeline_tag=text-generation) or connect to cloud AIs like [ChatGPT](https://openai.com/blog/openai-api) or [Google](https://ai.google.dev/) +- Fine-tune AI with specific knowledge +- Search the web and other databases +- Connect AI to your everyday tools and (with your permission) do work on your behalf + +Longer-term, Jan is building a cognitive framework for future robots. We envision a world where we have personal or company robots that we continually improve and customize, growing together with us. 
+ +![Human repairing a Droid](/img/star-wars-droids.png) + +## Why do we exist + +At Jan, our mission is to advance human-machine collaboration. We achieve this through delivering the best open-source, local-first tools to allow users to run, customize and tinker with AI. + +## What's different about it? + +| | Status Quo | Jan | +| ---------------------------------------------------------- | -------------------------------------------------------------------------- | ----------------------------------------------------------------------------------------------------------------------------- | +| Ownership | AI Monopolies owned by Big Tech | AI that you own and control | +| Openness? | Closed-source | [Open-source (AGPLv3)](https://github.com/janhq/jan/blob/main/LICENSE) | +| Your role | Consume | Create, Tinker and Customize | +| Approach | Cloud | [Local-first](https://www.inkandswitch.com/local-first/), running 100% on your devices | +| Data | Data stored on their servers | Data stored in your local filesystem in open, non-proprietary file formats | +| Privacy | 😂 | Runs 100% on your own machine, predictably, privately and offline | +| Transparency | "Black Box" | Runs predictability with code available to tinker and customize | +| What happens if there's an outage or goes out of business? | Your life's work held hostage in the cloud in proprietary data formats[^1] | Continues to run 100% on your computer, your data is safe in your local folder | +| Driving Philosophy | Monetize your users | [Privacy as a human right](https://en.wikipedia.org/wiki/Right_to_privacy) and the [Right to Repair](https://www.repair.org/) | + +## How do I get it? + +You can install and start using Jan in less than 5 minutes, from [jan.ai](https://jan.ai) or our [Github repo](https://github.com/janhq/jan). + +You can read the [User Guide](/docs/user-guide) if you need some help to get started. + +## What license is the code under? 
 + +Jan is licensed under the [AGPLv3 License](https://github.com/janhq/jan/blob/main/LICENSE). + +We happily accept pull requests; however, we do ask that you sign a [Contributor License Agreement](https://en.wikipedia.org/wiki/Contributor_License_Agreement) so that we have the right to relicense your contributions[^2]. + +We also have a [Contributor Program](/docs/team/contributor-program) to provide ownership and upside to contributors who have made significant contributions to the project. + +## What was it built with? + +[Jan](https://github.com/janhq/jan) is pragmatically built using `Typescript` at the application level and `C++` at the Inference level (which we have refactored into [Nitro](https://nitro.jan.ai)[^3]). + +We follow [clean architecture](https://blog.cleancoder.com/uncle-bob/2012/08/13/the-clean-architecture.html) and currently support multiple frameworks and runtimes: + +- A desktop client with [Electron](https://www.electronjs.org/) + +- A headless server-mode with [Nodejs](https://nodejs.org/en) + +- Planned support for mobile with [Capacitor](https://capacitorjs.com/) + +- Planned support for Python runtime + +Architecturally, we have made similar choices to the [Next.js Enterprise Javascript Stack](https://vercel.com/templates/next.js/nextjs-enterprise-boilerplate), which is a [battle-tested](https://nextjs.org/showcase/enterprise) framework for building enterprise-grade applications that scale. + +:::tip + +**At its core, Jan is a software development kit to build and run copilots on personal devices**. The Desktop Client many folks use is, rather, a specific set of extensions packaged by default. We're excited to see what developers do with the SDK (once it's in better shape). + +::: + +## Contact + +Drop us a message in our [Discord](https://discord.gg/af6SaTdzpx) and we'll get back to you. 
+ +- `#general`: for general discussion +- `#get-help`: for bug reports and troubleshooting +- `#roadmap`: for feature requests and ideas + +## Footnotes + +[^1]: Credit to Obsidian's original website +[^2]: Credit to [Discourse's About Page](https://www.discourse.org/about) +[^3]: Credit to [Llama.cpp](https://github.com/ggerganov/llama.cpp), [TensorRT-LLM](https://github.com/NVIDIA/TensorRT-LLM), [vLLM](https://github.com/vllm-project/vllm), [LMDeploy](https://github.com/InternLM/lmdeploy) and more. diff --git a/docs/docs/about/roadmap.md b/docs/docs/about/roadmap.md new file mode 100644 index 000000000..1c789d733 --- /dev/null +++ b/docs/docs/about/roadmap.md @@ -0,0 +1,6 @@ +--- +title: Roadmap +--- + +- [ ] [Immediate Roadmap on Github](https://github.com/orgs/janhq/projects/5/views/16) +- [ ] [Longer-term Roadmap on Discord](https://discord.gg/Ey62mynnYr) \ No newline at end of file diff --git a/docs/docs/about/05-community/README.md b/docs/docs/community/community.md similarity index 96% rename from docs/docs/about/05-community/README.md rename to docs/docs/community/community.md index 849cac61e..24a87daf0 100644 --- a/docs/docs/about/05-community/README.md +++ b/docs/docs/community/community.md @@ -1,5 +1,5 @@ --- -title: Community +title: Jan's Community slug: /community description: Jan is a ChatGPT-alternative that runs on your own computer, with a local API server. keywords: diff --git a/docs/docs/docs/02-integrations/README.md b/docs/docs/docs/02-integrations/README.md deleted file mode 100644 index a1fe45e0c..000000000 --- a/docs/docs/docs/02-integrations/README.md +++ /dev/null @@ -1,9 +0,0 @@ ---- -title: Integrations ---- - -Existing and upcoming 3rd party integrations on top of Jan Framework. - -From both the core development team, and core contributors. - -Suggestions? 
File an [issue here](https://github.com/janhq/jan/issues) diff --git a/docs/docs/ecosystem/ecosystem.md b/docs/docs/ecosystem/ecosystem.md new file mode 100644 index 000000000..38f939b3a --- /dev/null +++ b/docs/docs/ecosystem/ecosystem.md @@ -0,0 +1,3 @@ +--- +title: Ecosystem +--- \ No newline at end of file diff --git a/docs/docs/about/05-community/events/hcmc-oct23.md b/docs/docs/events/hcmc-oct23.md similarity index 100% rename from docs/docs/about/05-community/events/hcmc-oct23.md rename to docs/docs/events/hcmc-oct23.md diff --git a/docs/docs/about/05-community/events/nvidia-llm-day-nov-23.md b/docs/docs/events/nvidia-llm-day-nov-23.md similarity index 100% rename from docs/docs/about/05-community/events/nvidia-llm-day-nov-23.md rename to docs/docs/events/nvidia-llm-day-nov-23.md diff --git a/docs/docs/features/agents-framework.md b/docs/docs/features/agents-framework.md new file mode 100644 index 000000000..2ba312854 --- /dev/null +++ b/docs/docs/features/agents-framework.md @@ -0,0 +1,3 @@ +--- +title: Agents Framework +--- \ No newline at end of file diff --git a/docs/docs/features/api-server.md b/docs/docs/features/api-server.md new file mode 100644 index 000000000..36f697cb2 --- /dev/null +++ b/docs/docs/features/api-server.md @@ -0,0 +1,3 @@ +--- +title: API Server +--- \ No newline at end of file diff --git a/docs/docs/features/data-security.md b/docs/docs/features/data-security.md new file mode 100644 index 000000000..c5c1e6c7c --- /dev/null +++ b/docs/docs/features/data-security.md @@ -0,0 +1,3 @@ +--- +title: Data Security +--- \ No newline at end of file diff --git a/docs/docs/features/extensions-framework.md b/docs/docs/features/extensions-framework.md new file mode 100644 index 000000000..6c173ee53 --- /dev/null +++ b/docs/docs/features/extensions-framework.md @@ -0,0 +1,3 @@ +--- +title: Extensions Framework +--- \ No newline at end of file diff --git a/docs/docs/features/features.md b/docs/docs/features/features.md new file mode 100644 index 
000000000..d68e9a7ad --- /dev/null +++ b/docs/docs/features/features.md @@ -0,0 +1,3 @@ +--- +title: Features +--- \ No newline at end of file diff --git a/docs/docs/features/local.md b/docs/docs/features/local.md new file mode 100644 index 000000000..6c80c0378 --- /dev/null +++ b/docs/docs/features/local.md @@ -0,0 +1,3 @@ +--- +title: Local & Self-Hosted AI +--- \ No newline at end of file diff --git a/docs/docs/features/remote.md b/docs/docs/features/remote.md new file mode 100644 index 000000000..4145a0f0a --- /dev/null +++ b/docs/docs/features/remote.md @@ -0,0 +1,3 @@ +--- +title: OpenAI API Support (and others) +--- \ No newline at end of file diff --git a/docs/docs/foundry/foundry.md b/docs/docs/foundry/foundry.md new file mode 100644 index 000000000..e69de29bb diff --git a/docs/docs/guides/02-installation/05-docker.md b/docs/docs/guides/02-installation/05-docker.md new file mode 100644 index 000000000..6236ed92e --- /dev/null +++ b/docs/docs/guides/02-installation/05-docker.md @@ -0,0 +1,102 @@ +--- +title: Docker +slug: /install/docker +description: Jan is a ChatGPT-alternative that runs on your own computer, with a local API server. +keywords: + [ + Jan AI, + Jan, + ChatGPT alternative, + local AI, + private AI, + conversational AI, + no-subscription fee, + large language model, + docker installation, + ] +--- + +# Installing Jan using Docker + +## Installation + +### Pre-requisites + +:::note + +**Supported OS**: Linux, WSL2 Docker + +::: + +- Docker Engine and Docker Compose are required to run Jan in Docker mode. Follow the [instructions](https://docs.docker.com/engine/install/ubuntu/) below to get started with Docker Engine on Ubuntu. + +```bash +curl -fsSL https://get.docker.com -o get-docker.sh +sudo sh ./get-docker.sh --dry-run +``` + +- If you intend to run Jan in GPU mode, you need to install `nvidia-driver` and `nvidia-docker2`. 
Follow the instruction [here](https://docs.nvidia.com/datacenter/cloud-native/container-toolkit/latest/install-guide.html) for installation. + +### Instructions + +- Run Jan in Docker mode + + - **Option 1**: Run Jan in CPU mode + + ```bash + docker compose --profile cpu up -d + ``` + + - **Option 2**: Run Jan in GPU mode + + - **Step 1**: Check CUDA compatibility with your NVIDIA driver by running `nvidia-smi` and check the CUDA version in the output + + ```bash + nvidia-smi + + # Output + +---------------------------------------------------------------------------------------+ + | NVIDIA-SMI 531.18 Driver Version: 531.18 CUDA Version: 12.1 | + |-----------------------------------------+----------------------+----------------------+ + | GPU Name TCC/WDDM | Bus-Id Disp.A | Volatile Uncorr. ECC | + | Fan Temp Perf Pwr:Usage/Cap| Memory-Usage | GPU-Util Compute M. | + | | | MIG M. | + |=========================================+======================+======================| + | 0 NVIDIA GeForce RTX 4070 Ti WDDM | 00000000:01:00.0 On | N/A | + | 0% 44C P8 16W / 285W| 1481MiB / 12282MiB | 2% Default | + | | | N/A | + +-----------------------------------------+----------------------+----------------------+ + | 1 NVIDIA GeForce GTX 1660 Ti WDDM | 00000000:02:00.0 Off | N/A | + | 0% 49C P8 14W / 120W| 0MiB / 6144MiB | 0% Default | + | | | N/A | + +-----------------------------------------+----------------------+----------------------+ + | 2 NVIDIA GeForce GTX 1660 Ti WDDM | 00000000:05:00.0 Off | N/A | + | 29% 38C P8 11W / 120W| 0MiB / 6144MiB | 0% Default | + | | | N/A | + +-----------------------------------------+----------------------+----------------------+ + + +---------------------------------------------------------------------------------------+ + | Processes: | + | GPU GI CI PID Type Process name GPU Memory | + | ID ID Usage | + |=======================================================================================| + ``` + + - **Step 2**: Visit [NVIDIA NGC 
Catalog ](https://catalog.ngc.nvidia.com/orgs/nvidia/containers/cuda/tags) and find the smallest minor version of image tag that matches your CUDA version (e.g., 12.1 -> 12.1.0) + + - **Step 3**: Update the `Dockerfile.gpu` line number 5 with the latest minor version of the image tag from step 2 (e.g. change `FROM nvidia/cuda:12.2.0-runtime-ubuntu22.04 AS base` to `FROM nvidia/cuda:12.1.0-runtime-ubuntu22.04 AS base`) + + - **Step 4**: Run command to start Jan in GPU mode + + ```bash + # GPU mode + docker compose --profile gpu up -d + ``` + + This will start the web server and you can access Jan at `http://localhost:3000`. + +:::warning + +- Docker mode is currently only suitable for development and localhost. Production is not supported yet, and the RAG feature is not available in Docker mode. + +::: diff --git a/docs/docs/guides/02-installation/05-nightly-build.md b/docs/docs/guides/02-installation/07-nightly-build.md similarity index 100% rename from docs/docs/guides/02-installation/05-nightly-build.md rename to docs/docs/guides/02-installation/07-nightly-build.md diff --git a/docs/docs/guides/02-installation/07-antivirus-compatibility-testing.md b/docs/docs/guides/02-installation/08-antivirus-compatibility-testing.md similarity index 100% rename from docs/docs/guides/02-installation/07-antivirus-compatibility-testing.md rename to docs/docs/guides/02-installation/08-antivirus-compatibility-testing.md diff --git a/docs/docs/guides/04-using-models/02-import-manually.mdx b/docs/docs/guides/04-using-models/02-import-manually.mdx index 68142a8af..7c446ea1c 100644 --- a/docs/docs/guides/04-using-models/02-import-manually.mdx +++ b/docs/docs/guides/04-using-models/02-import-manually.mdx @@ -29,6 +29,10 @@ In this section, we will show you how to import a GGUF model from [HuggingFace]( > We are fast shipping a UI to make this easier, but it's a bit manual for now. Apologies. 
+## Import Models Using Absolute Filepath (version 0.4.7) + +Starting from version 0.4.7, Jan has introduced the capability to import models using an absolute file path. It allows you to import models from any directory on your computer. Please check the [import models using absolute filepath](../import-models-using-absolute-filepath) guide for more information. + ## Manually Importing a Downloaded Model (nightly versions and v0.4.4+) ### 1. Create a Model Folder @@ -186,7 +190,6 @@ This means that you can easily reconfigure your models, export them, and share y Edit `model.json` and include the following configurations: -- Ensure the filename must be `model.json`. - Ensure the `id` property matches the folder name you created. - Ensure the GGUF filename should match the `id` property exactly. - Ensure the `source.url` property is the direct binary download link ending in `.gguf`. In HuggingFace, you can find the direct links in the `Files and versions` tab. diff --git a/docs/docs/guides/04-using-models/03-import-models-using-absolute-filepath.mdx b/docs/docs/guides/04-using-models/03-import-models-using-absolute-filepath.mdx new file mode 100644 index 000000000..490f68cd6 --- /dev/null +++ b/docs/docs/guides/04-using-models/03-import-models-using-absolute-filepath.mdx @@ -0,0 +1,84 @@ +--- +title: Import Models Using Absolute Filepath +slug: /guides/using-models/import-models-using-absolute-filepath +description: Guide to import model using absolute filepath in Jan. +keywords: + [ + Jan AI, + Jan, + ChatGPT alternative, + local AI, + private AI, + conversational AI, + no-subscription fee, + large language model, + import-models-manually, + absolute-filepath, + ] +--- + +In this guide, we will walk you through the process of importing a model using an absolute filepath in Jan, using our latest model, [Trinity](https://huggingface.co/janhq/trinity-v1-GGUF), as an example. + +### 1. 
Get the Absolute Filepath of the Model + +After downloading .gguf model, you can get the absolute filepath of the model file. + +### 2. Configure the Model JSON + +1. Navigate to the `~/jan/models` folder. +2. Create a folder named ``, for example, `tinyllama`. +3. Create a `model.json` file inside the folder, including the following configurations: + +- Ensure the `id` property matches the folder name you created. +- Ensure the `url` property is the direct binary download link ending in `.gguf`. Now, you can use the absolute filepath of the model file. +- Ensure the `engine` property is set to `nitro`. + +```json +{ + "sources": [ + { + "filename": "tinyllama.gguf", + // highlight-next-line + "url": "" + } + ], + "id": "tinyllama-1.1b", + "object": "model", + "name": "(Absolute Path) TinyLlama Chat 1.1B Q4", + "version": "1.0", + "description": "TinyLlama is a tiny model with only 1.1B. It's a good model for less powerful computers.", + "format": "gguf", + "settings": { + "ctx_len": 4096, + "prompt_template": "<|system|>\n{system_message}<|user|>\n{prompt}<|assistant|>", + "llama_model_path": "tinyllama-1.1b-chat-v1.0.Q4_K_M.gguf" + }, + "parameters": { + "temperature": 0.7, + "top_p": 0.95, + "stream": true, + "max_tokens": 2048, + "stop": [], + "frequency_penalty": 0, + "presence_penalty": 0 + }, + "metadata": { + "author": "TinyLlama", + "tags": ["Tiny", "Foundation Model"], + "size": 669000000 + }, + "engine": "nitro" +} +``` + +:::warning + +- If you are using Windows, you need to use double backslashes in the url property, for example: `C:\\Users\\username\\filename.gguf`. + +::: + +### 3. Start the Model + +Restart Jan and navigate to the Hub. Locate your model and click the Use button. 
+ +![Demo](assets/03-demo-absolute-filepath.gif) \ No newline at end of file diff --git a/docs/docs/guides/04-using-models/03-integrate-with-remote-server.mdx b/docs/docs/guides/04-using-models/04-integrate-with-remote-server.mdx similarity index 97% rename from docs/docs/guides/04-using-models/03-integrate-with-remote-server.mdx rename to docs/docs/guides/04-using-models/04-integrate-with-remote-server.mdx index f0db1bd55..3632a40b0 100644 --- a/docs/docs/guides/04-using-models/03-integrate-with-remote-server.mdx +++ b/docs/docs/guides/04-using-models/04-integrate-with-remote-server.mdx @@ -88,7 +88,7 @@ You can find your API keys in the [OpenAI Platform](https://platform.openai.com/ Restart Jan and navigate to the Hub. Then, select your configured model and start the model. -![image-01](assets/03-openai-platform-configuration.png) +![image-01](assets/04-openai-platform-configuration.png) ## Engines with OAI Compatible Configuration @@ -159,7 +159,7 @@ Navigate to the `~/jan/models` folder. Create a folder named `mistral-ins-7b-q4` Restart Jan and navigate to the Hub. Locate your model and click the Use button. 
-![image-02](assets/03-oai-compatible-configuration.png) +![image-02](assets/04-oai-compatible-configuration.png) ## Assistance and Support diff --git a/docs/docs/guides/04-using-models/04-customize-engine-settings.mdx b/docs/docs/guides/04-using-models/05-customize-engine-settings.mdx similarity index 100% rename from docs/docs/guides/04-using-models/04-customize-engine-settings.mdx rename to docs/docs/guides/04-using-models/05-customize-engine-settings.mdx diff --git a/docs/docs/guides/04-using-models/assets/03-demo-absolute-filepath.gif b/docs/docs/guides/04-using-models/assets/03-demo-absolute-filepath.gif new file mode 100644 index 000000000..24dcc251a Binary files /dev/null and b/docs/docs/guides/04-using-models/assets/03-demo-absolute-filepath.gif differ diff --git a/docs/docs/guides/04-using-models/assets/03-oai-compatible-configuration.png b/docs/docs/guides/04-using-models/assets/04-oai-compatible-configuration.png similarity index 100% rename from docs/docs/guides/04-using-models/assets/03-oai-compatible-configuration.png rename to docs/docs/guides/04-using-models/assets/04-oai-compatible-configuration.png diff --git a/docs/docs/guides/04-using-models/assets/03-openai-platform-configuration.png b/docs/docs/guides/04-using-models/assets/04-openai-platform-configuration.png similarity index 100% rename from docs/docs/guides/04-using-models/assets/03-openai-platform-configuration.png rename to docs/docs/guides/04-using-models/assets/04-openai-platform-configuration.png diff --git a/docs/docs/guides/05-using-server/01-server.md b/docs/docs/guides/05-using-server/01-server.md deleted file mode 100644 index 952b7399f..000000000 --- a/docs/docs/guides/05-using-server/01-server.md +++ /dev/null @@ -1,33 +0,0 @@ ---- -title: Connect to Server -description: Connect to Jan's built-in API server. 
-keywords: - [ - Jan AI, - Jan, - ChatGPT alternative, - local AI, - private AI, - conversational AI, - no-subscription fee, - large language model, - ] ---- - -:::warning - -This page is under construction. - -::: - -Jan ships with a built-in API server, that can be used as a drop-in, local replacement for OpenAI's API. - -Jan runs on port `1337` by default, but this can (soon) be changed in Settings. - -1. Go to Settings > Advanced > Enable API Server - -2. Go to http://localhost:1337 for the API docs. - -3. In terminal, simply CURL... - -Note: Some UI states may be broken when in Server Mode. diff --git a/docs/docs/guides/05-using-server/01-start-server.md b/docs/docs/guides/05-using-server/01-start-server.md new file mode 100644 index 000000000..2433fd80a --- /dev/null +++ b/docs/docs/guides/05-using-server/01-start-server.md @@ -0,0 +1,72 @@ +--- +title: Start Local Server +slug: /guides/using-server/start-server +description: How to run Jan's built-in API server. +keywords: + [ + Jan AI, + Jan, + ChatGPT alternative, + local AI, + private AI, + conversational AI, + no-subscription fee, + large language model, + local server, + api server, + ] +--- + +Jan ships with a built-in API server that can be used as a drop-in, local replacement for OpenAI's API. You can run your server by following these simple steps. + +## Open Local API Server View + +Navigate to the Local API Server view by clicking the corresponding icon on the left side of the screen. + +

+ +![01-local-api-view](./assets/01-local-api-view.gif) + +## Choosing a Model + +On the top right of your screen under `Model Settings`, set the LLM that your local server will be running. You can choose from any of the models already installed, or pick a new model by clicking `Explore the Hub`. + +

+ +![01-choose-model](./assets/01-choose-model.png) + +## Server Options + +On the left side of your screen, you can set custom server options. + +

+ +![01-server-settings](./assets/01-server-options.png) + +### Local Server Address + +By default, Jan will be accessible only on localhost `127.0.0.1`. This means a local server can only be accessed on the same machine where the server is being run. + +You can make the local server more accessible by clicking on the address and choosing `0.0.0.0` instead, which allows the server to be accessed from other devices on the local network. This is less secure than choosing localhost, and should be done with caution. + +### Port + +Jan runs on port `1337` by default. You can change the port to any other port number if needed. + +### Cross-Origin Resource Sharing (CORS) + +Cross-Origin Resource Sharing (CORS) manages resource access on the local server from external domains. Enabled for security by default, it can be disabled if needed. + +### Verbose Server Logs + +The center of the screen displays the server logs as the local server runs. This option provides extensive details about server activities. + +## Start Server + +Click the `Start Server` button on the top left of your screen. You will see the server log display a message such as `Server listening at http://127.0.0.1:1337`, and the `Start Server` button will change to a red `Stop Server` button. + +

+ +![01-running-server](./assets/01-running-server.gif) + +You server is now running and you can use the server address and port to make requests to the local server. diff --git a/docs/docs/guides/05-using-server/02-using-server.md b/docs/docs/guides/05-using-server/02-using-server.md new file mode 100644 index 000000000..3d4b004a1 --- /dev/null +++ b/docs/docs/guides/05-using-server/02-using-server.md @@ -0,0 +1,102 @@ +--- +title: Using Jan's Built-in API Server +description: How to use Jan's built-in API server. +keywords: + [ + Jan AI, + Jan, + ChatGPT alternative, + local AI, + private AI, + conversational AI, + no-subscription fee, + large language model, + local server, + api server, + ] +--- + +Jan's built-in API server is compatible with [OpenAI's API](https://platform.openai.com/docs/api-reference) and can be used as a drop-in, local replacement. Follow these steps to use the API server. + +## Open the API Reference + +Jan contains a comprehensive API reference. This reference displays all the API endpoints available, gives you examples requests and responses, and allows you to execute them in browser. + +On the top left of your screen below the red `Stop Server` button is the blue `API Reference`. Clicking this will open the reference in your browser. + +

+ +![02-api-reference](./assets/02-api-reference.png) + +Scroll through the various available endpoints to learn what options are available and try them out by executing the example requests. In addition, you can also use the [Jan API Reference](https://jan.ai/api-reference/) on the Jan website. + +### Chat + +In the Chat section of the API reference, you will see an example JSON request body. + +

+ +![02-chat-example](./assets/02-chat-example.png) + +With your local server running, you can click the `Try it out` button on the top left, then the blue `Execute` button below the JSON. The browser will send the example request to your server, and display the response body below. + +Use the API endpoints, request and response body examples as models for your own application. + +### cURL Request Example + +Here is an example curl request with a local server running `tinyllama-1.1b`: + +

+ +```json +{ + "messages": [ + { + "content": "You are a helpful assistant.", + "role": "system" + }, + { + "content": "Hello!", + "role": "user" + } + ], + "model": "tinyllama-1.1b", + "stream": true, + "max_tokens": 2048, + "stop": [ + "hello" + ], + "frequency_penalty": 0, + "presence_penalty": 0, + "temperature": 0.7, + "top_p": 0.95 +} +' +``` + +### Response Body Example + +```json +{ + "choices": [ + { + "finish_reason": null, + "index": 0, + "message": { + "content": "Hello user. What can I help you with?", + "role": "assistant" + } + } + ], + "created": 1700193928, + "id": "ebwd2niJvJB1Q2Whyvkz", + "model": "_", + "object": "chat.completion", + "system_fingerprint": "_", + "usage": { + "completion_tokens": 500, + "prompt_tokens": 33, + "total_tokens": 533 + } +} +``` diff --git a/docs/docs/guides/05-using-server/assets/01-choose-model.png b/docs/docs/guides/05-using-server/assets/01-choose-model.png new file mode 100644 index 000000000..9062a1e95 Binary files /dev/null and b/docs/docs/guides/05-using-server/assets/01-choose-model.png differ diff --git a/docs/docs/guides/05-using-server/assets/01-local-api-view.gif b/docs/docs/guides/05-using-server/assets/01-local-api-view.gif new file mode 100644 index 000000000..cb221fce4 Binary files /dev/null and b/docs/docs/guides/05-using-server/assets/01-local-api-view.gif differ diff --git a/docs/docs/guides/05-using-server/assets/01-running-server.gif b/docs/docs/guides/05-using-server/assets/01-running-server.gif new file mode 100644 index 000000000..a4225f3cb Binary files /dev/null and b/docs/docs/guides/05-using-server/assets/01-running-server.gif differ diff --git a/docs/docs/guides/05-using-server/assets/01-server-options.png b/docs/docs/guides/05-using-server/assets/01-server-options.png new file mode 100644 index 000000000..c48844e40 Binary files /dev/null and b/docs/docs/guides/05-using-server/assets/01-server-options.png differ diff --git a/docs/docs/guides/05-using-server/assets/02-api-reference.png 
b/docs/docs/guides/05-using-server/assets/02-api-reference.png new file mode 100644 index 000000000..154d9dfc9 Binary files /dev/null and b/docs/docs/guides/05-using-server/assets/02-api-reference.png differ diff --git a/docs/docs/guides/05-using-server/assets/02-chat-example.png b/docs/docs/guides/05-using-server/assets/02-chat-example.png new file mode 100644 index 000000000..bd7e33a6a Binary files /dev/null and b/docs/docs/guides/05-using-server/assets/02-chat-example.png differ diff --git a/docs/docs/guides/07-integrations/01-integrate-continue.mdx b/docs/docs/guides/07-integrations/01-integrate-continue.mdx index 3a0e9f282..1fa0397e2 100644 --- a/docs/docs/guides/07-integrations/01-integrate-continue.mdx +++ b/docs/docs/guides/07-integrations/01-integrate-continue.mdx @@ -35,7 +35,7 @@ To get started with Continue in VS Code, please follow this [guide to install Co ### 2. Enable Jan API Server -To configure the Continue to use Jan's Local Server, you need to enable Jan API Server with your preferred model, please follow this [guide to enable Jan API Server](../05-using-server/01-server.md) +To configure the Continue to use Jan's Local Server, you need to enable Jan API Server with your preferred model, please follow this [guide to enable Jan API Server](/guides/using-server/start-server). ### 3. Configure Continue to Use Jan's Local Server @@ -77,7 +77,7 @@ Edit the `config.json` file and include the following configuration. // highlight-start "model": "mistral-ins-7b-q4", "apiKey": "EMPTY", - "apiBase": "http://localhost:1337" + "apiBase": "http://localhost:1337/v1" // highlight-end } ] @@ -86,7 +86,7 @@ Edit the `config.json` file and include the following configuration. - Ensure that the `provider` is `openai`. - Ensure that the `model` is the same as the one you enabled in the Jan API Server. -- Ensure that the `apiBase` is `http://localhost:1337`. +- Ensure that the `apiBase` is `http://localhost:1337/v1`. - Ensure that the `apiKey` is `EMPTY`. ### 4. 
Ensure the Using Model Is Activated in Jan diff --git a/docs/docs/guides/07-integrations/04-integrate-mistral-ai.mdx b/docs/docs/guides/07-integrations/04-integrate-mistral-ai.mdx new file mode 100644 index 000000000..14ddeaa75 --- /dev/null +++ b/docs/docs/guides/07-integrations/04-integrate-mistral-ai.mdx @@ -0,0 +1,89 @@ +--- +title: Integrate Mistral AI with Jan +slug: /guides/integrations/mistral-ai +description: Guide to integrate Mistral AI with Jan +keywords: + [ + Jan AI, + Jan, + ChatGPT alternative, + local AI, + private AI, + conversational AI, + no-subscription fee, + large language model, + Mistral integration, + ] +--- + +## Quick Introduction + +[Mistral AI](https://docs.mistral.ai/) currently provides two ways of accessing their Large Language Models (LLM) - via their API or via open source models available on Hugging Face. In this guide, we will show you how to integrate Mistral AI with Jan using the API method. + +## Steps to Integrate Mistral AI with Jan + +### 1. Configure Mistral API key + +You can find your API keys in the [Mistral API Key](https://console.mistral.ai/user/api-keys/) and set the Mistral AI API key in `~/jan/engines/openai.json` file. + +```json title="~/jan/engines/openai.json" +{ + // highlight-start + "full_url": "https://api.mistral.ai/v1/chat/completions", + "api_key": "" + // highlight-end +} +``` + +### 2. Modify a Model JSON + +Navigate to the `~/jan/models` folder. Create a folder named ``, for example, `mistral-tiny` and create a `model.json` file inside the folder including the following configurations: + +- Ensure the filename must be `model.json`. +- Ensure the `id` property is set to the model id from Mistral AI. +- Ensure the `format` property is set to `api`. +- Ensure the `engine` property is set to `openai`. +- Ensure the `state` property is set to `ready`. 
+ +```json title="~/jan/models/mistral-tiny/model.json" +{ + "sources": [ + { + "filename": "mistral-tiny", + "url": "https://mistral.ai/" + } + ], + "id": "mistral-tiny", + "object": "model", + "name": "Mistral-7B-v0.2 (Tiny Endpoint)", + "version": "1.0", + "description": "Currently powered by Mistral-7B-v0.2, a better fine-tuning of the initial Mistral-7B released, inspired by the fantastic work of the community.", + // highlight-next-line + "format": "api", + "settings": {}, + "parameters": {}, + "metadata": { + "author": "Mistral AI", + "tags": ["General", "Big Context Length"] + }, + // highlight-start + "engine": "openai" + // highlight-end +} +``` + +:::tip + +Mistral AI provides different endpoints. Please check out their [endpoint documentation](https://docs.mistral.ai/platform/endpoints/) to find the one that suits your needs. In this example, we will use the `mistral-tiny` model. + +::: + +### 3. Start the Model + +Restart Jan and navigate to the Hub. Locate your model and click the Use button. + +![Mitral AI Tiny Model](assets/04-mistral-ai-tiny-hub.png) + +### 4. Try Out the Integration of Jan and Mistral AI + +![Mistral AI Integration Demo](assets/04-mistral-ai-integration-demo.gif) diff --git a/docs/docs/guides/07-integrations/05-integrate-lmstudio.mdx b/docs/docs/guides/07-integrations/05-integrate-lmstudio.mdx new file mode 100644 index 000000000..58e2f0be9 --- /dev/null +++ b/docs/docs/guides/07-integrations/05-integrate-lmstudio.mdx @@ -0,0 +1,184 @@ +--- +title: Integrate LM Studio with Jan +slug: /guides/integrations/lmstudio +description: Guide to integrate LM Studio with Jan +keywords: + [ + Jan AI, + Jan, + ChatGPT alternative, + local AI, + private AI, + conversational AI, + no-subscription fee, + large language model, + LM Studio integration, + ] +--- + +## Quick Introduction + +With [LM Studio](https://lmstudio.ai/), you can discover, download, and run local Large Language Models (LLMs). 
In this guide, we will show you how to integrate and use your current models on LM Studio with Jan using 2 methods. The first method is integrating LM Studio server with Jan UI. The second method is migrating your downloaded model from LM Studio to Jan. We will use the [Phi 2 - GGUF](https://huggingface.co/TheBloke/phi-2-GGUF) model on Hugging Face as an example. + +## Steps to Integrate LM Studio Server with Jan UI + +### 1. Start the LM Studio Server + +1. Navigate to the `Local Inference Server` on the LM Studio application. +2. Select the model you want to use. +3. Start the server after configuring the server port and options. + +![LM Studio Server](assets/05-setting-lmstudio-server.gif) + +

+ +Modify the `openai.json` file in the `~/jan/engines` folder to include the full URL of the LM Studio server. + +```json title="~/jan/engines/openai.json" +{ + "full_url": "http://localhost:/v1/chat/completions" +} +``` + +:::tip + +- Replace `` with the port number you set in the LM Studio server. The default port is `1234`. + +::: + +### 2. Modify a Model JSON + +Navigate to the `~/jan/models` folder. Create a folder named ``, for example, `lmstudio-phi-2` and create a `model.json` file inside the folder including the following configurations: + +- Set the `format` property to `api`. +- Set the `engine` property to `openai`. +- Set the `state` property to `ready`. + +```json title="~/jan/models/lmstudio-phi-2/model.json" +{ + "sources": [ + { + "filename": "phi-2-GGUF", + "url": "https://huggingface.co/TheBloke/phi-2-GGUF" + } + ], + "id": "lmstudio-phi-2", + "object": "model", + "name": "LM Studio - Phi 2 - GGUF", + "version": "1.0", + "description": "TheBloke/phi-2-GGUF", + // highlight-next-line + "format": "api", + "settings": {}, + "parameters": {}, + "metadata": { + "author": "Microsoft", + "tags": ["General", "Big Context Length"] + }, + // highlight-start + "engine": "openai" + // highlight-end +} +``` + +### 3. Start the Model + +1. Restart Jan and navigate to the **Hub**. +2. Locate your model and click the **Use** button. + +![LM Studio Model](assets/05-lmstudio-run.png) + +### 4. Try Out the Integration of Jan and LM Studio + +![LM Studio Integration Demo](assets/05-lmstudio-integration-demo.gif) + +## Steps to Migrate Your Downloaded Model from LM Studio to Jan (version 0.4.6 and older) + +### 1. Migrate Your Downloaded Model + +1. Navigate to `My Models` in the LM Studio application and reveal the model folder. + +![Reveal-model-folder-lmstudio](assets/05-reveal-model-folder-lmstudio.gif) + +2. Copy the model folder that you want to migrate to `~/jan/models` folder. + +3. 
Ensure the folder name is the same as the model name of the `.gguf` filename by changing the folder name if necessary. For example, in this case, we changed the folder name from `TheBloke` to `phi-2.Q4_K_S`. + +### 2. Start the Model + +1. Restart Jan and navigate to the **Hub**. Jan will automatically detect the model and display it in the **Hub**. +2. Locate your model and click the **Use** button to try the migrated model. + +![Demo](assets/05-demo-migrating-model.gif) + +## Steps to Point to the Downloaded Model of LM Studio from Jan (version 0.4.7+) + +Starting from version 0.4.7, Jan supports importing models using an absolute filepath, so you can directly use the model from the LM Studio folder. + +### 1. Reveal the Model Absolute Path + +Navigate to `My Models` in the LM Studio application and reveal the model folder. Then, you can get the absolute path of your model. + +![Reveal-model-folder-lmstudio](assets/05-reveal-model-folder-lmstudio.gif) + +### 2. Modify a Model JSON + +Navigate to the `~/jan/models` folder. Create a folder named `<modelname>`, for example, `phi-2.Q4_K_S` and create a `model.json` file inside the folder including the following configurations: + +- Ensure the `id` property matches the folder name you created. +- Ensure the `url` property is the direct binary download link ending in `.gguf`. Now, you can use the absolute filepath of the model file. In this example, the absolute filepath is `/Users/<username>/.cache/lm-studio/models/TheBloke/phi-2-GGUF/phi-2.Q4_K_S.gguf`. +- Ensure the `engine` property is set to `nitro`. 
+ +```json +{ + "object": "model", + "version": 1, + "format": "gguf", + "sources": [ + { + "filename": "phi-2.Q4_K_S.gguf", + "url": "" + } + ], + "id": "phi-2.Q4_K_S", + "name": "phi-2.Q4_K_S", + "created": 1708308111506, + "description": "phi-2.Q4_K_S - user self import model", + "settings": { + "ctx_len": 4096, + "embedding": false, + "prompt_template": "{system_message}\n### Instruction: {prompt}\n### Response:", + "llama_model_path": "phi-2.Q4_K_S.gguf" + }, + "parameters": { + "temperature": 0.7, + "top_p": 0.95, + "stream": true, + "max_tokens": 2048, + "stop": [""], + "frequency_penalty": 0, + "presence_penalty": 0 + }, + "metadata": { + "size": 1615568736, + "author": "User", + "tags": [] + }, + "engine": "nitro" +} +``` + +:::warning + +- If you are using Windows, you need to use double backslashes in the url property, for example: `C:\\Users\\username\\filename.gguf`. + +::: + + +### 3. Start the Model + +1. Restart Jan and navigate to the **Hub**. +2. Jan will automatically detect the model and display it in the **Hub**. +3. Locate your model and click the **Use** button to try the migrating model. + +![Demo](assets/05-demo-pointing-model.gif) diff --git a/docs/docs/guides/07-integrations/06-integrate-ollama.mdx b/docs/docs/guides/07-integrations/06-integrate-ollama.mdx new file mode 100644 index 000000000..e55c3e49f --- /dev/null +++ b/docs/docs/guides/07-integrations/06-integrate-ollama.mdx @@ -0,0 +1,90 @@ +--- +title: Integrate Ollama with Jan +slug: /guides/integrations/ollama +description: Guide to integrate Ollama with Jan +keywords: + [ + Jan AI, + Jan, + ChatGPT alternative, + local AI, + private AI, + conversational AI, + no-subscription fee, + large language model, + Ollama integration, + ] +--- + +## Quick Introduction + +With [Ollama](https://ollama.com/), you can run large language models locally. In this guide, we will show you how to integrate and use your current models on Ollama with Jan using 2 methods. 
The first method is integrating Ollama server with Jan UI. The second method is migrating your downloaded model from Ollama to Jan. We will use the [llama2](https://ollama.com/library/llama2) model as an example. + +## Steps to Integrate Ollama Server with Jan UI + +### 1. Start the Ollama Server + +1. Select the model you want to use from the [Ollama library](https://ollama.com/library). +2. Run your model by using the following command: + +```bash +ollama run +``` + +3. According to the [Ollama documentation on OpenAI compatibility](https://github.com/ollama/ollama/blob/main/docs/openai.md), you can use the `http://localhost:11434/v1/chat/completions` endpoint to interact with the Ollama server. Thus, modify the `openai.json` file in the `~/jan/engines` folder to include the full URL of the Ollama server. + +```json title="~/jan/engines/openai.json" +{ + "full_url": "http://localhost:11434/v1/chat/completions" +} +``` + +### 2. Modify a Model JSON + +1. Navigate to the `~/jan/models` folder. +2. Create a folder named ``, for example, `lmstudio-phi-2`. +3. Create a `model.json` file inside the folder including the following configurations: + +- Set the `id` property to the model name as Ollama model name. +- Set the `format` property to `api`. +- Set the `engine` property to `openai`. +- Set the `state` property to `ready`. + +```json title="~/jan/models/llama2/model.json" +{ + "sources": [ + { + "filename": "llama2", + "url": "https://ollama.com/library/llama2" + } + ], + // highlight-next-line + "id": "llama2", + "object": "model", + "name": "Ollama - Llama2", + "version": "1.0", + "description": "Llama 2 is a collection of foundation language models ranging from 7B to 70B parameters.", + // highlight-next-line + "format": "api", + "settings": {}, + "parameters": {}, + "metadata": { + "author": "Meta", + "tags": ["General", "Big Context Length"] + }, + // highlight-next-line + "engine": "openai" +} +``` + +### 3. Start the Model + +1. 
Restart Jan and navigate to the **Hub**. +2. Locate your model and click the **Use** button. + +![Ollama Model](assets/06-ollama-run.png) + +### 4. Try Out the Integration of Jan and Ollama + +![Ollama Integration Demo](assets/06-ollama-integration-demo.gif) + diff --git a/docs/docs/guides/07-integrations/assets/04-mistral-ai-integration-demo.gif b/docs/docs/guides/07-integrations/assets/04-mistral-ai-integration-demo.gif new file mode 100644 index 000000000..015167e2a Binary files /dev/null and b/docs/docs/guides/07-integrations/assets/04-mistral-ai-integration-demo.gif differ diff --git a/docs/docs/guides/07-integrations/assets/04-mistral-ai-tiny-hub.png b/docs/docs/guides/07-integrations/assets/04-mistral-ai-tiny-hub.png new file mode 100644 index 000000000..1ae377d70 Binary files /dev/null and b/docs/docs/guides/07-integrations/assets/04-mistral-ai-tiny-hub.png differ diff --git a/docs/docs/guides/07-integrations/assets/05-demo-migrating-model.gif b/docs/docs/guides/07-integrations/assets/05-demo-migrating-model.gif new file mode 100644 index 000000000..985755e47 Binary files /dev/null and b/docs/docs/guides/07-integrations/assets/05-demo-migrating-model.gif differ diff --git a/docs/docs/guides/07-integrations/assets/05-demo-pointing-model.gif b/docs/docs/guides/07-integrations/assets/05-demo-pointing-model.gif new file mode 100644 index 000000000..137fb955a Binary files /dev/null and b/docs/docs/guides/07-integrations/assets/05-demo-pointing-model.gif differ diff --git a/docs/docs/guides/07-integrations/assets/05-lmstudio-integration-demo.gif b/docs/docs/guides/07-integrations/assets/05-lmstudio-integration-demo.gif new file mode 100644 index 000000000..445ea3416 Binary files /dev/null and b/docs/docs/guides/07-integrations/assets/05-lmstudio-integration-demo.gif differ diff --git a/docs/docs/guides/07-integrations/assets/05-lmstudio-run.png b/docs/docs/guides/07-integrations/assets/05-lmstudio-run.png new file mode 100644 index 000000000..721581f72 Binary 
files /dev/null and b/docs/docs/guides/07-integrations/assets/05-lmstudio-run.png differ diff --git a/docs/docs/guides/07-integrations/assets/05-reveal-model-folder-lmstudio.gif b/docs/docs/guides/07-integrations/assets/05-reveal-model-folder-lmstudio.gif new file mode 100644 index 000000000..4c1ee85fc Binary files /dev/null and b/docs/docs/guides/07-integrations/assets/05-reveal-model-folder-lmstudio.gif differ diff --git a/docs/docs/guides/07-integrations/assets/05-setting-lmstudio-server.gif b/docs/docs/guides/07-integrations/assets/05-setting-lmstudio-server.gif new file mode 100644 index 000000000..63084be01 Binary files /dev/null and b/docs/docs/guides/07-integrations/assets/05-setting-lmstudio-server.gif differ diff --git a/docs/docs/guides/07-integrations/assets/06-ollama-integration-demo.gif b/docs/docs/guides/07-integrations/assets/06-ollama-integration-demo.gif new file mode 100644 index 000000000..708f2058a Binary files /dev/null and b/docs/docs/guides/07-integrations/assets/06-ollama-integration-demo.gif differ diff --git a/docs/docs/guides/07-integrations/assets/06-ollama-run.png b/docs/docs/guides/07-integrations/assets/06-ollama-run.png new file mode 100644 index 000000000..7f18e1b15 Binary files /dev/null and b/docs/docs/guides/07-integrations/assets/06-ollama-run.png differ diff --git a/docs/docs/guides/08-troubleshooting/03-gpu-not-used.mdx b/docs/docs/guides/08-troubleshooting/03-gpu-not-used.mdx index d35993ab6..53638027b 100644 --- a/docs/docs/guides/08-troubleshooting/03-gpu-not-used.mdx +++ b/docs/docs/guides/08-troubleshooting/03-gpu-not-used.mdx @@ -188,4 +188,6 @@ Troubleshooting tips: 2. If the issue persists, ensure your (V)RAM is accessible by the application. Some folks have virtual RAM and need additional configuration. -3. Get help in [Jan Discord](https://discord.gg/mY69SZaMaC). +3. If you are facing installation issues with RTX cards, please update to an NVIDIA driver that supports CUDA 11.7 or higher. 
Ensure that the CUDA path is added to the environment variable. + +4. Get help in [Jan Discord](https://discord.gg/mY69SZaMaC). diff --git a/docs/docs/guides/09-advanced-settings/01-https-proxy.mdx b/docs/docs/guides/09-advanced-settings/01-https-proxy.mdx new file mode 100644 index 000000000..35f4c30f9 --- /dev/null +++ b/docs/docs/guides/09-advanced-settings/01-https-proxy.mdx @@ -0,0 +1,101 @@ +--- +title: HTTPS Proxy +slug: /guides/advanced-settings/https-proxy +description: Jan is a ChatGPT-alternative that runs on your own computer, with a local API server. +keywords: + [ + Jan AI, + Jan, + ChatGPT alternative, + local AI, + private AI, + conversational AI, + no-subscription fee, + large language model, + advanced-settings, + https-proxy, + ] +--- + +In this guide, we will show you how to set up your own HTTPS proxy server and configure Jan to use it. + +## Why HTTPS Proxy? +An HTTPS proxy helps you to maintain your privacy and security while still being able to browse the internet while circumventing geographical restrictions. + +## Setting Up Your Own HTTPS Proxy Server +In this section, we will show you a high-level overview of how to set up your own HTTPS proxy server. This guide focuses on using Squid as a popular and open-source proxy server software, but there are other software options you might consider based on your needs and preferences. + +### Step 1: Choosing a Server +Firstly, you need to choose a server to host your proxy server. We recommend using a cloud provider like Amazon AWS, Google Cloud, Microsoft Azure, Digital Ocean, etc. Ensure that your server has a public IP address and is accessible from the internet. + +### Step 2: Installing Squid +```bash +sudo apt-get update +sudo apt-get install squid +``` + +### Step 3: Configure Squid for HTTPS + +To enable HTTPS, you will need to configure Squid with SSL support. + +- Generate SSL certificate + +Squid requires an SSL certificate to be able to handle HTTPS traffic. 
You can generate a self-signed certificate or obtain one from a Certificate Authority (CA). For a self-signed certificate, you can use OpenSSL: + +```bash +openssl req -new -newkey rsa:2048 -days 365 -nodes -x509 -keyout squid-proxy.pem -out squid-proxy.pem +``` + +- Configure Squid to use the SSL certificate: Edit the Squid configuration file `/etc/squid/squid.conf` to include the path to your SSL certificate and enable the HTTPS port: + +```bash +http_port 3128 ssl-bump cert=/path/to/your/squid-proxy.pem +ssl_bump server-first all +ssl_bump bump all +``` + +- Enable SSL Bumping: To intercept HTTPS traffic, Squid uses a process called SSL Bumping. This process allows Squid to decrypt and re-encrypt HTTPS traffic. To enable SSL Bumping, ensure the `ssl_bump` directives are configured correctly in your `squid.conf` file. + +### Step 4 (Optional): Configure ACLs and Authentication + +- Access Control Lists (ACLs): You can define rules to control who can access your proxy. This is done by editing the squid.conf file and defining ACLs: + +```bash +acl allowed_ips src "/etc/squid/allowed_ips.txt" +http_access allow allowed_ips +``` + +- Authentication: If you want to add an authentication layer, Squid supports several authentication schemes. Basic authentication setup might look like this: + +```bash +auth_param basic program /usr/lib/squid/basic_ncsa_auth /etc/squid/passwords +acl authenticated proxy_auth REQUIRED +http_access allow authenticated +``` + +### Step 5: Restart and Test Your Proxy + +After configuring, restart Squid to apply the changes: + +```bash +sudo systemctl restart squid +``` + +To test, configure your browser or another client to use the proxy server with its IP address and port (default is 3128). Check if you can access the internet through your proxy. + +:::tip + +Tips for Secure Your Proxy: +- Firewall rules: Ensure that only intended users or IP addresses can connect to your proxy server. 
This can be achieved by setting up appropriate firewall rules. +- Regular updates: Keep your server and proxy software updated to ensure that you are protected against known vulnerabilities. +- Monitoring and logging: Monitor your proxy server for unusual activity and enable logging to keep track of the traffic passing through your proxy. + +::: + +## Setting Up Jan to Use Your HTTPS Proxy + +Once you have your HTTPS proxy server set up, you can configure Jan to use it. Navigate to `Settings` > `Advanced Settings` and specify the HTTPS proxy (proxy auto-configuration and SOCKS not supported). + +You can turn on the feature `Ignore SSL Certificates` if you are using a self-signed certificate. This feature allows self-signed or unverified certificates. + +![01-https-proxy-jan-configure](./assets/01-https-proxy-jan-configure.png) \ No newline at end of file diff --git a/docs/docs/guides/09-advanced-settings/README.mdx b/docs/docs/guides/09-advanced-settings/README.mdx new file mode 100644 index 000000000..ba3da9bb1 --- /dev/null +++ b/docs/docs/guides/09-advanced-settings/README.mdx @@ -0,0 +1,65 @@ +--- +title: Advanced Settings +slug: /guides/advanced-settings/ +description: Jan is a ChatGPT-alternative that runs on your own computer, with a local API server. +keywords: + [ + Jan AI, + Jan, + ChatGPT alternative, + local AI, + private AI, + conversational AI, + no-subscription fee, + large language model, + advanced-settings, + ] +--- + +This guide will show you how to use the advanced settings in Jan. + +## Keyboard Shortcuts + +Keyboard shortcuts are a great way to speed up your workflow. Here are some of the keyboard shortcuts that you can use in Jan. 
+ +| Combination | Description | +| --------------- | -------------------------------------------------- | +| `⌘ E` | Show list your models | +| `⌘ K` | Show list navigation pages | +| `⌘ B` | Toggle collapsible left panel | +| `⌘ ,` | Navigate to setting page | +| `Enter` | Send a message | +| `Shift + Enter` | Insert new line in input box | +| `Arrow Up` | Navigate to previous option (within search dialog) | +| `Arrow Down` | Navigate to next option (within search dialog) | + +

+ +:::note +`⌘` is the command key on macOS, and `Ctrl` on Windows. +::: + +## Experimental Mode + +Experimental mode allows you to enable experimental features that may be unstable or not fully tested. + +## Jan Data Folder + +The Jan data folder is the location where messages, model configurations, and other user data are placed. You can change the location of the data folder to a different location. + +![00-changing-folder](./assets/00-changing-folder.gif) + +## HTTPS Proxy & Ignore SSL Certificate + +HTTPS Proxy allows you to use a proxy server to connect to the internet. You can also ignore SSL certificates if you are using a self-signed certificate. +Please check out the guide on [how to set up your own HTTPS proxy server and configure Jan to use it](../advanced-settings/https-proxy) for more information. + +## Clear Logs + +Clear logs will remove all logs from the Jan application. + +## Reset To Factory Default + +Reset the application to its original state, deleting all your usage data, including model customizations and conversation history. This action is irreversible and recommended only if the application is in a corrupted state. 
+ +![00-reset-factory-settings](./assets/00-reset-factory-settings.gif) diff --git a/docs/docs/guides/09-advanced-settings/assets/00-changing-folder.gif b/docs/docs/guides/09-advanced-settings/assets/00-changing-folder.gif new file mode 100644 index 000000000..ac280a5c3 Binary files /dev/null and b/docs/docs/guides/09-advanced-settings/assets/00-changing-folder.gif differ diff --git a/docs/docs/guides/09-advanced-settings/assets/00-reset-factory-settings.gif b/docs/docs/guides/09-advanced-settings/assets/00-reset-factory-settings.gif new file mode 100644 index 000000000..81760848d Binary files /dev/null and b/docs/docs/guides/09-advanced-settings/assets/00-reset-factory-settings.gif differ diff --git a/docs/docs/guides/09-advanced-settings/assets/01-https-proxy-jan-configure.png b/docs/docs/guides/09-advanced-settings/assets/01-https-proxy-jan-configure.png new file mode 100644 index 000000000..25e0f7660 Binary files /dev/null and b/docs/docs/guides/09-advanced-settings/assets/01-https-proxy-jan-configure.png differ diff --git a/docs/docs/how-we-work.md b/docs/docs/how-we-work.md new file mode 100644 index 000000000..e81099d18 --- /dev/null +++ b/docs/docs/how-we-work.md @@ -0,0 +1,23 @@ +--- +title: How We Work +--- + +### Open Source + +Jan is a startup with an open source business model. We believe in the need for an open source AI ecosystem, and are committed to building it. + +- [Jan Framework](https://github.com/janhq/jan) (AGPLv3) +- [Jan Desktop Client & Local server](https://jan.ai) (AGPLv3, built on Jan Framework) +- [Nitro: run Local AI](https://github.com/janhq/nitro) (AGPLv3) + +### Build in Public + +We use GitHub to build in public and welcome anyone to join in. + +- [Jan's Kanban](https://github.com/orgs/janhq/projects/5) +- [Jan's Roadmap](https://github.com/orgs/janhq/projects/5/views/29) +- `coming soon` [Jan's Newsletter](https://newsletter.jan.ai) + +### Remote Team + +Jan has a fully-remote team. We are mainly based in the APAC timezone. 
We use [Discord](https://discord.gg/af6SaTdzpx) and [Github](https://github.com/janhq) to work. diff --git a/docs/docs/how-we-work/analytics/analytics.md b/docs/docs/how-we-work/analytics/analytics.md new file mode 100644 index 000000000..79e107a83 --- /dev/null +++ b/docs/docs/how-we-work/analytics/analytics.md @@ -0,0 +1,12 @@ +--- +title: Analytics +--- + +Adhering to Jan's privacy preserving philosophy, our analytics philosophy is to get "barely-enough-to-function". + +#### What is tracked + +1. By default, Github tracks downloads and device metadata for all public GitHub repositories. This helps us troubleshoot & ensure cross-platform support. +2. We use [Umami](https://umami.is/) to collect, analyze, and understand application data while maintaining visitor privacy and data ownership. We are using the Umami Cloud in Europe to ensure GDPR compliance. Please see [Umami Privacy Policy](https://umami.is/privacy) for more details. +3. We use Umami to track a single `app.opened` event without additional user metadata, in order to understand retention. In addition, we track `app.version` to understand app version usage. +4. Additionally, we plan to enable a `Settings` feature for users to turn off all tracking. 
diff --git a/docs/docs/about/03-engineering/assets/01-get-help.png b/docs/docs/how-we-work/engineering/assets/01-get-help.png similarity index 100% rename from docs/docs/about/03-engineering/assets/01-get-help.png rename to docs/docs/how-we-work/engineering/assets/01-get-help.png diff --git a/docs/docs/about/03-engineering/01-ci-cd.md b/docs/docs/how-we-work/engineering/ci-cd.md similarity index 100% rename from docs/docs/about/03-engineering/01-ci-cd.md rename to docs/docs/how-we-work/engineering/ci-cd.md diff --git a/docs/docs/about/03-engineering/README.md b/docs/docs/how-we-work/engineering/engineering.md similarity index 100% rename from docs/docs/about/03-engineering/README.md rename to docs/docs/how-we-work/engineering/engineering.md diff --git a/docs/docs/about/03-engineering/02-qa.mdx b/docs/docs/how-we-work/engineering/qa.mdx similarity index 100% rename from docs/docs/about/03-engineering/02-qa.mdx rename to docs/docs/how-we-work/engineering/qa.mdx diff --git a/docs/docs/how-we-work/product-design/product-design.md b/docs/docs/how-we-work/product-design/product-design.md new file mode 100644 index 000000000..a2016b6b8 --- /dev/null +++ b/docs/docs/how-we-work/product-design/product-design.md @@ -0,0 +1,11 @@ +--- +title: Product & Design +--- + +## Roadmap + +- Conversations over Tickets + - Discord's #roadmap channel + - Work with the community to turn conversations into Product Specs +- Future System? + - Use Canny? 
\ No newline at end of file diff --git a/docs/docs/about/04-product/01-management.md b/docs/docs/how-we-work/project-management/project-management.md similarity index 90% rename from docs/docs/about/04-product/01-management.md rename to docs/docs/how-we-work/project-management/project-management.md index c231801c0..58af4a0d3 100644 --- a/docs/docs/about/04-product/01-management.md +++ b/docs/docs/how-we-work/project-management/project-management.md @@ -1,6 +1,5 @@ --- title: Project Management -slug: /product/management --- We use the [Jan Monorepo Project](https://github.com/orgs/janhq/projects/5) in Github to manage our roadmap and sprint Kanbans. @@ -58,3 +57,10 @@ We aim to always sprint on `tasks` that are a part of the [current roadmap](http - `Urgent bugs`: assign to an owner (or @engineers if you are not sure) && tag the current `sprint` & `milestone` - `All else`: assign the correct roadmap `label(s)` and owner (if any) + + +#### Request for help + +As a result, our feature prioritization can feel a bit black box at times. + +We'd appreciate high quality insights and volunteers for user interviews through [Discord](https://discord.gg/af6SaTdzpx) and [Github](https://github.com/janhq). diff --git a/docs/docs/how-we-work/strategy/strategy.md b/docs/docs/how-we-work/strategy/strategy.md new file mode 100644 index 000000000..09d9b9fb4 --- /dev/null +++ b/docs/docs/how-we-work/strategy/strategy.md @@ -0,0 +1,53 @@ +--- +title: Strategy +--- + +We only have 2 planning parameters: +- 10 year vision +- 2 week sprint +- Quarterly OKRs + +### Ideal Customer + +Our ideal customer is an AI enthusiast or business who has experienced some limitations with current AI solutions and is keen to find open source alternatives. + +### Problems + +Our ideal customer would use Jan to solve one of these problems. + +_Control_ + +- Control (e.g. preventing vendor lock-in) +- Stability (e.g. runs predictably every time) +- Local-use (e.g. 
for speed, or for airgapped environments) + +_Privacy_ + +- Data protection (e.g. personal data or company data) +- Privacy (e.g. nsfw) + +_Customisability_ + +- Tinkerability (e.g. ability to change model, experiment) +- Niche Models (e.g. fine-tuned, domain-specific models that outperform OpenAI) + +Sources: [^1] [^2] [^3] [^4] + +[^1]: [What are you guys doing that can't be done with ChatGPT?](https://www.reddit.com/r/LocalLLaMA/comments/17mghqr/comment/k7ksti6/?utm_source=share&utm_medium=web2x&context=3) +[^2]: [What's your main interest in running a local LLM instead of an existing API?](https://www.reddit.com/r/LocalLLaMA/comments/1718a9o/whats_your_main_interest_in_running_a_local_llm/) +[^3]: [Ask HN: What's the best self-hosted/local alternative to GPT-4?](https://news.ycombinator.com/item?id=36138224) +[^4]: [LoRAs](https://www.reddit.com/r/LocalLLaMA/comments/17mghqr/comment/k7mdz1i/?utm_source=share&utm_medium=web2x&context=3) + +### Solution + +Jan is a seamless user experience that runs on your personal computer, that glues the different pieces of the open source AI ecosystem to provide an alternative to OpenAI's closed platform. + +- We build a comprehensive, seamless platform that takes care of the technical chores across the stack required to run open source AI +- We run on top of a local folder of non-proprietary files, that anyone can tinker with (yes, even other apps!) 
+- We provide open formats for packaging and distributing AI to run reproducibly across devices + + +## Prerequisites + +- [Figma](https://figma.com) +- [ScreenStudio](https://www.screen.studio/) diff --git a/docs/docs/how-we-work/website-docs/website-docs.md b/docs/docs/how-we-work/website-docs/website-docs.md new file mode 100644 index 000000000..a152c6dc9 --- /dev/null +++ b/docs/docs/how-we-work/website-docs/website-docs.md @@ -0,0 +1,3 @@ +--- +title: Website & Docs +--- \ No newline at end of file diff --git a/docs/docs/integrations.md b/docs/docs/integrations.md new file mode 100644 index 000000000..0884d2242 --- /dev/null +++ b/docs/docs/integrations.md @@ -0,0 +1,3 @@ +--- +title: Integrations +--- \ No newline at end of file diff --git a/docs/docs/docs/02-integrations/langchain.md b/docs/docs/integrations/langchain.md similarity index 100% rename from docs/docs/docs/02-integrations/langchain.md rename to docs/docs/integrations/langchain.md diff --git a/docs/docs/docs/02-integrations/llamacpp.md b/docs/docs/integrations/llamacpp.md similarity index 94% rename from docs/docs/docs/02-integrations/llamacpp.md rename to docs/docs/integrations/llamacpp.md index 9d5004982..2764187c1 100644 --- a/docs/docs/docs/02-integrations/llamacpp.md +++ b/docs/docs/integrations/llamacpp.md @@ -1,5 +1,5 @@ --- -title: LlamaCPP +title: llama.cpp --- ## Quicklinks diff --git a/docs/docs/docs/02-integrations/ollama.md b/docs/docs/integrations/ollama.md similarity index 100% rename from docs/docs/docs/02-integrations/ollama.md rename to docs/docs/integrations/ollama.md diff --git a/docs/docs/docs/02-integrations/openai.md b/docs/docs/integrations/openai.md similarity index 100% rename from docs/docs/docs/02-integrations/openai.md rename to docs/docs/integrations/openai.md diff --git a/docs/docs/docs/02-integrations/openrouter.md b/docs/docs/integrations/openrouter.md similarity index 100% rename from docs/docs/docs/02-integrations/openrouter.md rename to 
docs/docs/integrations/openrouter.md diff --git a/docs/docs/docs/02-integrations/tensorrt.md b/docs/docs/integrations/tensorrt.md similarity index 100% rename from docs/docs/docs/02-integrations/tensorrt.md rename to docs/docs/integrations/tensorrt.md diff --git a/docs/docs/partners/become-a-partner.md b/docs/docs/partners/become-a-partner.md new file mode 100644 index 000000000..dce93e87a --- /dev/null +++ b/docs/docs/partners/become-a-partner.md @@ -0,0 +1,3 @@ +--- +title: Become a Partner +--- \ No newline at end of file diff --git a/docs/docs/partners/partners.md b/docs/docs/partners/partners.md new file mode 100644 index 000000000..1c5eaa0f2 --- /dev/null +++ b/docs/docs/partners/partners.md @@ -0,0 +1,3 @@ +--- +title: Partners +--- \ No newline at end of file diff --git a/docs/docs/platforms/desktop.md b/docs/docs/platforms/desktop.md new file mode 100644 index 000000000..fb4ea8389 --- /dev/null +++ b/docs/docs/platforms/desktop.md @@ -0,0 +1,84 @@ +--- +title: Jan Desktop +slug: /desktop +description: Turn your computer into an AI PC +keywords: + [ + Jan AI, + Jan, + ChatGPT alternative, + local AI, + private AI, + conversational AI, + no-subscription fee, + large language model, + ] +--- + +# Turn any computer into an AI computer + +![Alt text](image.png) + + + +### Designed for Everyone + +- **Installs with 1 click.** Jan is easy to use, beautiful, and the core features are free forever. +- **Runs on consumer laptops.** Tested by 250k+ users across `Windows, Mac, and Linux`, Jan even works on `CPU-only mode`. +- **Automatic GPU acceleration**. Models responds faster across `NVIDIA, AMD, Apple, and Intel` when benchmarked against industry alternatives. + +:::tip + +“Normies” can run LLMs like an AI engineer on the Desktop App - no programming experience needed. + +::: + +### Private & Offline + +- **Runs 100% locally**. AI models run directly on your laptop without an internet connection. `You own your AI`. 
+- **Private conversations.** Data is saved on your own filesystem in a transparent non-proprietary data format. `You own your data.` +- **Open source security**. Jan is open source, so you can scrutinize every line in our codebase. So when we say your data is not our product, we mean it. See [the code](https://github.com/janhq/jan) and our [data policy](/how-we-work/analytics). + +### Customizable AI + +- **Use AI without limitations.** Take control of censorship levels. Jan is usable from the classroom to the boardroom (and few other rooms if that’s your jam). +- **Use any models**. Download open source models from HuggingFace or upload your own custom models. [link] + +:::tip + +Download Jan Desktop Client [here](https://github.com/janhq/jan?tab=readme-ov-file#download). + +::: + +## Jan Desktop is + +### For Developers + +**You can easily integrate a locally running LLM into your own projects.** + +- Turn on `Local API Server` mode to start building on an `OpenAI compatible API`. +- Jan Desktop comes with a Developer Console out of the box. +- The UI makes it easy to see logs, configure models and more. + +![Alt text](image-1.png) + + + +### For Your Home Server + + + +- Use Jan as a UI only, pointing to a different backend. [See Docs](/guides/using-models/integrate-with-remote-server) +- Use Jan as a backend only, pointing to a different frontend. [See Docs](/guides/using-models/integrate-with-remote-server) +- Run Jan in team-mode on production-grade GPUs. [See Server Suite](/server-suite) + + + +### For People who Tinker + +- Customize the app’s look and feel through Themes. +- Customize assistants, models and other features with **no code**. +- Customize the entire Application through Extensions. Inspired by VSCode extensions, the desktop app can be entirely customized. + +[See the default extensions](https://github.com/janhq/jan/tree/main/extensions) bundled with every Desktop install. 
+![Alt text](image-4.png) diff --git a/docs/docs/platforms/hub.md b/docs/docs/platforms/hub.md new file mode 100644 index 000000000..9d8167618 --- /dev/null +++ b/docs/docs/platforms/hub.md @@ -0,0 +1,3 @@ +--- +title: Jan Hub +--- \ No newline at end of file diff --git a/docs/docs/platforms/image-1.png b/docs/docs/platforms/image-1.png new file mode 100644 index 000000000..cd94f34e9 Binary files /dev/null and b/docs/docs/platforms/image-1.png differ diff --git a/docs/docs/platforms/image-2.png b/docs/docs/platforms/image-2.png new file mode 100644 index 000000000..cc75d39ce Binary files /dev/null and b/docs/docs/platforms/image-2.png differ diff --git a/docs/docs/platforms/image-3.png b/docs/docs/platforms/image-3.png new file mode 100644 index 000000000..20828beb9 Binary files /dev/null and b/docs/docs/platforms/image-3.png differ diff --git a/docs/docs/platforms/image-4.png b/docs/docs/platforms/image-4.png new file mode 100644 index 000000000..38b75c1da Binary files /dev/null and b/docs/docs/platforms/image-4.png differ diff --git a/docs/docs/platforms/image.png b/docs/docs/platforms/image.png new file mode 100644 index 000000000..0237898c7 Binary files /dev/null and b/docs/docs/platforms/image.png differ diff --git a/docs/docs/platforms/mobile.md b/docs/docs/platforms/mobile.md new file mode 100644 index 000000000..827544201 --- /dev/null +++ b/docs/docs/platforms/mobile.md @@ -0,0 +1,16 @@ +--- +title: Jan Mobile +slug: /mobile +description: Jan Mobile allows you to bring your AI on the go +keywords: + [ + Jan AI, + Jan, + ChatGPT alternative, + local AI, + private AI, + conversational AI, + no-subscription fee, + large language model, + ] +--- \ No newline at end of file diff --git a/docs/docs/pricing/pricing.md b/docs/docs/pricing/pricing.md new file mode 100644 index 000000000..233610468 --- /dev/null +++ b/docs/docs/pricing/pricing.md @@ -0,0 +1,10 @@ +--- +title: Pricing +slug: /pricing +--- + +| $0 | $1 | Enterprise | +| ---------------- | 
---------------- | ----------------------- | +| Free | Premium | TBA | +| ✅ Core features | ✅ Discord badge | ✅ Enterprise-level SLA | +| ✅ free forever | | | diff --git a/docs/docs/server-suite/admin-console.md b/docs/docs/server-suite/admin-console.md new file mode 100644 index 000000000..e2da5c096 --- /dev/null +++ b/docs/docs/server-suite/admin-console.md @@ -0,0 +1,3 @@ +--- +title: Admin Console +--- \ No newline at end of file diff --git a/docs/docs/server-suite/audit-compliance.md b/docs/docs/server-suite/audit-compliance.md new file mode 100644 index 000000000..af4684899 --- /dev/null +++ b/docs/docs/server-suite/audit-compliance.md @@ -0,0 +1,3 @@ +--- +title: Audit & Compliance +--- \ No newline at end of file diff --git a/docs/docs/server-suite/enterprise.md b/docs/docs/server-suite/enterprise.md new file mode 100644 index 000000000..565c14fde --- /dev/null +++ b/docs/docs/server-suite/enterprise.md @@ -0,0 +1,100 @@ +--- +title: Jan Enterprise +slug: /enterprise +description: Built for Enterprise Deployments +keywords: + [ + Jan AI, + Jan, + ChatGPT alternative, + local AI, + private AI, + conversational AI, + no-subscription fee, + large language model, + ] +--- + +# Customize and run AI across your organization + +Jan can professional backend to create, customize and run AIs at scale, for production-grade data centers. + +:::warning + +The server suite is actively under development and lacking documentation. +You can find the source code [here](https://github.com/janhq/jan/tree/dev/server) and [here](https://github.com/janhq/jan/blob/dev/docker-compose.yml). + +It is free to use. Your feedback is appreciated 🙏. + +::: + +## Own your AI. Own your data. Own your IP. + +Over time, we expect more teams and organizations to turn to running their own AIs on-prem. 
+ +**Why?** + +- Prevent shadow data +- Avoid vendor lock-in +- Keep your IP in house +- Uptime and support predictability +- Eliminate monthly API bills - use your existing hardware +- Full control over your AI - you can open it up and see what's going on + +## Why Jan Enterprise + +### Fast deployment + +- **1 click deployment**. Immediately serve, customize, and scale models and assistants across your org. Scale your AI team so they can focus on the IP instead of fixing plumbing across every computer. +- **Scale across infrastructures**: on premise, with cloud providers, or as a hybrid deployment. Run Jan in completely air-gapped environments. +- **Optimized for datacenter-grade GPUs**: Can run on Nvidia, AMD Hardware, or even normal CPUs. Use TensorRT-LLM for more speedups on A6000s and above. + +### Full customization + +- Runs custom models or popular LLMs like Llama2, Mistral at production scale +- API that is fully OpenAI-compatible, i.e. can be a drop-in migration +- Powerful Agent framework to customize LLMs using RAG or Enterprise Data integrations. + +:::tip + +Not a Jan fan but convinced about local AI? No worries, here's a list of [awesome local ai](https://github.com/janhq/awesome-local-ai) alternatives that you can use in your team. + +::: + +## Supported Extensions + +The SDK and current implementation accommodate the following potential extensions. + +### Admin console + +Integrate SAML, OAUTH, OIDC + + + +### Identity access management + +Grant roles, groups and general ACL + + + +### Audit compliance + +Plug in Guardrails, LLMGuard, your custom rules engine and more + + + +### Observability + +Plug in Langfuse, Langsmith, Openllmetry and more + + + +## Enterprise support SLA + +Our core team and AI solutions partners are here to help. 
+ +Email us at: `inquiries@jan.ai` for: + +- Priority case routing +- Proactive case monitoring +- 24-hour support response diff --git a/docs/docs/server-suite/home-server.md b/docs/docs/server-suite/home-server.md new file mode 100644 index 000000000..97f3afbc7 --- /dev/null +++ b/docs/docs/server-suite/home-server.md @@ -0,0 +1,50 @@ +--- +title: Jan Home Server +slug: /home-server +description: Built for Home Servers +keywords: + [ + Jan AI, + Jan, + ChatGPT alternative, + local AI, + private AI, + conversational AI, + no-subscription fee, + large language model, + ] +--- + +# Customize and run AI across all of your devices + +Self-host and access your AI from anywhere with Jan server suite. + +:::warning + +Jan's server suite is actively under development and lacking documentation. +You can find the source code [here](https://github.com/janhq/jan/tree/dev/server) and [here](https://github.com/janhq/jan/blob/dev/docker-compose.yml). + +It is free to use. Your feedback is appreciated 🙏. + +::: + +## Why Home Servers + +We built [Jan Desktop](/desktop) for our personal use. We're now building Server Suite, for our team & community use. + +Our goal is to help teams, like ours, move past cobbling together demo apps to use AI at work. We should be able to customize and collaborate with AIs that are usable on a daily basis. + +**Check out [Server Suite](https://github.com/janhq/jan/tree/dev/server) if you need to:** + +- Self-host Jan, with multi client sync +- Customize it with Personal Data Connectors +- Simple Authentication (username / pw) +- Scales across Consumer-grade Hardware, including GPUs +- Everyone has admin level visibility and can see all conversations +- Create assistants that has access to the same knowledge base + +:::tip + +Not a Jan fan but convinced about running AI locally? No worries, here's a list of [awesome local ai](https://github.com/janhq/awesome-local-ai) alternatives that you can use in your home server. 
+ +::: diff --git a/docs/docs/server-suite/identity-access-management.md b/docs/docs/server-suite/identity-access-management.md new file mode 100644 index 000000000..bdeafa9bd --- /dev/null +++ b/docs/docs/server-suite/identity-access-management.md @@ -0,0 +1,3 @@ +--- +title: Identity & Access Control +--- \ No newline at end of file diff --git a/docs/docs/server-suite/observability.md b/docs/docs/server-suite/observability.md new file mode 100644 index 000000000..6371a6287 --- /dev/null +++ b/docs/docs/server-suite/observability.md @@ -0,0 +1,3 @@ +--- +title: Observability +--- \ No newline at end of file diff --git a/docs/docs/solutions/ai-employees.md b/docs/docs/solutions/ai-employees.md new file mode 100644 index 000000000..53f425ab5 --- /dev/null +++ b/docs/docs/solutions/ai-employees.md @@ -0,0 +1,4 @@ +--- +title: AI Employees +tags: [use-cases] +--- \ No newline at end of file diff --git a/docs/docs/solutions/ai-pc.md b/docs/docs/solutions/ai-pc.md new file mode 100644 index 000000000..415dadef9 --- /dev/null +++ b/docs/docs/solutions/ai-pc.md @@ -0,0 +1,4 @@ +--- +title: AI PC +tags: [use-cases] +--- \ No newline at end of file diff --git a/docs/docs/solutions/chatgpt-alternative.md b/docs/docs/solutions/chatgpt-alternative.md new file mode 100644 index 000000000..84ec2a59b --- /dev/null +++ b/docs/docs/solutions/chatgpt-alternative.md @@ -0,0 +1,4 @@ +--- +title: Self-hosted alternative to OpenAI's Platform +tags: [use-cases] +--- \ No newline at end of file diff --git a/docs/docs/solutions/consultants.md b/docs/docs/solutions/consultants.md new file mode 100644 index 000000000..085a84954 --- /dev/null +++ b/docs/docs/solutions/consultants.md @@ -0,0 +1,4 @@ +--- +title: Software Consultants +tags: [audiences] +--- \ No newline at end of file diff --git a/docs/docs/solutions/developers.md b/docs/docs/solutions/developers.md new file mode 100644 index 000000000..e912365bf --- /dev/null +++ b/docs/docs/solutions/developers.md @@ -0,0 +1,4 @@ +--- +title: 
Developers +tags: [audiences] +--- \ No newline at end of file diff --git a/docs/docs/solutions/enterprises.md b/docs/docs/solutions/enterprises.md new file mode 100644 index 000000000..0a219ee74 --- /dev/null +++ b/docs/docs/solutions/enterprises.md @@ -0,0 +1,4 @@ +--- +title: Enterprises +tags: [audiences] +--- \ No newline at end of file diff --git a/docs/docs/solutions/finance.md b/docs/docs/solutions/finance.md new file mode 100644 index 000000000..dde66d618 --- /dev/null +++ b/docs/docs/solutions/finance.md @@ -0,0 +1,4 @@ +--- +title: Finance +tags: [industries] +--- \ No newline at end of file diff --git a/docs/docs/solutions/government.md b/docs/docs/solutions/government.md new file mode 100644 index 000000000..cb52f5d71 --- /dev/null +++ b/docs/docs/solutions/government.md @@ -0,0 +1,4 @@ +--- +title: Government +tags: [industries] +--- \ No newline at end of file diff --git a/docs/docs/solutions/healthcare.md b/docs/docs/solutions/healthcare.md new file mode 100644 index 000000000..1cd85463b --- /dev/null +++ b/docs/docs/solutions/healthcare.md @@ -0,0 +1,4 @@ +--- +title: Healthcare +tags: [industries] +--- \ No newline at end of file diff --git a/docs/docs/solutions/legal.md b/docs/docs/solutions/legal.md new file mode 100644 index 000000000..6cc88372c --- /dev/null +++ b/docs/docs/solutions/legal.md @@ -0,0 +1,4 @@ +--- +title: Legal +tags: [industries] +--- \ No newline at end of file diff --git a/docs/docs/solutions/startups.md b/docs/docs/solutions/startups.md new file mode 100644 index 000000000..23cdb5bbe --- /dev/null +++ b/docs/docs/solutions/startups.md @@ -0,0 +1,4 @@ +--- +title: Startups +tags: [audiences] +--- \ No newline at end of file diff --git a/docs/docs/studio/studio.md b/docs/docs/studio/studio.md new file mode 100644 index 000000000..e69de29bb diff --git a/docs/docs/team/contributor-program.md b/docs/docs/team/contributor-program.md new file mode 100644 index 000000000..cacdfa047 --- /dev/null +++ 
b/docs/docs/team/contributor-program.md @@ -0,0 +1,3 @@ +--- +title: Contributor Program +--- \ No newline at end of file diff --git a/docs/docs/team/join-us.md b/docs/docs/team/join-us.md new file mode 100644 index 000000000..84b8c263c --- /dev/null +++ b/docs/docs/team/join-us.md @@ -0,0 +1,12 @@ +--- +title: Join us +--- + +- [ ] Explain Core Team, Contributors and Open Source approach + + +[Careers on Bamboo](https://janai.bamboohr.com/careers) + +### Careers + +Jan has a culture of ownership, independent thought, and lightning fast execution. If you'd like to join us, we have open positions on our [careers page](https://janai.bamboohr.com/careers). \ No newline at end of file diff --git a/docs/docs/team/team.md b/docs/docs/team/team.md new file mode 100644 index 000000000..7d5e07cfb --- /dev/null +++ b/docs/docs/team/team.md @@ -0,0 +1,28 @@ +--- +title: Who we are +--- + +What's Jan the company about? +We aim to build the cognitive framework for future robots + +### Open Source + +Jan is a startup with an open source business model. We believe in the need for an open source AI ecosystem, and are committed to building it. + +- [Jan Framework](https://github.com/janhq/jan) (AGPLv3) +- [Jan Desktop Client & Local server](https://jan.ai) (AGPLv3, built on Jan Framework) +- [Nitro: run Local AI](https://github.com/janhq/nitro) (AGPLv3) + + +### Bootstrapped + +Jan is currently a bootstrapped startup. + +We balance technical invention with the search for a sustainable business model. Thus, we appreciate any business inquiries that can balance growth with cashflow. + +**We invite you to join us on our journey to find PMF**. 
Join our [Discord here](https://discord.gg/BnHRr3Q7Ms) + +## Our Team + +- Contributors +- Core Team \ No newline at end of file diff --git a/docs/docs/wall-of-love.md b/docs/docs/wall-of-love.md new file mode 100644 index 000000000..f196c90e9 --- /dev/null +++ b/docs/docs/wall-of-love.md @@ -0,0 +1,3 @@ +--- +title: Wall of Love ❤️ +--- \ No newline at end of file diff --git a/docs/docusaurus.config.js b/docs/docusaurus.config.js index 4ed7f0bea..42ed55529 100644 --- a/docs/docusaurus.config.js +++ b/docs/docusaurus.config.js @@ -224,7 +224,7 @@ const config = { description: "Jan runs 100% offline on your computer, utilizes open-source AI models, prioritizes privacy, and is highly customizable.", keywords: - "Jan AI, Jan, ChatGPT alternative, local AI, private AI, conversational AI, no-subscription fee, large language model ", + "Jan AI, Jan, ChatGPT alternative, local AI, private AI, conversational AI, no-subscription fee, large language model ", applicationCategory: "BusinessApplication", operatingSystem: "Multiple", url: "https://jan.ai/", @@ -239,41 +239,84 @@ const config = { }, items: [ // Navbar Left + // { + // type: "docSidebar", + // sidebarId: "aboutSidebar", + // position: "left", + // label: "About", + // }, { - type: "docSidebar", - sidebarId: "guidesSidebar", + type: "dropdown", + label: "About", position: "left", - label: "Guides", + items: [ + { + type: "doc", + label: "What is Jan?", + docId: "about/about", + }, + { + type: "doc", + label: "Who we are", + docId: "team/team", + }, + { + type: "doc", + label: "Wall of love", + docId: "wall-of-love", + }, + ], }, { type: "docSidebar", - sidebarId: "developerSidebar", - position: "left", - label: "Developer", - }, - { - position: "left", - to: "/api-reference", - label: "API Reference", + sidebarId: "productSidebar", + position: "left", + label: "Product", }, { type: "docSidebar", + sidebarId: "ecosystemSidebar", position: "left", - sidebarId: "docsSidebar", - label: "Framework", + label: 
"Ecosystem", }, + // { + // type: "docSidebar", + // sidebarId: "pricingSidebar", + // positionL: "left", + // label: "Pricing", + // }, // Navbar right + { + type: "dropdown", + label: "Docs", + position: "right", + items: [ + { + type: "docSidebar", + sidebarId: "guidesSidebar", + label: "User Guide", + }, + { + type: "docSidebar", + sidebarId: "developerSidebar", + label: "Developer", + }, + { + to: "/api-reference", + label: "API Reference", + }, + { + type: "docSidebar", + sidebarId: "docsSidebar", + label: "Framework", + }, + ], + }, { to: "blog", label: "Blog", position: "right", }, - { - type: "docSidebar", - sidebarId: "aboutSidebar", - position: "right", - label: "About", - }, ], }, prism: { diff --git a/docs/sidebars.js b/docs/sidebars.js index 00eb8d40d..02ea7589f 100644 --- a/docs/sidebars.js +++ b/docs/sidebars.js @@ -13,33 +13,160 @@ /** @type {import('@docusaurus/plugin-content-docs').SidebarsConfig} */ const sidebars = { + aboutSidebar: [ + { + type: "category", + label: "What is Jan?", + link: { type: "doc", id: "about/about" }, + items: [ + //"about/roadmap", + "community/community", + ], + }, + { + type: "category", + label: "Who we are", + link: { type: "doc", id: "team/team" }, + items: ["team/join-us", "team/contributor-program"], + }, + "wall-of-love", + { + type: "category", + label: "How We Work", + link: { type: "doc", id: "how-we-work" }, + items: [ + "how-we-work/strategy/strategy", + "how-we-work/project-management/project-management", + { + type: "category", + label: "Engineering", + link: { type: "doc", id: "how-we-work/engineering/engineering" }, + items: [ + "how-we-work/engineering/ci-cd", + "how-we-work/engineering/qa", + ], + }, + "how-we-work/product-design/product-design", + "how-we-work/analytics/analytics", + "how-we-work/website-docs/website-docs", + ], + }, + ], + productSidebar: [ + { + type: "category", + label: "Platforms", + collapsible: false, + items: [ + "platforms/desktop", + "server-suite/home-server", + // 
"server-suite/enterprise", + // "platforms/mobile", + // "platforms/hub", + ], + }, + { + type: "category", + collapsible: true, + collapsed: false, + label: "Features", + link: { type: "doc", id: "features/features" }, + items: [ + "features/local", + "features/remote", + "features/api-server", + "features/extensions-framework", + "features/agents-framework", + "features/data-security", + ], + }, + // NOTE: Jan Server Suite will be torn out into it's own section in the future + // { + // type: "category", + // label: "Jan Server Suite", + // link: { type: "doc", id: "server-suite/server-suite" }, + // items: [ + // "server-suite/admin-console", + // "server-suite/identity-access-management", + // "server-suite/audit-compliance", + // "server-suite/observability", + // ], + // }, + ], + solutionSidebar: [ + { + type: "category", + label: "Use Cases", + collapsed: true, + collapsible: true, + items: ["solutions/ai-pc", "solutions/chatgpt-alternative"], + }, + { + type: "category", + label: "Sectors", + collapsed: true, + collapsible: true, + items: [ + "solutions/finance", + "solutions/healthcare", + "solutions/legal", + "solutions/government", + ], + }, + { + type: "category", + label: "Organization Type", + collapsed: true, + collapsible: true, + items: [ + "solutions/developers", + "solutions/consultants", + "solutions/startups", + "solutions/enterprises", + ], + }, + ], + + pricingSidebar: ["pricing/pricing"], + ecosystemSidebar: [ + "ecosystem/ecosystem", + { + type: "category", + label: "Partners", + link: { type: "doc", id: "partners/partners" }, + collapsible: true, + items: ["partners/become-a-partner"], + }, + { + type: "category", + label: "Integrations", + link: { type: "doc", id: "integrations" }, + items: [ + { + type: "autogenerated", + dirName: "integrations", + }, + ], + }, + ], guidesSidebar: [ { type: "autogenerated", dirName: "guides", }, ], - developerSidebar: [ { type: "autogenerated", dirName: "developer", }, ], - docsSidebar: [ { type: 
"autogenerated", dirName: "docs", }, ], - - aboutSidebar: [ - { - type: "autogenerated", - dirName: "about", - }, - ], }; module.exports = sidebars; diff --git a/docs/src/containers/Footer/index.js b/docs/src/containers/Footer/index.js index 80b5a2d4b..7cd648149 100644 --- a/docs/src/containers/Footer/index.js +++ b/docs/src/containers/Footer/index.js @@ -1,7 +1,7 @@ import React from "react"; import { AiOutlineGithub, AiOutlineTwitter } from "react-icons/ai"; -import { BiLogoDiscordAlt } from "react-icons/bi"; +import { BiLogoDiscordAlt, BiLogoLinkedin } from "react-icons/bi"; const socials = [ { @@ -16,6 +16,10 @@ const socials = [ icon: , href: "https://github.com/janhq/jan", }, + { + icon: , + href: "https://www.linkedin.com/company/janframework/", + } ]; const menus = [ @@ -59,6 +63,11 @@ const menus = [ path: "https://twitter.com/janframework", external: true, }, + { + menu: "LinkedIn", + path: "https://www.linkedin.com/company/janframework/", + external: true, + } ], }, { diff --git a/docs/static/img/bladerunner.png b/docs/static/img/bladerunner.png new file mode 100644 index 000000000..be3c6c634 Binary files /dev/null and b/docs/static/img/bladerunner.png differ diff --git a/docs/static/img/c3po-anakin.jpeg b/docs/static/img/c3po-anakin.jpeg new file mode 100644 index 000000000..f64917411 Binary files /dev/null and b/docs/static/img/c3po-anakin.jpeg differ diff --git a/docs/static/img/star-wars-droids.png b/docs/static/img/star-wars-droids.png new file mode 100644 index 000000000..41819af98 Binary files /dev/null and b/docs/static/img/star-wars-droids.png differ diff --git a/electron/.prettierrc b/electron/.prettierrc deleted file mode 100644 index 46f1abcb0..000000000 --- a/electron/.prettierrc +++ /dev/null @@ -1,8 +0,0 @@ -{ - "semi": false, - "singleQuote": true, - "quoteProps": "consistent", - "trailingComma": "es5", - "endOfLine": "auto", - "plugins": ["prettier-plugin-tailwindcss"] -} diff --git a/electron/handlers/app.ts b/electron/handlers/app.ts 
deleted file mode 100644 index c1f431ef3..000000000 --- a/electron/handlers/app.ts +++ /dev/null @@ -1,173 +0,0 @@ -import { app, ipcMain, dialog, shell } from 'electron' -import { join, basename, relative as getRelative, isAbsolute } from 'path' -import { WindowManager } from './../managers/window' -import { getResourcePath } from './../utils/path' -import { AppRoute, AppConfiguration } from '@janhq/core' -import { ServerConfig, startServer, stopServer } from '@janhq/server' -import { - ModuleManager, - getJanDataFolderPath, - getJanExtensionsPath, - init, - log, - logServer, - getAppConfigurations, - updateAppConfiguration, -} from '@janhq/core/node' - -export function handleAppIPCs() { - /** - * Handles the "openAppDirectory" IPC message by opening the app's user data directory. - * The `shell.openPath` method is used to open the directory in the user's default file explorer. - * @param _event - The IPC event object. - */ - ipcMain.handle(AppRoute.openAppDirectory, async (_event) => { - shell.openPath(getJanDataFolderPath()) - }) - - /** - * Opens a URL in the user's default browser. - * @param _event - The IPC event object. - * @param url - The URL to open. - */ - ipcMain.handle(AppRoute.openExternalUrl, async (_event, url) => { - shell.openExternal(url) - }) - - /** - * Opens a URL in the user's default browser. - * @param _event - The IPC event object. - * @param url - The URL to open. - */ - ipcMain.handle(AppRoute.openFileExplore, async (_event, url) => { - shell.openPath(url) - }) - - /** - * Joins multiple paths together, respect to the current OS. - */ - ipcMain.handle(AppRoute.joinPath, async (_event, paths: string[]) => - join(...paths) - ) - - /** - * Checks if the given path is a subdirectory of the given directory. - * - * @param _event - The IPC event object. - * @param from - The path to check. - * @param to - The directory to check against. - * - * @returns {Promise} - A promise that resolves with the result. 
- */ - ipcMain.handle( - AppRoute.isSubdirectory, - async (_event, from: string, to: string) => { - const relative = getRelative(from, to) - const isSubdir = - relative && !relative.startsWith('..') && !isAbsolute(relative) - - if (isSubdir === '') return false - else return isSubdir - } - ) - - /** - * Retrieve basename from given path, respect to the current OS. - */ - ipcMain.handle(AppRoute.baseName, async (_event, path: string) => - basename(path) - ) - - /** - * Start Jan API Server. - */ - ipcMain.handle(AppRoute.startServer, async (_event, configs?: ServerConfig) => - startServer({ - host: configs?.host, - port: configs?.port, - isCorsEnabled: configs?.isCorsEnabled, - isVerboseEnabled: configs?.isVerboseEnabled, - schemaPath: app.isPackaged - ? join(getResourcePath(), 'docs', 'openapi', 'jan.yaml') - : undefined, - baseDir: app.isPackaged - ? join(getResourcePath(), 'docs', 'openapi') - : undefined, - }) - ) - - /** - * Stop Jan API Server. - */ - ipcMain.handle(AppRoute.stopServer, stopServer) - - /** - * Relaunches the app in production - reload window in development. - * @param _event - The IPC event object. - * @param url - The URL to reload. - */ - ipcMain.handle(AppRoute.relaunch, async (_event) => { - ModuleManager.instance.clearImportedModules() - - if (app.isPackaged) { - app.relaunch() - app.exit() - } else { - for (const modulePath in ModuleManager.instance.requiredModules) { - delete require.cache[ - require.resolve(join(getJanExtensionsPath(), modulePath)) - ] - } - init({ - // Function to check from the main process that user wants to install a extension - confirmInstall: async (_extensions: string[]) => { - return true - }, - // Path to install extension to - extensionsPath: getJanExtensionsPath(), - }) - WindowManager.instance.currentWindow?.reload() - } - }) - - /** - * Log message to log file. - */ - ipcMain.handle(AppRoute.log, async (_event, message) => log(message)) - - /** - * Log message to log file. 
- */ - ipcMain.handle(AppRoute.logServer, async (_event, message) => - logServer(message) - ) - - ipcMain.handle(AppRoute.selectDirectory, async () => { - const mainWindow = WindowManager.instance.currentWindow - if (!mainWindow) { - console.error('No main window found') - return - } - const { canceled, filePaths } = await dialog.showOpenDialog(mainWindow, { - title: 'Select a folder', - buttonLabel: 'Select Folder', - properties: ['openDirectory', 'createDirectory'], - }) - if (canceled) { - return - } else { - return filePaths[0] - } - }) - - ipcMain.handle(AppRoute.getAppConfigurations, async () => - getAppConfigurations() - ) - - ipcMain.handle( - AppRoute.updateAppConfiguration, - async (_event, appConfiguration: AppConfiguration) => { - await updateAppConfiguration(appConfiguration) - } - ) -} diff --git a/electron/handlers/common.ts b/electron/handlers/common.ts new file mode 100644 index 000000000..5a54a92bd --- /dev/null +++ b/electron/handlers/common.ts @@ -0,0 +1,25 @@ +import { Handler, RequestHandler } from '@janhq/core/node' +import { ipcMain } from 'electron' +import { WindowManager } from '../managers/window' + +export function injectHandler() { + const ipcWrapper: Handler = ( + route: string, + listener: (...args: any[]) => any + ) => { + return ipcMain.handle(route, async (event, ...args: any[]) => { + return listener(...args) + }) + } + + const handler = new RequestHandler( + ipcWrapper, + (channel: string, args: any) => { + return WindowManager.instance.currentWindow?.webContents.send( + channel, + args + ) + } + ) + handler.handle() +} diff --git a/electron/handlers/download.ts b/electron/handlers/download.ts deleted file mode 100644 index f63e56f6b..000000000 --- a/electron/handlers/download.ts +++ /dev/null @@ -1,121 +0,0 @@ -import { ipcMain } from 'electron' -import { resolve } from 'path' -import { WindowManager } from './../managers/window' -import request from 'request' -import { createWriteStream, renameSync } from 'fs' -import { 
DownloadEvent, DownloadRoute } from '@janhq/core' -const progress = require('request-progress') -import { DownloadManager, getJanDataFolderPath, normalizeFilePath } from '@janhq/core/node' - -export function handleDownloaderIPCs() { - /** - * Handles the "pauseDownload" IPC message by pausing the download associated with the provided fileName. - * @param _event - The IPC event object. - * @param fileName - The name of the file being downloaded. - */ - ipcMain.handle(DownloadRoute.pauseDownload, async (_event, fileName) => { - DownloadManager.instance.networkRequests[fileName]?.pause() - }) - - /** - * Handles the "resumeDownload" IPC message by resuming the download associated with the provided fileName. - * @param _event - The IPC event object. - * @param fileName - The name of the file being downloaded. - */ - ipcMain.handle(DownloadRoute.resumeDownload, async (_event, fileName) => { - DownloadManager.instance.networkRequests[fileName]?.resume() - }) - - /** - * Handles the "abortDownload" IPC message by aborting the download associated with the provided fileName. - * The network request associated with the fileName is then removed from the networkRequests object. - * @param _event - The IPC event object. - * @param fileName - The name of the file being downloaded. - */ - ipcMain.handle(DownloadRoute.abortDownload, async (_event, fileName) => { - const rq = DownloadManager.instance.networkRequests[fileName] - if (rq) { - DownloadManager.instance.networkRequests[fileName] = undefined - rq?.abort() - } else { - WindowManager?.instance.currentWindow?.webContents.send( - DownloadEvent.onFileDownloadError, - { - fileName, - err: { message: 'aborted' }, - } - ) - } - }) - - /** - * Downloads a file from a given URL. - * @param _event - The IPC event object. - * @param url - The URL to download the file from. - * @param fileName - The name to give the downloaded file. 
- */ - ipcMain.handle( - DownloadRoute.downloadFile, - async (_event, url, fileName, network) => { - const strictSSL = !network?.ignoreSSL - const proxy = network?.proxy?.startsWith('http') - ? network.proxy - : undefined - - if (typeof fileName === 'string') { - fileName = normalizeFilePath(fileName) - } - const destination = resolve(getJanDataFolderPath(), fileName) - const rq = request({ url, strictSSL, proxy }) - - // Put request to download manager instance - DownloadManager.instance.setRequest(fileName, rq) - - // Downloading file to a temp file first - const downloadingTempFile = `${destination}.download` - - progress(rq, {}) - .on('progress', function (state: any) { - WindowManager?.instance.currentWindow?.webContents.send( - DownloadEvent.onFileDownloadUpdate, - { - ...state, - fileName, - } - ) - }) - .on('error', function (err: Error) { - WindowManager?.instance.currentWindow?.webContents.send( - DownloadEvent.onFileDownloadError, - { - fileName, - err, - } - ) - }) - .on('end', function () { - if (DownloadManager.instance.networkRequests[fileName]) { - // Finished downloading, rename temp file to actual file - renameSync(downloadingTempFile, destination) - - WindowManager?.instance.currentWindow?.webContents.send( - DownloadEvent.onFileDownloadSuccess, - { - fileName, - } - ) - DownloadManager.instance.setRequest(fileName, undefined) - } else { - WindowManager?.instance.currentWindow?.webContents.send( - DownloadEvent.onFileDownloadError, - { - fileName, - err: { message: 'aborted' }, - } - ) - } - }) - .pipe(createWriteStream(downloadingTempFile)) - } - ) -} diff --git a/electron/handlers/extension.ts b/electron/handlers/extension.ts deleted file mode 100644 index 763c4cdec..000000000 --- a/electron/handlers/extension.ts +++ /dev/null @@ -1,104 +0,0 @@ -import { ipcMain, webContents } from 'electron' -import { readdirSync } from 'fs' -import { join, extname } from 'path' - -import { - installExtensions, - getExtension, - removeExtension, - 
getActiveExtensions, - ModuleManager, - getJanExtensionsPath, -} from '@janhq/core/node' - -import { getResourcePath } from './../utils/path' -import { ExtensionRoute } from '@janhq/core' - -export function handleExtensionIPCs() { - /**MARK: General handlers */ - /** - * Invokes a function from a extension module in main node process. - * @param _event - The IPC event object. - * @param modulePath - The path to the extension module. - * @param method - The name of the function to invoke. - * @param args - The arguments to pass to the function. - * @returns The result of the invoked function. - */ - ipcMain.handle( - ExtensionRoute.invokeExtensionFunc, - async (_event, modulePath, method, ...args) => { - const module = require( - /* webpackIgnore: true */ join(getJanExtensionsPath(), modulePath) - ) - ModuleManager.instance.setModule(modulePath, module) - - if (typeof module[method] === 'function') { - return module[method](...args) - } else { - console.debug(module[method]) - console.error(`Function "${method}" does not exist in the module.`) - } - } - ) - - /** - * Returns the paths of the base extensions. - * @param _event - The IPC event object. - * @returns An array of paths to the base extensions. 
- */ - ipcMain.handle(ExtensionRoute.baseExtensions, async (_event) => { - const baseExtensionPath = join(getResourcePath(), 'pre-install') - return readdirSync(baseExtensionPath) - .filter((file) => extname(file) === '.tgz') - .map((file) => join(baseExtensionPath, file)) - }) - - /**MARK: Extension Manager handlers */ - ipcMain.handle(ExtensionRoute.installExtension, async (e, extensions) => { - // Install and activate all provided extensions - const installed = await installExtensions(extensions) - return JSON.parse(JSON.stringify(installed)) - }) - - // Register IPC route to uninstall a extension - ipcMain.handle( - ExtensionRoute.uninstallExtension, - async (e, extensions, reload) => { - // Uninstall all provided extensions - for (const ext of extensions) { - const extension = getExtension(ext) - await extension.uninstall() - if (extension.name) removeExtension(extension.name) - } - - // Reload all renderer pages if needed - reload && webContents.getAllWebContents().forEach((wc) => wc.reload()) - return true - } - ) - - // Register IPC route to update a extension - ipcMain.handle( - ExtensionRoute.updateExtension, - async (e, extensions, reload) => { - // Update all provided extensions - const updated: any[] = [] - for (const ext of extensions) { - const extension = getExtension(ext) - const res = await extension.update() - if (res) updated.push(extension) - } - - // Reload all renderer pages if needed - if (updated.length && reload) - webContents.getAllWebContents().forEach((wc) => wc.reload()) - - return JSON.parse(JSON.stringify(updated)) - } - ) - - // Register IPC route to get the list of active extensions - ipcMain.handle(ExtensionRoute.getActiveExtensions, () => { - return JSON.parse(JSON.stringify(getActiveExtensions())) - }) -} diff --git a/electron/handlers/fileManager.ts b/electron/handlers/fileManager.ts deleted file mode 100644 index e328cb53b..000000000 --- a/electron/handlers/fileManager.ts +++ /dev/null @@ -1,82 +0,0 @@ -import { ipcMain, app } 
from 'electron' -// @ts-ignore -import reflect from '@alumna/reflect' - -import { FileManagerRoute, FileStat } from '@janhq/core' -import { getResourcePath } from './../utils/path' -import fs from 'fs' -import { join } from 'path' -import { getJanDataFolderPath, normalizeFilePath } from '@janhq/core/node' - -/** - * Handles file system extensions operations. - */ -export function handleFileMangerIPCs() { - // Handles the 'syncFile' IPC event. This event is triggered to synchronize a file from a source path to a destination path. - ipcMain.handle( - FileManagerRoute.syncFile, - async (_event, src: string, dest: string) => { - return reflect({ - src, - dest, - recursive: true, - delete: false, - overwrite: true, - errorOnExist: false, - }) - } - ) - - // Handles the 'getJanDataFolderPath' IPC event. This event is triggered to get the user space path. - ipcMain.handle( - FileManagerRoute.getJanDataFolderPath, - (): Promise => Promise.resolve(getJanDataFolderPath()) - ) - - // Handles the 'getResourcePath' IPC event. This event is triggered to get the resource path. 
- ipcMain.handle(FileManagerRoute.getResourcePath, async (_event) => - getResourcePath() - ) - - ipcMain.handle(FileManagerRoute.getUserHomePath, async (_event) => - app.getPath('home') - ) - - // handle fs is directory here - ipcMain.handle( - FileManagerRoute.fileStat, - async (_event, path: string): Promise => { - const normalizedPath = normalizeFilePath(path) - - const fullPath = join(getJanDataFolderPath(), normalizedPath) - const isExist = fs.existsSync(fullPath) - if (!isExist) return undefined - - const isDirectory = fs.lstatSync(fullPath).isDirectory() - const size = fs.statSync(fullPath).size - - const fileStat: FileStat = { - isDirectory, - size, - } - - return fileStat - } - ) - - ipcMain.handle( - FileManagerRoute.writeBlob, - async (_event, path: string, data: string): Promise => { - try { - const normalizedPath = normalizeFilePath(path) - const dataBuffer = Buffer.from(data, 'base64') - fs.writeFileSync( - join(getJanDataFolderPath(), normalizedPath), - dataBuffer - ) - } catch (err) { - console.error(`writeFile ${path} result: ${err}`) - } - } - ) -} diff --git a/electron/handlers/fs.ts b/electron/handlers/fs.ts deleted file mode 100644 index 34026b940..000000000 --- a/electron/handlers/fs.ts +++ /dev/null @@ -1,26 +0,0 @@ -import { ipcMain } from 'electron' - -import { getJanDataFolderPath, normalizeFilePath } from '@janhq/core/node' -import fs from 'fs' -import { FileManagerRoute, FileSystemRoute } from '@janhq/core' -import { join } from 'path' -/** - * Handles file system operations. - */ -export function handleFsIPCs() { - const moduleName = 'fs' - Object.values(FileSystemRoute).forEach((route) => { - ipcMain.handle(route, async (event, ...args) => { - return import(moduleName).then((mdl) => - mdl[route]( - ...args.map((arg) => - typeof arg === 'string' && - (arg.startsWith(`file:/`) || arg.startsWith(`file:\\`)) - ? 
join(getJanDataFolderPath(), normalizeFilePath(arg)) - : arg - ) - ) - ) - }) - }) -} diff --git a/electron/handlers/native.ts b/electron/handlers/native.ts new file mode 100644 index 000000000..14ead07bd --- /dev/null +++ b/electron/handlers/native.ts @@ -0,0 +1,86 @@ +import { app, ipcMain, dialog, shell } from 'electron' +import { join } from 'path' +import { WindowManager } from '../managers/window' +import { + ModuleManager, + getJanDataFolderPath, + getJanExtensionsPath, + init, +} from '@janhq/core/node' +import { NativeRoute } from '@janhq/core' + +export function handleAppIPCs() { + /** + * Handles the "openAppDirectory" IPC message by opening the app's user data directory. + * The `shell.openPath` method is used to open the directory in the user's default file explorer. + * @param _event - The IPC event object. + */ + ipcMain.handle(NativeRoute.openAppDirectory, async (_event) => { + shell.openPath(getJanDataFolderPath()) + }) + + /** + * Opens a URL in the user's default browser. + * @param _event - The IPC event object. + * @param url - The URL to open. + */ + ipcMain.handle(NativeRoute.openExternalUrl, async (_event, url) => { + shell.openExternal(url) + }) + + /** + * Opens a URL in the user's default browser. + * @param _event - The IPC event object. + * @param url - The URL to open. + */ + ipcMain.handle(NativeRoute.openFileExplore, async (_event, url) => { + shell.openPath(url) + }) + + /** + * Relaunches the app in production - reload window in development. + * @param _event - The IPC event object. + * @param url - The URL to reload. 
+ */ + ipcMain.handle(NativeRoute.relaunch, async (_event) => { + ModuleManager.instance.clearImportedModules() + + if (app.isPackaged) { + app.relaunch() + app.exit() + } else { + for (const modulePath in ModuleManager.instance.requiredModules) { + delete require.cache[ + require.resolve(join(getJanExtensionsPath(), modulePath)) + ] + } + init({ + // Function to check from the main process that user wants to install a extension + confirmInstall: async (_extensions: string[]) => { + return true + }, + // Path to install extension to + extensionsPath: getJanExtensionsPath(), + }) + WindowManager.instance.currentWindow?.reload() + } + }) + + ipcMain.handle(NativeRoute.selectDirectory, async () => { + const mainWindow = WindowManager.instance.currentWindow + if (!mainWindow) { + console.error('No main window found') + return + } + const { canceled, filePaths } = await dialog.showOpenDialog(mainWindow, { + title: 'Select a folder', + buttonLabel: 'Select Folder', + properties: ['openDirectory', 'createDirectory'], + }) + if (canceled) { + return + } else { + return filePaths[0] + } + }) +} diff --git a/electron/handlers/update.ts b/electron/handlers/update.ts index cbb34c22b..0d8cc4cc0 100644 --- a/electron/handlers/update.ts +++ b/electron/handlers/update.ts @@ -11,7 +11,8 @@ export function handleAppUpdates() { /* New Update Available */ autoUpdater.on('update-available', async (_info: any) => { const action = await dialog.showMessageBox({ - message: `Update available. 
Do you want to download the latest update?`, + title: 'Update Available', + message: 'Would you like to download and install it now?', buttons: ['Download', 'Later'], }) if (action.response === 0) await autoUpdater.downloadUpdate() @@ -36,7 +37,7 @@ export function handleAppUpdates() { autoUpdater.on('error', (info: any) => { WindowManager.instance.currentWindow?.webContents.send( AppEvent.onAppUpdateDownloadError, - {} + info ) }) diff --git a/electron/main.ts b/electron/main.ts index 5d7e59c0f..de18b8f9d 100644 --- a/electron/main.ts +++ b/electron/main.ts @@ -1,4 +1,4 @@ -import { app, BrowserWindow } from 'electron' +import { app, BrowserWindow, shell } from 'electron' import { join } from 'path' /** * Managers @@ -9,12 +9,9 @@ import { log } from '@janhq/core/node' /** * IPC Handlers **/ -import { handleDownloaderIPCs } from './handlers/download' -import { handleExtensionIPCs } from './handlers/extension' -import { handleFileMangerIPCs } from './handlers/fileManager' -import { handleAppIPCs } from './handlers/app' +import { injectHandler } from './handlers/common' import { handleAppUpdates } from './handlers/update' -import { handleFsIPCs } from './handlers/fs' +import { handleAppIPCs } from './handlers/native' /** * Utils @@ -25,25 +22,12 @@ import { migrateExtensions } from './utils/migration' import { cleanUpAndQuit } from './utils/clean' import { setupExtensions } from './utils/extension' import { setupCore } from './utils/setup' +import { setupReactDevTool } from './utils/dev' +import { cleanLogs } from './utils/log' app .whenReady() - .then(async () => { - if (!app.isPackaged) { - // Which means you're running from source code - const { default: installExtension, REACT_DEVELOPER_TOOLS } = await import( - 'electron-devtools-installer' - ) // Don't use import on top level, since the installer package is dev-only - try { - const name = installExtension(REACT_DEVELOPER_TOOLS) - console.log(`Added Extension: ${name}`) - } catch (err) { - console.log('An error 
occurred while installing devtools:') - console.error(err) - // Only log the error and don't throw it because it's not critical - } - } - }) + .then(setupReactDevTool) .then(setupCore) .then(createUserSpace) .then(migrateExtensions) @@ -59,6 +43,7 @@ app } }) }) + .then(() => cleanLogs()) app.once('window-all-closed', () => { cleanUpAndQuit() @@ -92,23 +77,24 @@ function createMainWindow() { /* Open external links in the default browser */ mainWindow.webContents.setWindowOpenHandler(({ url }) => { - require('electron').shell.openExternal(url) + shell.openExternal(url) return { action: 'deny' } }) /* Enable dev tools for development */ if (!app.isPackaged) mainWindow.webContents.openDevTools() + log(`Version: ${app.getVersion()}`) } /** * Handles various IPC messages from the renderer process. */ function handleIPCs() { - handleFsIPCs() - handleDownloaderIPCs() - handleExtensionIPCs() + // Inject core handlers for IPCs + injectHandler() + + // Handle native IPCs handleAppIPCs() - handleFileMangerIPCs() } /* diff --git a/electron/merge-latest-ymls.js b/electron/merge-latest-ymls.js index 8172a3176..ee8caf825 100644 --- a/electron/merge-latest-ymls.js +++ b/electron/merge-latest-ymls.js @@ -9,7 +9,9 @@ const file3 = args[2] // check that all arguments are present and throw error instead if (!file1 || !file2 || !file3) { - throw new Error('Please provide 3 file paths as arguments: path to file1, to file2 and destination path') + throw new Error( + 'Please provide 3 file paths as arguments: path to file1, to file2 and destination path' + ) } const doc1 = yaml.load(fs.readFileSync(file1, 'utf8')) diff --git a/electron/package.json b/electron/package.json index 08f15b262..a89803077 100644 --- a/electron/package.json +++ b/electron/package.json @@ -4,6 +4,7 @@ "main": "./build/main.js", "author": "Jan ", "license": "MIT", + "productName": "Jan", "homepage": "https://github.com/janhq/jan/tree/main/electron", "description": "Use offline LLMs with your own data. 
Run open source models like Llama2 or Falcon on your internal computers/servers.", "build": { @@ -11,7 +12,6 @@ "productName": "Jan", "files": [ "renderer/**/*", - "build/*.{js,map}", "build/**/*.{js,map}", "pre-install", "models/**/*", @@ -57,16 +57,17 @@ "scripts": { "lint": "eslint . --ext \".js,.jsx,.ts,.tsx\"", "test:e2e": "playwright test --workers=1", - "dev": "tsc -p . && electron .", - "build": "run-script-os", - "build:test": "run-script-os", + "copy:assets": "rimraf --glob \"./pre-install/*.tgz\" && cpx \"../pre-install/*.tgz\" \"./pre-install\"", + "dev": "yarn copy:assets && tsc -p . && electron .", + "build": "yarn copy:assets && run-script-os", + "build:test": "yarn copy:assets && run-script-os", "build:test:darwin": "tsc -p . && electron-builder -p never -m --dir", "build:test:win32": "tsc -p . && electron-builder -p never -w --dir", "build:test:linux": "tsc -p . && electron-builder -p never -l --dir", "build:darwin": "tsc -p . && electron-builder -p never -m", "build:win32": "tsc -p . && electron-builder -p never -w", "build:linux": "tsc -p . && electron-builder -p never -l deb -l AppImage", - "build:publish": "run-script-os", + "build:publish": "yarn copy:assets && run-script-os", "build:publish:darwin": "tsc -p . && electron-builder -p always -m", "build:publish:win32": "tsc -p . && electron-builder -p always -w", "build:publish:linux": "tsc -p . 
&& electron-builder -p always -l deb -l AppImage" @@ -76,7 +77,6 @@ "@janhq/core": "link:./core", "@janhq/server": "link:./server", "@npmcli/arborist": "^7.1.0", - "@types/request": "^2.48.12", "@uiball/loaders": "^1.3.0", "electron-store": "^8.1.0", "electron-updater": "^6.1.7", @@ -85,8 +85,6 @@ "pacote": "^17.0.4", "request": "^2.88.2", "request-progress": "^3.0.0", - "rimraf": "^5.0.5", - "typescript": "^5.2.2", "ulid": "^2.3.0", "use-debounce": "^9.0.4" }, @@ -95,6 +93,7 @@ "@playwright/test": "^1.38.1", "@types/npmcli__arborist": "^5.6.4", "@types/pacote": "^11.1.7", + "@types/request": "^2.48.12", "@typescript-eslint/eslint-plugin": "^6.7.3", "@typescript-eslint/parser": "^6.7.3", "electron": "28.0.0", @@ -102,7 +101,9 @@ "electron-devtools-installer": "^3.2.0", "electron-playwright-helpers": "^1.6.0", "eslint-plugin-react": "^7.33.2", - "run-script-os": "^1.1.6" + "rimraf": "^5.0.5", + "run-script-os": "^1.1.6", + "typescript": "^5.2.2" }, "installConfig": { "hoistingLimits": "workspaces" diff --git a/electron/playwright.config.ts b/electron/playwright.config.ts index 8047b7513..d3dff40c6 100644 --- a/electron/playwright.config.ts +++ b/electron/playwright.config.ts @@ -3,14 +3,12 @@ import { PlaywrightTestConfig } from '@playwright/test' const config: PlaywrightTestConfig = { testDir: './tests/e2e', retries: 0, - globalTimeout: 300000, + globalTimeout: 350000, use: { screenshot: 'only-on-failure', video: 'retain-on-failure', trace: 'retain-on-failure', }, - reporter: [['html', { outputFolder: './playwright-report' }]], } - export default config diff --git a/electron/sign.js b/electron/sign.js index 6e973eb6e..73afedc4e 100644 --- a/electron/sign.js +++ b/electron/sign.js @@ -1,44 +1,48 @@ -const { exec } = require('child_process'); +const { exec } = require('child_process') +function sign({ + path, + name, + certUrl, + clientId, + tenantId, + clientSecret, + certName, + timestampServer, + version, +}) { + return new Promise((resolve, reject) => { + const 
command = `azuresigntool.exe sign -kvu "${certUrl}" -kvi "${clientId}" -kvt "${tenantId}" -kvs "${clientSecret}" -kvc "${certName}" -tr "${timestampServer}" -v "${path}"` -function sign({ path, name, certUrl, clientId, tenantId, clientSecret, certName, timestampServer, version }) { - return new Promise((resolve, reject) => { - - const command = `azuresigntool.exe sign -kvu "${certUrl}" -kvi "${clientId}" -kvt "${tenantId}" -kvs "${clientSecret}" -kvc "${certName}" -tr "${timestampServer}" -v "${path}"`; - - - exec(command, (error, stdout, stderr) => { - if (error) { - console.error(`Error: ${error}`); - return reject(error); - } - console.log(`stdout: ${stdout}`); - console.error(`stderr: ${stderr}`); - resolve(); - }); - }); + exec(command, (error, stdout, stderr) => { + if (error) { + console.error(`Error: ${error}`) + return reject(error) + } + console.log(`stdout: ${stdout}`) + console.error(`stderr: ${stderr}`) + resolve() + }) + }) } +exports.default = async function (options) { + const certUrl = process.env.AZURE_KEY_VAULT_URI + const clientId = process.env.AZURE_CLIENT_ID + const tenantId = process.env.AZURE_TENANT_ID + const clientSecret = process.env.AZURE_CLIENT_SECRET + const certName = process.env.AZURE_CERT_NAME + const timestampServer = 'http://timestamp.globalsign.com/tsa/r6advanced1' -exports.default = async function(options) { - - const certUrl = process.env.AZURE_KEY_VAULT_URI; - const clientId = process.env.AZURE_CLIENT_ID; - const tenantId = process.env.AZURE_TENANT_ID; - const clientSecret = process.env.AZURE_CLIENT_SECRET; - const certName = process.env.AZURE_CERT_NAME; - const timestampServer = 'http://timestamp.globalsign.com/tsa/r6advanced1'; - - - await sign({ - path: options.path, - name: "jan-win-x64", - certUrl, - clientId, - tenantId, - clientSecret, - certName, - timestampServer, - version: options.version - }); -}; + await sign({ + path: options.path, + name: 'jan-win-x64', + certUrl, + clientId, + tenantId, + clientSecret, + 
certName, + timestampServer, + version: options.version, + }) +} diff --git a/electron/tests/config/constants.ts b/electron/tests/config/constants.ts new file mode 100644 index 000000000..7039ad58c --- /dev/null +++ b/electron/tests/config/constants.ts @@ -0,0 +1,4 @@ +export const Constants = { + VIDEO_DIR: './playwright-video', + TIMEOUT: '300000', +} diff --git a/electron/tests/config/fixtures.ts b/electron/tests/config/fixtures.ts new file mode 100644 index 000000000..680b09785 --- /dev/null +++ b/electron/tests/config/fixtures.ts @@ -0,0 +1,119 @@ +import { + _electron as electron, + BrowserContext, + ElectronApplication, + expect, + Page, + test as base, +} from '@playwright/test' +import { + ElectronAppInfo, + findLatestBuild, + parseElectronApp, + stubDialog, +} from 'electron-playwright-helpers' +import { Constants } from './constants' +import { HubPage } from '../pages/hubPage' +import { CommonActions } from '../pages/commonActions' + +export let electronApp: ElectronApplication +export let page: Page +export let appInfo: ElectronAppInfo +export const TIMEOUT = parseInt(process.env.TEST_TIMEOUT || Constants.TIMEOUT) + +export async function setupElectron() { + process.env.CI = 'e2e' + + const latestBuild = findLatestBuild('dist') + expect(latestBuild).toBeTruthy() + + // parse the packaged Electron app and find paths and other info + appInfo = parseElectronApp(latestBuild) + expect(appInfo).toBeTruthy() + + electronApp = await electron.launch({ + args: [appInfo.main], // main file from package.json + executablePath: appInfo.executable, // path to the Electron executable + // recordVideo: { dir: Constants.VIDEO_DIR }, // Specify the directory for video recordings + }) + await stubDialog(electronApp, 'showMessageBox', { response: 1 }) + + page = await electronApp.firstWindow({ + timeout: TIMEOUT, + }) +} + +export async function teardownElectron() { + await page.close() + await electronApp.close() +} + +/** + * this fixture is needed to record and attach 
videos / screenshot on failed tests when + * tests are run in serial mode (i.e. browser is not closed between tests) + */ +export const test = base.extend< + { + commonActions: CommonActions + hubPage: HubPage + attachVideoPage: Page + attachScreenshotsToReport: void + }, + { createVideoContext: BrowserContext } +>({ + commonActions: async ({ request }, use, testInfo) => { + await use(new CommonActions(page, testInfo)) + }, + hubPage: async ({ commonActions }, use) => { + await use(new HubPage(page, commonActions)) + }, + createVideoContext: [ + async ({ playwright }, use) => { + const context = electronApp.context() + await use(context) + }, + { scope: 'worker' }, + ], + + attachVideoPage: [ + async ({ createVideoContext }, use, testInfo) => { + await use(page) + + if (testInfo.status !== testInfo.expectedStatus) { + const path = await createVideoContext.pages()[0].video()?.path() + await createVideoContext.close() + await testInfo.attach('video', { + path: path, + }) + } + }, + { scope: 'test', auto: true }, + ], + + attachScreenshotsToReport: [ + async ({ commonActions }, use, testInfo) => { + await use() + + // After the test, we can check whether the test passed or failed. 
+ if (testInfo.status !== testInfo.expectedStatus) { + await commonActions.takeScreenshot('') + } + }, + { auto: true }, + ], +}) + +test.setTimeout(TIMEOUT) + +test.beforeAll(async () => { + await setupElectron() + await page.waitForSelector('img[alt="Jan - Logo"]', { + state: 'visible', + timeout: TIMEOUT, + }) +}) + +test.afterAll(async () => { + // temporally disabling this due to the config for parallel testing WIP + // teardownElectron() +}) diff --git a/electron/tests/e2e/hub.e2e.spec.ts b/electron/tests/e2e/hub.e2e.spec.ts index 68632058e..d968e7641 100644 --- a/electron/tests/e2e/hub.e2e.spec.ts +++ b/electron/tests/e2e/hub.e2e.spec.ts @@ -1,34 +1,19 @@ -import { - page, - test, - setupElectron, - teardownElectron, - TIMEOUT, -} from '../pages/basePage' +import { test, appInfo } from '../config/fixtures' import { expect } from '@playwright/test' test.beforeAll(async () => { - const appInfo = await setupElectron() - expect(appInfo.asar).toBe(true) - expect(appInfo.executable).toBeTruthy() - expect(appInfo.main).toBeTruthy() - expect(appInfo.name).toBe('jan') - expect(appInfo.packageJson).toBeTruthy() - expect(appInfo.packageJson.name).toBe('jan') - expect(appInfo.platform).toBeTruthy() - expect(appInfo.platform).toBe(process.platform) - expect(appInfo.resourcesDir).toBeTruthy() -}) - -test.afterAll(async () => { - await teardownElectron() -}) - -test('explores hub', async () => { - await page.getByTestId('Hub').first().click({ - timeout: TIMEOUT, - }) - await page.getByTestId('hub-container-test-id').isVisible({ - timeout: TIMEOUT, + expect(appInfo).toMatchObject({ + asar: true, + executable: expect.anything(), + main: expect.anything(), + name: 'jan', + packageJson: expect.objectContaining({ name: 'jan' }), + platform: process.platform, + resourcesDir: expect.anything(), }) }) + +test('explores hub', async ({ hubPage }) => { + await hubPage.navigateByMenu() + await hubPage.verifyContainerVisible() +}) diff --git a/electron/tests/e2e/navigation.e2e.spec.ts 
b/electron/tests/e2e/navigation.e2e.spec.ts index 2da59953c..b599a951c 100644 --- a/electron/tests/e2e/navigation.e2e.spec.ts +++ b/electron/tests/e2e/navigation.e2e.spec.ts @@ -1,32 +1,12 @@ import { expect } from '@playwright/test' -import { - page, - setupElectron, - TIMEOUT, - test, - teardownElectron, -} from '../pages/basePage' - -test.beforeAll(async () => { - await setupElectron() -}) - -test.afterAll(async () => { - await teardownElectron() -}) +import { page, test, TIMEOUT } from '../config/fixtures' test('renders left navigation panel', async () => { - const systemMonitorBtn = await page - .getByTestId('System Monitor') - .first() - .isEnabled({ - timeout: TIMEOUT, - }) const settingsBtn = await page .getByTestId('Thread') .first() .isEnabled({ timeout: TIMEOUT }) - expect([systemMonitorBtn, settingsBtn].filter((e) => !e).length).toBe(0) + expect([settingsBtn].filter((e) => !e).length).toBe(0) // Chat section should be there await page.getByTestId('Local API Server').first().click({ timeout: TIMEOUT, diff --git a/electron/tests/e2e/settings.e2e.spec.ts b/electron/tests/e2e/settings.e2e.spec.ts index 54215d9b1..06b4d1acc 100644 --- a/electron/tests/e2e/settings.e2e.spec.ts +++ b/electron/tests/e2e/settings.e2e.spec.ts @@ -1,23 +1,11 @@ import { expect } from '@playwright/test' -import { - setupElectron, - teardownElectron, - test, - page, - TIMEOUT, -} from '../pages/basePage' - -test.beforeAll(async () => { - await setupElectron() -}) - -test.afterAll(async () => { - await teardownElectron() -}) +import { test, page, TIMEOUT } from '../config/fixtures' test('shows settings', async () => { - await page.getByTestId('Settings').first().click({ timeout: TIMEOUT }) + await page.getByTestId('Settings').first().click({ + timeout: TIMEOUT, + }) const settingDescription = page.getByTestId('testid-setting-description') await expect(settingDescription).toBeVisible({ timeout: TIMEOUT }) }) diff --git a/electron/tests/pages/basePage.ts 
b/electron/tests/pages/basePage.ts index 5f1a6fca1..4e16a3c23 100644 --- a/electron/tests/pages/basePage.ts +++ b/electron/tests/pages/basePage.ts @@ -1,67 +1,49 @@ -import { - expect, - test as base, - _electron as electron, - ElectronApplication, - Page, -} from '@playwright/test' -import { - findLatestBuild, - parseElectronApp, - stubDialog, -} from 'electron-playwright-helpers' +import { Page, expect } from '@playwright/test' +import { CommonActions } from './commonActions' +import { TIMEOUT } from '../config/fixtures' -export const TIMEOUT: number = parseInt(process.env.TEST_TIMEOUT || '300000') +export class BasePage { + menuId: string -export let electronApp: ElectronApplication -export let page: Page + constructor( + protected readonly page: Page, + readonly action: CommonActions, + protected containerId: string + ) {} -export async function setupElectron() { - process.env.CI = 'e2e' + public getValue(key: string) { + return this.action.getValue(key) + } - const latestBuild = findLatestBuild('dist') - expect(latestBuild).toBeTruthy() + public setValue(key: string, value: string) { + this.action.setValue(key, value) + } - // parse the packaged Electron app and find paths and other info - const appInfo = parseElectronApp(latestBuild) - expect(appInfo).toBeTruthy() + async takeScreenshot(name: string = '') { + await this.action.takeScreenshot(name) + } - electronApp = await electron.launch({ - args: [appInfo.main], // main file from package.json - executablePath: appInfo.executable, // path to the Electron executable - }) - await stubDialog(electronApp, 'showMessageBox', { response: 1 }) + async navigateByMenu() { + await this.page.getByTestId(this.menuId).first().click() + } - page = await electronApp.firstWindow({ - timeout: TIMEOUT, - }) - // Return appInfo for future use - return appInfo + async verifyContainerVisible() { + const container = this.page.getByTestId(this.containerId) + expect(container.isVisible()).toBeTruthy() + } + + async 
waitUpdateLoader() { + await this.isElementVisible('img[alt="Jan - Logo"]') + } + + //wait and find a specific element with it's selector and return Visible + async isElementVisible(selector: any) { + let isVisible = true + await this.page + .waitForSelector(selector, { state: 'visible', timeout: TIMEOUT }) + .catch(() => { + isVisible = false + }) + return isVisible + } } - -export async function teardownElectron() { - await page.close() - await electronApp.close() -} - -export const test = base.extend<{ - attachScreenshotsToReport: void -}>({ - attachScreenshotsToReport: [ - async ({ request }, use, testInfo) => { - await use() - - // After the test, we can check whether the test passed or failed. - if (testInfo.status !== testInfo.expectedStatus) { - const screenshot = await page.screenshot() - await testInfo.attach('screenshot', { - body: screenshot, - contentType: 'image/png', - }) - } - }, - { auto: true }, - ], -}) - -test.setTimeout(TIMEOUT) diff --git a/electron/tests/pages/commonActions.ts b/electron/tests/pages/commonActions.ts new file mode 100644 index 000000000..08ea15f92 --- /dev/null +++ b/electron/tests/pages/commonActions.ts @@ -0,0 +1,34 @@ +import { Page, TestInfo } from '@playwright/test' +import { page } from '../config/fixtures' + +export class CommonActions { + private testData = new Map() + + constructor( + public page: Page, + public testInfo: TestInfo + ) {} + + async takeScreenshot(name: string) { + const screenshot = await page.screenshot({ + fullPage: true, + }) + const attachmentName = `${this.testInfo.title}_${name || new Date().toISOString().slice(5, 19).replace(/[-:]/g, '').replace('T', '_')}` + await this.testInfo.attach(attachmentName.replace(/\s+/g, ''), { + body: screenshot, + contentType: 'image/png', + }) + } + + async hooks() { + console.log('hook from the scenario page') + } + + setValue(key: string, value: string) { + this.testData.set(key, value) + } + + getValue(key: string) { + return this.testData.get(key) + } +} diff 
--git a/electron/tests/pages/hubPage.ts b/electron/tests/pages/hubPage.ts new file mode 100644 index 000000000..0299ab15d --- /dev/null +++ b/electron/tests/pages/hubPage.ts @@ -0,0 +1,15 @@ +import { Page } from '@playwright/test' +import { BasePage } from './basePage' +import { CommonActions } from './commonActions' + +export class HubPage extends BasePage { + readonly menuId: string = 'Hub' + static readonly containerId: string = 'hub-container-test-id' + + constructor( + public page: Page, + readonly action: CommonActions + ) { + super(page, action, HubPage.containerId) + } +} diff --git a/electron/utils/dev.ts b/electron/utils/dev.ts new file mode 100644 index 000000000..b2a492886 --- /dev/null +++ b/electron/utils/dev.ts @@ -0,0 +1,18 @@ +import { app } from 'electron' + +export const setupReactDevTool = async () => { + if (!app.isPackaged) { + // Which means you're running from source code + const { default: installExtension, REACT_DEVELOPER_TOOLS } = await import( + 'electron-devtools-installer' + ) // Don't use import on top level, since the installer package is dev-only + try { + const name = await installExtension(REACT_DEVELOPER_TOOLS) + console.log(`Added Extension: ${name}`) + } catch (err) { + console.log('An error occurred while installing devtools:') + console.error(err) + // Only log the error and don't throw it because it's not critical + } + } +} diff --git a/electron/utils/disposable.ts b/electron/utils/disposable.ts index 462f7e3e5..59018a775 100644 --- a/electron/utils/disposable.ts +++ b/electron/utils/disposable.ts @@ -1,8 +1,8 @@ export function dispose(requiredModules: Record) { for (const key in requiredModules) { - const module = requiredModules[key]; - if (typeof module["dispose"] === "function") { - module["dispose"](); + const module = requiredModules[key] + if (typeof module['dispose'] === 'function') { + module['dispose']() } } } diff --git a/electron/utils/log.ts b/electron/utils/log.ts new file mode 100644 index 
000000000..84c185d75 --- /dev/null +++ b/electron/utils/log.ts @@ -0,0 +1,67 @@ +import { getJanDataFolderPath } from '@janhq/core/node' +import * as fs from 'fs' +import * as path from 'path' + +export function cleanLogs( + maxFileSizeBytes?: number | undefined, + daysToKeep?: number | undefined, + delayMs?: number | undefined +): void { + const size = maxFileSizeBytes ?? 1 * 1024 * 1024 // 1 MB + const days = daysToKeep ?? 7 // 7 days + const delays = delayMs ?? 10000 // 10 seconds + const logDirectory = path.join(getJanDataFolderPath(), 'logs') + + // Perform log cleaning + const currentDate = new Date() + fs.readdir(logDirectory, (err, files) => { + if (err) { + console.error('Error reading log directory:', err) + return + } + + files.forEach((file) => { + const filePath = path.join(logDirectory, file) + fs.stat(filePath, (err, stats) => { + if (err) { + console.error('Error getting file stats:', err) + return + } + + // Check size + if (stats.size > size) { + fs.unlink(filePath, (err) => { + if (err) { + console.error('Error deleting log file:', err) + return + } + console.log( + `Deleted log file due to exceeding size limit: ${filePath}` + ) + }) + } else { + // Check age + const creationDate = new Date(stats.ctime) + const daysDifference = Math.floor( + (currentDate.getTime() - creationDate.getTime()) / + (1000 * 3600 * 24) + ) + if (daysDifference > days) { + fs.unlink(filePath, (err) => { + if (err) { + console.error('Error deleting log file:', err) + return + } + console.log(`Deleted old log file: ${filePath}`) + }) + } + } + }) + }) + }) + + // Schedule the next execution with doubled delays + setTimeout(() => { + cleanLogs(maxFileSizeBytes, daysToKeep, delays * 2) + }, delays) +} diff --git a/electron/utils/menu.ts b/electron/utils/menu.ts index 7721b7c78..893907c48 100644 --- a/electron/utils/menu.ts +++ b/electron/utils/menu.ts @@ -1,19 +1,41 @@ // @ts-nocheck -import { app, Menu, dialog, shell } from 'electron' -const isMac = process.platform === 
'darwin' +import { app, Menu, shell, dialog } from 'electron' import { autoUpdater } from 'electron-updater' -import { compareSemanticVersions } from './versionDiff' +import { log } from '@janhq/core/node' +const isMac = process.platform === 'darwin' const template: (Electron.MenuItemConstructorOptions | Electron.MenuItem)[] = [ { label: app.name, submenu: [ - { role: 'about' }, + { + label: `About ${app.name}`, + click: () => + dialog.showMessageBox({ + title: `Jan`, + message: `Jan Version v${app.getVersion()}\n\nCopyright © 2024 Jan`, + }), + }, { label: 'Check for Updates...', click: () => // Check for updates and notify user if there are any - autoUpdater.checkForUpdatesAndNotify(), + autoUpdater + .checkForUpdatesAndNotify() + .then((updateCheckResult) => { + if ( + !updateCheckResult?.updateInfo || + updateCheckResult?.updateInfo.version === app.getVersion() + ) { + dialog.showMessageBox({ + message: `No updates available.`, + }) + return + } + }) + .catch((error) => { + log('Error checking for updates:' + JSON.stringify(error)) + }), }, { type: 'separator' }, { role: 'services' }, diff --git a/electron/utils/path.ts b/electron/utils/path.ts index 4e47cc312..4438156bc 100644 --- a/electron/utils/path.ts +++ b/electron/utils/path.ts @@ -1,5 +1,3 @@ -import { join } from 'path' -import { app } from 'electron' import { mkdir } from 'fs-extra' import { existsSync } from 'fs' import { getJanDataFolderPath } from '@janhq/core/node' @@ -16,13 +14,3 @@ export async function createUserSpace(): Promise { } } } - -export function getResourcePath() { - let appPath = join(app.getAppPath(), '..', 'app.asar.unpacked') - - if (!app.isPackaged) { - // for development mode - appPath = join(__dirname, '..', '..') - } - return appPath -} diff --git a/electron/utils/setup.ts b/electron/utils/setup.ts index 887c3c2b7..01b0b31da 100644 --- a/electron/utils/setup.ts +++ b/electron/utils/setup.ts @@ -1,9 +1,9 @@ import { app } from 'electron' export const setupCore = async () => { - 
// Setup core api for main process - global.core = { - // Define appPath function for app to retrieve app path globaly - appPath: () => app.getPath('userData') - } -} \ No newline at end of file + // Setup core api for main process + global.core = { + // Define appPath function for app to retrieve app path globaly + appPath: () => app.getPath('userData'), + } +} diff --git a/electron/utils/versionDiff.ts b/electron/utils/versionDiff.ts deleted file mode 100644 index 25934e87f..000000000 --- a/electron/utils/versionDiff.ts +++ /dev/null @@ -1,21 +0,0 @@ -export const compareSemanticVersions = (a: string, b: string) => { - - // 1. Split the strings into their parts. - const a1 = a.split('.'); - const b1 = b.split('.'); - // 2. Contingency in case there's a 4th or 5th version - const len = Math.min(a1.length, b1.length); - // 3. Look through each version number and compare. - for (let i = 0; i < len; i++) { - const a2 = +a1[ i ] || 0; - const b2 = +b1[ i ] || 0; - - if (a2 !== b2) { - return a2 > b2 ? 1 : -1; - } - } - - // 4. 
We hit this if the all checked versions so far are equal - // - return b1.length - a1.length; -}; \ No newline at end of file diff --git a/extensions/assistant-extension/package.json b/extensions/assistant-extension/package.json index 84bcdf47e..baa858655 100644 --- a/extensions/assistant-extension/package.json +++ b/extensions/assistant-extension/package.json @@ -1,16 +1,17 @@ { "name": "@janhq/assistant-extension", - "version": "1.0.0", + "version": "1.0.1", "description": "This extension enables assistants, including Jan, a default assistant that can call all downloaded models", "main": "dist/index.js", "node": "dist/node/index.js", "author": "Jan ", "license": "AGPL-3.0", "scripts": { - "build": "tsc --module commonjs && rollup -c rollup.config.ts", - "build:publish:linux": "rimraf *.tgz --glob && npm run build && npm pack && cpx *.tgz ../../electron/pre-install", - "build:publish:darwin": "rimraf *.tgz --glob && npm run build && ../../.github/scripts/auto-sign.sh && npm pack && cpx *.tgz ../../electron/pre-install", - "build:publish:win32": "rimraf *.tgz --glob && npm run build && npm pack && cpx *.tgz ../../electron/pre-install", + "clean:modules": "rimraf node_modules/pdf-parse/test && cd node_modules/pdf-parse/lib/pdf.js && rimraf v1.9.426 v1.10.88 v2.0.550", + "build": "yarn clean:modules && tsc --module commonjs && rollup -c rollup.config.ts", + "build:publish:linux": "rimraf *.tgz --glob && npm run build && npm pack && cpx *.tgz ../../pre-install", + "build:publish:darwin": "rimraf *.tgz --glob && npm run build && ../../.github/scripts/auto-sign.sh && npm pack && cpx *.tgz ../../pre-install", + "build:publish:win32": "rimraf *.tgz --glob && npm run build && npm pack && cpx *.tgz ../../pre-install", "build:publish": "run-script-os" }, "devDependencies": { @@ -25,7 +26,7 @@ "rollup-plugin-define": "^1.0.1", "rollup-plugin-sourcemaps": "^0.6.3", "rollup-plugin-typescript2": "^0.36.0", - "typescript": "^5.3.3", + "typescript": "^5.2.2", "run-script-os": 
"^1.1.6" }, "dependencies": { @@ -44,9 +45,6 @@ ], "bundleDependencies": [ "@janhq/core", - "@langchain/community", - "hnswlib-node", - "langchain", - "pdf-parse" + "hnswlib-node" ] } diff --git a/extensions/assistant-extension/rollup.config.ts b/extensions/assistant-extension/rollup.config.ts index 7916ef9c8..d3c39cab2 100644 --- a/extensions/assistant-extension/rollup.config.ts +++ b/extensions/assistant-extension/rollup.config.ts @@ -1,22 +1,22 @@ -import resolve from "@rollup/plugin-node-resolve"; -import commonjs from "@rollup/plugin-commonjs"; -import sourceMaps from "rollup-plugin-sourcemaps"; -import typescript from "rollup-plugin-typescript2"; -import json from "@rollup/plugin-json"; -import replace from "@rollup/plugin-replace"; +import resolve from '@rollup/plugin-node-resolve' +import commonjs from '@rollup/plugin-commonjs' +import sourceMaps from 'rollup-plugin-sourcemaps' +import typescript from 'rollup-plugin-typescript2' +import json from '@rollup/plugin-json' +import replace from '@rollup/plugin-replace' -const packageJson = require("./package.json"); +const packageJson = require('./package.json') -const pkg = require("./package.json"); +const pkg = require('./package.json') export default [ { input: `src/index.ts`, - output: [{ file: pkg.main, format: "es", sourcemap: true }], + output: [{ file: pkg.main, format: 'es', sourcemap: true }], // Indicate here external modules you don't wanna include in your bundle (i.e.: 'lodash') external: [], watch: { - include: "src/**", + include: 'src/**', }, plugins: [ replace({ @@ -35,7 +35,7 @@ export default [ // which external modules to include in the bundle // https://github.com/rollup/rollup-plugin-node-resolve#usage resolve({ - extensions: [".js", ".ts", ".svelte"], + extensions: ['.js', '.ts', '.svelte'], }), // Resolve source maps to the original source @@ -44,18 +44,11 @@ export default [ }, { input: `src/node/index.ts`, - output: [{ dir: "dist/node", format: "cjs", sourcemap: false }], + output: [{ 
dir: 'dist/node', format: 'cjs', sourcemap: false }], // Indicate here external modules you don't wanna include in your bundle (i.e.: 'lodash') - external: [ - "@janhq/core/node", - "@langchain/community", - "langchain", - "langsmith", - "path", - "hnswlib-node", - ], + external: ['@janhq/core/node', 'path', 'hnswlib-node'], watch: { - include: "src/node/**", + include: 'src/node/**', }, // inlineDynamicImports: true, plugins: [ @@ -71,11 +64,11 @@ export default [ // which external modules to include in the bundle // https://github.com/rollup/rollup-plugin-node-resolve#usage resolve({ - extensions: [".ts", ".js", ".json"], + extensions: ['.ts', '.js', '.json'], }), // Resolve source maps to the original source // sourceMaps(), ], }, -]; +] diff --git a/extensions/assistant-extension/src/@types/global.d.ts b/extensions/assistant-extension/src/@types/global.d.ts index dc11709a4..bc97157cd 100644 --- a/extensions/assistant-extension/src/@types/global.d.ts +++ b/extensions/assistant-extension/src/@types/global.d.ts @@ -1,3 +1,3 @@ -declare const NODE: string; -declare const EXTENSION_NAME: string; -declare const VERSION: string; +declare const NODE: string +declare const EXTENSION_NAME: string +declare const VERSION: string diff --git a/extensions/assistant-extension/src/index.ts b/extensions/assistant-extension/src/index.ts index 6495ea786..0a5319c8a 100644 --- a/extensions/assistant-extension/src/index.ts +++ b/extensions/assistant-extension/src/index.ts @@ -9,143 +9,169 @@ import { joinPath, executeOnMain, AssistantExtension, -} from "@janhq/core"; + AssistantEvent, +} from '@janhq/core' export default class JanAssistantExtension extends AssistantExtension { - private static readonly _homeDir = "file://assistants"; + private static readonly _homeDir = 'file://assistants' + private static readonly _threadDir = 'file://threads' - controller = new AbortController(); - isCancelled = false; - retrievalThreadId: string | undefined = undefined; + controller = new 
AbortController() + isCancelled = false + retrievalThreadId: string | undefined = undefined async onLoad() { // making the assistant directory const assistantDirExist = await fs.existsSync( - JanAssistantExtension._homeDir, - ); + JanAssistantExtension._homeDir + ) if ( localStorage.getItem(`${EXTENSION_NAME}-version`) !== VERSION || !assistantDirExist ) { - if (!assistantDirExist) - await fs.mkdirSync(JanAssistantExtension._homeDir); + if (!assistantDirExist) await fs.mkdirSync(JanAssistantExtension._homeDir) // Write assistant metadata - this.createJanAssistant(); + await this.createJanAssistant() // Finished migration - localStorage.setItem(`${EXTENSION_NAME}-version`, VERSION); + localStorage.setItem(`${EXTENSION_NAME}-version`, VERSION) + // Update the assistant list + events.emit(AssistantEvent.OnAssistantsUpdate, {}) } // Events subscription events.on(MessageEvent.OnMessageSent, (data: MessageRequest) => - JanAssistantExtension.handleMessageRequest(data, this), - ); + JanAssistantExtension.handleMessageRequest(data, this) + ) events.on(InferenceEvent.OnInferenceStopped, () => { - JanAssistantExtension.handleInferenceStopped(this); - }); + JanAssistantExtension.handleInferenceStopped(this) + }) } private static async handleInferenceStopped(instance: JanAssistantExtension) { - instance.isCancelled = true; - instance.controller?.abort(); + instance.isCancelled = true + instance.controller?.abort() } private static async handleMessageRequest( data: MessageRequest, - instance: JanAssistantExtension, + instance: JanAssistantExtension ) { - instance.isCancelled = false; - instance.controller = new AbortController(); + instance.isCancelled = false + instance.controller = new AbortController() if ( data.model?.engine !== InferenceEngine.tool_retrieval_enabled || !data.messages || + // TODO: Since the engine is defined, its unsafe to assume that assistant tools are defined + // That could lead to an issue where thread stuck at generating response 
!data.thread?.assistants[0]?.tools ) { - return; + return } - const latestMessage = data.messages[data.messages.length - 1]; + const latestMessage = data.messages[data.messages.length - 1] - // Ingest the document if needed + // 1. Ingest the document if needed if ( latestMessage && latestMessage.content && - typeof latestMessage.content !== "string" + typeof latestMessage.content !== 'string' && + latestMessage.content.length > 1 ) { - const docFile = latestMessage.content[1]?.doc_url?.url; + const docFile = latestMessage.content[1]?.doc_url?.url if (docFile) { await executeOnMain( NODE, - "toolRetrievalIngestNewDocument", + 'toolRetrievalIngestNewDocument', docFile, - data.model?.proxyEngine, - ); + data.model?.proxyEngine + ) } + } else if ( + // Check whether we need to ingest document or not + // Otherwise wrong context will be sent + !(await fs.existsSync( + await joinPath([ + JanAssistantExtension._threadDir, + data.threadId, + 'memory', + ]) + )) + ) { + // No document ingested, reroute the result to inference engine + const output = { + ...data, + model: { + ...data.model, + engine: data.model.proxyEngine, + }, + } + events.emit(MessageEvent.OnMessageSent, output) + return } - - // Load agent on thread changed + // 2. Load agent on thread changed if (instance.retrievalThreadId !== data.threadId) { - await executeOnMain(NODE, "toolRetrievalLoadThreadMemory", data.threadId); + await executeOnMain(NODE, 'toolRetrievalLoadThreadMemory', data.threadId) - instance.retrievalThreadId = data.threadId; + instance.retrievalThreadId = data.threadId // Update the text splitter await executeOnMain( NODE, - "toolRetrievalUpdateTextSplitter", + 'toolRetrievalUpdateTextSplitter', data.thread.assistants[0].tools[0]?.settings?.chunk_size ?? 4000, - data.thread.assistants[0].tools[0]?.settings?.chunk_overlap ?? 200, - ); + data.thread.assistants[0].tools[0]?.settings?.chunk_overlap ?? 200 + ) } + // 3. 
Using the retrieval template with the result and query if (latestMessage.content) { const prompt = - typeof latestMessage.content === "string" + typeof latestMessage.content === 'string' ? latestMessage.content - : latestMessage.content[0].text; + : latestMessage.content[0].text // Retrieve the result - console.debug("toolRetrievalQuery", latestMessage.content); const retrievalResult = await executeOnMain( NODE, - "toolRetrievalQueryResult", - prompt, - ); + 'toolRetrievalQueryResult', + prompt + ) + console.debug('toolRetrievalQueryResult', retrievalResult) - // Update the message content - // Using the retrieval template with the result and query - if (data.thread?.assistants[0].tools) + // Update message content + if (data.thread?.assistants[0]?.tools && retrievalResult) data.messages[data.messages.length - 1].content = data.thread.assistants[0].tools[0].settings?.retrieval_template - ?.replace("{CONTEXT}", retrievalResult) - .replace("{QUESTION}", prompt); + ?.replace('{CONTEXT}', retrievalResult) + .replace('{QUESTION}', prompt) } // Filter out all the messages that are not text data.messages = data.messages.map((message) => { if ( message.content && - typeof message.content !== "string" && + typeof message.content !== 'string' && (message.content.length ?? 0) > 0 ) { return { ...message, content: [message.content[0]], - }; + } } - return message; - }); + return message + }) - // Reroute the result to inference engine + // 4. 
Reroute the result to inference engine const output = { ...data, model: { ...data.model, engine: data.model.proxyEngine, }, - }; - events.emit(MessageEvent.OnMessageSent, output); + } + events.emit(MessageEvent.OnMessageSent, output) } /** @@ -157,107 +183,107 @@ export default class JanAssistantExtension extends AssistantExtension { const assistantDir = await joinPath([ JanAssistantExtension._homeDir, assistant.id, - ]); - if (!(await fs.existsSync(assistantDir))) await fs.mkdirSync(assistantDir); + ]) + if (!(await fs.existsSync(assistantDir))) await fs.mkdirSync(assistantDir) // store the assistant metadata json const assistantMetadataPath = await joinPath([ assistantDir, - "assistant.json", - ]); + 'assistant.json', + ]) try { await fs.writeFileSync( assistantMetadataPath, - JSON.stringify(assistant, null, 2), - ); + JSON.stringify(assistant, null, 2) + ) } catch (err) { - console.error(err); + console.error(err) } } async getAssistants(): Promise { // get all the assistant directories // get all the assistant metadata json - const results: Assistant[] = []; + const results: Assistant[] = [] const allFileName: string[] = await fs.readdirSync( - JanAssistantExtension._homeDir, - ); + JanAssistantExtension._homeDir + ) for (const fileName of allFileName) { const filePath = await joinPath([ JanAssistantExtension._homeDir, fileName, - ]); + ]) - if (filePath.includes(".DS_Store")) continue; + if (filePath.includes('.DS_Store')) continue const jsonFiles: string[] = (await fs.readdirSync(filePath)).filter( - (file: string) => file === "assistant.json", - ); + (file: string) => file === 'assistant.json' + ) if (jsonFiles.length !== 1) { // has more than one assistant file -> ignore - continue; + continue } const content = await fs.readFileSync( await joinPath([filePath, jsonFiles[0]]), - "utf-8", - ); + 'utf-8' + ) const assistant: Assistant = - typeof content === "object" ? content : JSON.parse(content); + typeof content === 'object' ? 
content : JSON.parse(content) - results.push(assistant); + results.push(assistant) } - return results; + return results } async deleteAssistant(assistant: Assistant): Promise { - if (assistant.id === "jan") { - return Promise.reject("Cannot delete Jan Assistant"); + if (assistant.id === 'jan') { + return Promise.reject('Cannot delete Jan Assistant') } // remove the directory const assistantDir = await joinPath([ JanAssistantExtension._homeDir, assistant.id, - ]); - await fs.rmdirSync(assistantDir); - return Promise.resolve(); + ]) + await fs.rmdirSync(assistantDir) + return Promise.resolve() } private async createJanAssistant(): Promise { const janAssistant: Assistant = { - avatar: "", + avatar: '', thread_location: undefined, - id: "jan", - object: "assistant", + id: 'jan', + object: 'assistant', created_at: Date.now(), - name: "Jan", - description: "A default assistant that can use all downloaded models", - model: "*", - instructions: "", + name: 'Jan', + description: 'A default assistant that can use all downloaded models', + model: '*', + instructions: '', tools: [ { - type: "retrieval", + type: 'retrieval', enabled: false, settings: { top_k: 2, chunk_size: 1024, chunk_overlap: 64, retrieval_template: `Use the following pieces of context to answer the question at the end. If you don't know the answer, just say that you don't know, don't try to make up an answer. 
- ---------------- - CONTEXT: {CONTEXT} - ---------------- - QUESTION: {QUESTION} - ---------------- - Helpful Answer:`, +---------------- +CONTEXT: {CONTEXT} +---------------- +QUESTION: {QUESTION} +---------------- +Helpful Answer:`, }, }, ], file_ids: [], metadata: undefined, - }; + } - await this.createAssistant(janAssistant); + await this.createAssistant(janAssistant) } } diff --git a/extensions/assistant-extension/src/node/engine.ts b/extensions/assistant-extension/src/node/engine.ts index 54b2a6ba1..70d02af1f 100644 --- a/extensions/assistant-extension/src/node/engine.ts +++ b/extensions/assistant-extension/src/node/engine.ts @@ -1,13 +1,13 @@ -import fs from "fs"; -import path from "path"; -import { getJanDataFolderPath } from "@janhq/core/node"; +import fs from 'fs' +import path from 'path' +import { getJanDataFolderPath } from '@janhq/core/node' // Sec: Do not send engine settings over requests // Read it manually instead export const readEmbeddingEngine = (engineName: string) => { const engineSettings = fs.readFileSync( - path.join(getJanDataFolderPath(), "engines", `${engineName}.json`), - "utf-8", - ); - return JSON.parse(engineSettings); -}; + path.join(getJanDataFolderPath(), 'engines', `${engineName}.json`), + 'utf-8' + ) + return JSON.parse(engineSettings) +} diff --git a/extensions/assistant-extension/src/node/index.ts b/extensions/assistant-extension/src/node/index.ts index 95a7243a4..d52a4b23e 100644 --- a/extensions/assistant-extension/src/node/index.ts +++ b/extensions/assistant-extension/src/node/index.ts @@ -1,39 +1,39 @@ -import { getJanDataFolderPath, normalizeFilePath } from "@janhq/core/node"; -import { Retrieval } from "./tools/retrieval"; -import path from "path"; +import { getJanDataFolderPath, normalizeFilePath } from '@janhq/core/node' +import { retrieval } from './tools/retrieval' +import path from 'path' -const retrieval = new Retrieval(); - -export async function toolRetrievalUpdateTextSplitter( +export function 
toolRetrievalUpdateTextSplitter( chunkSize: number, - chunkOverlap: number, + chunkOverlap: number ) { - retrieval.updateTextSplitter(chunkSize, chunkOverlap); - return Promise.resolve(); + retrieval.updateTextSplitter(chunkSize, chunkOverlap) } export async function toolRetrievalIngestNewDocument( file: string, - engine: string, + engine: string ) { - const filePath = path.join(getJanDataFolderPath(), normalizeFilePath(file)); - const threadPath = path.dirname(filePath.replace("files", "")); - retrieval.updateEmbeddingEngine(engine); - await retrieval.ingestAgentKnowledge(filePath, `${threadPath}/memory`); - return Promise.resolve(); + const filePath = path.join(getJanDataFolderPath(), normalizeFilePath(file)) + const threadPath = path.dirname(filePath.replace('files', '')) + retrieval.updateEmbeddingEngine(engine) + return retrieval + .ingestAgentKnowledge(filePath, `${threadPath}/memory`) + .catch((err) => { + console.error(err) + }) } export async function toolRetrievalLoadThreadMemory(threadId: string) { - try { - await retrieval.loadRetrievalAgent( - path.join(getJanDataFolderPath(), "threads", threadId, "memory"), - ); - return Promise.resolve(); - } catch (err) { - console.debug(err); - } + return retrieval + .loadRetrievalAgent( + path.join(getJanDataFolderPath(), 'threads', threadId, 'memory') + ) + .catch((err) => { + console.error(err) + }) } export async function toolRetrievalQueryResult(query: string) { - const res = await retrieval.generateResult(query); - return Promise.resolve(res); + return retrieval.generateResult(query).catch((err) => { + console.error(err) + }) } diff --git a/extensions/assistant-extension/src/node/tools/retrieval/index.ts b/extensions/assistant-extension/src/node/tools/retrieval/index.ts index 8c7a6aa2b..e58ec0c46 100644 --- a/extensions/assistant-extension/src/node/tools/retrieval/index.ts +++ b/extensions/assistant-extension/src/node/tools/retrieval/index.ts @@ -1,77 +1,80 @@ -import { RecursiveCharacterTextSplitter } from 
"langchain/text_splitter"; -import { formatDocumentsAsString } from "langchain/util/document"; -import { PDFLoader } from "langchain/document_loaders/fs/pdf"; +import { RecursiveCharacterTextSplitter } from 'langchain/text_splitter' +import { formatDocumentsAsString } from 'langchain/util/document' +import { PDFLoader } from 'langchain/document_loaders/fs/pdf' -import { HNSWLib } from "langchain/vectorstores/hnswlib"; +import { HNSWLib } from 'langchain/vectorstores/hnswlib' -import { OpenAIEmbeddings } from "langchain/embeddings/openai"; -import { readEmbeddingEngine } from "../../engine"; +import { OpenAIEmbeddings } from 'langchain/embeddings/openai' +import { readEmbeddingEngine } from '../../engine' export class Retrieval { - public chunkSize: number = 100; - public chunkOverlap?: number = 0; - private retriever: any; + public chunkSize: number = 100 + public chunkOverlap?: number = 0 + private retriever: any - private embeddingModel?: OpenAIEmbeddings = undefined; - private textSplitter?: RecursiveCharacterTextSplitter; + private embeddingModel?: OpenAIEmbeddings = undefined + private textSplitter?: RecursiveCharacterTextSplitter constructor(chunkSize: number = 4000, chunkOverlap: number = 200) { - this.updateTextSplitter(chunkSize, chunkOverlap); + this.updateTextSplitter(chunkSize, chunkOverlap) } public updateTextSplitter(chunkSize: number, chunkOverlap: number): void { - this.chunkSize = chunkSize; - this.chunkOverlap = chunkOverlap; + this.chunkSize = chunkSize + this.chunkOverlap = chunkOverlap this.textSplitter = new RecursiveCharacterTextSplitter({ chunkSize: chunkSize, chunkOverlap: chunkOverlap, - }); + }) } public updateEmbeddingEngine(engine: string): void { // Engine settings are not compatible with the current embedding model params // Switch case manually for now - const settings = readEmbeddingEngine(engine); - if (engine === "nitro") { + const settings = readEmbeddingEngine(engine) + if (engine === 'nitro') { this.embeddingModel = new 
OpenAIEmbeddings( - { openAIApiKey: "nitro-embedding" }, - { basePath: "http://127.0.0.1:3928/v1" }, - ); + { openAIApiKey: 'nitro-embedding' }, + // TODO: Raw settings + { basePath: 'http://127.0.0.1:3928/v1' } + ) } else { // Fallback to OpenAI Settings this.embeddingModel = new OpenAIEmbeddings({ openAIApiKey: settings.api_key, - }); + }) } } public ingestAgentKnowledge = async ( filePath: string, - memoryPath: string, + memoryPath: string ): Promise => { const loader = new PDFLoader(filePath, { splitPages: true, - }); - if (!this.embeddingModel) return Promise.reject(); - const doc = await loader.load(); - const docs = await this.textSplitter!.splitDocuments(doc); - const vectorStore = await HNSWLib.fromDocuments(docs, this.embeddingModel); - return vectorStore.save(memoryPath); - }; + }) + if (!this.embeddingModel) return Promise.reject() + const doc = await loader.load() + const docs = await this.textSplitter!.splitDocuments(doc) + const vectorStore = await HNSWLib.fromDocuments(docs, this.embeddingModel) + return vectorStore.save(memoryPath) + } public loadRetrievalAgent = async (memoryPath: string): Promise => { - if (!this.embeddingModel) return Promise.reject(); - const vectorStore = await HNSWLib.load(memoryPath, this.embeddingModel); - this.retriever = vectorStore.asRetriever(2); - return Promise.resolve(); - }; + if (!this.embeddingModel) return Promise.reject() + const vectorStore = await HNSWLib.load(memoryPath, this.embeddingModel) + this.retriever = vectorStore.asRetriever(2) + return Promise.resolve() + } public generateResult = async (query: string): Promise => { if (!this.retriever) { - return Promise.resolve(" "); + return Promise.resolve(' ') } - const relevantDocs = await this.retriever.getRelevantDocuments(query); - const serializedDoc = formatDocumentsAsString(relevantDocs); - return Promise.resolve(serializedDoc); - }; + const relevantDocs = await this.retriever.getRelevantDocuments(query) + const serializedDoc = 
formatDocumentsAsString(relevantDocs) + return Promise.resolve(serializedDoc) + } } + +export const retrieval = new Retrieval() diff --git a/extensions/assistant-extension/tsconfig.json b/extensions/assistant-extension/tsconfig.json index d3794cace..e425358c3 100644 --- a/extensions/assistant-extension/tsconfig.json +++ b/extensions/assistant-extension/tsconfig.json @@ -14,7 +14,7 @@ "outDir": "dist", "importHelpers": true, "typeRoots": ["node_modules/@types"], - "skipLibCheck": true, + "skipLibCheck": true }, - "include": ["src"], + "include": ["src"] } diff --git a/extensions/conversational-extension/.prettierrc b/extensions/conversational-extension/.prettierrc deleted file mode 100644 index 46f1abcb0..000000000 --- a/extensions/conversational-extension/.prettierrc +++ /dev/null @@ -1,8 +0,0 @@ -{ - "semi": false, - "singleQuote": true, - "quoteProps": "consistent", - "trailingComma": "es5", - "endOfLine": "auto", - "plugins": ["prettier-plugin-tailwindcss"] -} diff --git a/extensions/conversational-extension/package.json b/extensions/conversational-extension/package.json index a60c12339..8a6da14e5 100644 --- a/extensions/conversational-extension/package.json +++ b/extensions/conversational-extension/package.json @@ -7,7 +7,7 @@ "license": "MIT", "scripts": { "build": "tsc -b . 
&& webpack --config webpack.config.js", - "build:publish": "rimraf *.tgz --glob && npm run build && npm pack && cpx *.tgz ../../electron/pre-install" + "build:publish": "rimraf *.tgz --glob && npm run build && npm pack && cpx *.tgz ../../pre-install" }, "exports": { ".": "./dist/index.js", @@ -17,12 +17,12 @@ "cpx": "^1.5.0", "rimraf": "^3.0.2", "webpack": "^5.88.2", - "webpack-cli": "^5.1.4" + "webpack-cli": "^5.1.4", + "ts-loader": "^9.5.0" }, "dependencies": { "@janhq/core": "file:../../core", - "path-browserify": "^1.0.1", - "ts-loader": "^9.5.0" + "path-browserify": "^1.0.1" }, "engines": { "node": ">=18.0.0" diff --git a/extensions/conversational-extension/webpack.config.js b/extensions/conversational-extension/webpack.config.js index 36e338295..a3eb873d7 100644 --- a/extensions/conversational-extension/webpack.config.js +++ b/extensions/conversational-extension/webpack.config.js @@ -1,27 +1,27 @@ -const path = require("path"); -const webpack = require("webpack"); +const path = require('path') +const webpack = require('webpack') module.exports = { experiments: { outputModule: true }, - entry: "./src/index.ts", // Adjust the entry point to match your project's main file - mode: "production", + entry: './src/index.ts', // Adjust the entry point to match your project's main file + mode: 'production', module: { rules: [ { test: /\.tsx?$/, - use: "ts-loader", + use: 'ts-loader', exclude: /node_modules/, }, ], }, output: { - filename: "index.js", // Adjust the output file name as needed - path: path.resolve(__dirname, "dist"), - library: { type: "module" }, // Specify ESM output format + filename: 'index.js', // Adjust the output file name as needed + path: path.resolve(__dirname, 'dist'), + library: { type: 'module' }, // Specify ESM output format }, plugins: [new webpack.DefinePlugin({})], resolve: { - extensions: [".ts", ".js"], + extensions: ['.ts', '.js'], fallback: { path: require.resolve('path-browserify'), }, @@ -31,4 +31,4 @@ module.exports = { minimize: 
false, }, // Add loaders and other configuration as needed for your project -}; +} diff --git a/extensions/inference-nitro-extension/README.md b/extensions/inference-nitro-extension/README.md index 455783efb..f499e0b9c 100644 --- a/extensions/inference-nitro-extension/README.md +++ b/extensions/inference-nitro-extension/README.md @@ -64,10 +64,10 @@ There are a few things to keep in mind when writing your plugin code: In `index.ts`, you will see that the extension function will return a `Promise`. ```typescript - import { core } from "@janhq/core"; + import { core } from '@janhq/core' function onStart(): Promise { - return core.invokePluginFunc(MODULE_PATH, "run", 0); + return core.invokePluginFunc(MODULE_PATH, 'run', 0) } ``` @@ -75,4 +75,3 @@ There are a few things to keep in mind when writing your plugin code: [documentation](https://github.com/janhq/jan/blob/main/core/README.md). So, what are you waiting for? Go ahead and start customizing your plugin! - diff --git a/extensions/inference-nitro-extension/bin/version.txt b/extensions/inference-nitro-extension/bin/version.txt index c2c0004f0..0b9c01996 100644 --- a/extensions/inference-nitro-extension/bin/version.txt +++ b/extensions/inference-nitro-extension/bin/version.txt @@ -1 +1 @@ -0.3.5 +0.3.12 diff --git a/extensions/inference-nitro-extension/download.bat b/extensions/inference-nitro-extension/download.bat index 22e1c85b3..2ef3165c1 100644 --- a/extensions/inference-nitro-extension/download.bat +++ b/extensions/inference-nitro-extension/download.bat @@ -1,3 +1,3 @@ @echo off set /p NITRO_VERSION=<./bin/version.txt -.\node_modules\.bin\download https://github.com/janhq/nitro/releases/download/v%NITRO_VERSION%/nitro-%NITRO_VERSION%-win-amd64-cuda-12-0.tar.gz -e --strip 1 -o ./bin/win-cuda-12-0 && .\node_modules\.bin\download https://github.com/janhq/nitro/releases/download/v%NITRO_VERSION%/nitro-%NITRO_VERSION%-win-amd64-cuda-11-7.tar.gz -e --strip 1 -o ./bin/win-cuda-11-7 && .\node_modules\.bin\download 
https://github.com/janhq/nitro/releases/download/v%NITRO_VERSION%/nitro-%NITRO_VERSION%-win-amd64.tar.gz -e --strip 1 -o ./bin/win-cpu +.\node_modules\.bin\download https://github.com/janhq/nitro/releases/download/v%NITRO_VERSION%/nitro-%NITRO_VERSION%-win-amd64-cuda-12-0.tar.gz -e --strip 1 -o ./bin/win-cuda-12-0 && .\node_modules\.bin\download https://github.com/janhq/nitro/releases/download/v%NITRO_VERSION%/nitro-%NITRO_VERSION%-win-amd64-cuda-11-7.tar.gz -e --strip 1 -o ./bin/win-cuda-11-7 && .\node_modules\.bin\download https://github.com/janhq/nitro/releases/download/v%NITRO_VERSION%/nitro-%NITRO_VERSION%-win-amd64.tar.gz -e --strip 1 -o ./bin/win-cpu && .\node_modules\.bin\download https://github.com/janhq/nitro/releases/download/v%NITRO_VERSION%/nitro-%NITRO_VERSION%-win-amd64-vulkan.tar.gz -e --strip 1 -o ./bin/win-vulkan && .\node_modules\.bin\download https://delta.jan.ai/vulkaninfoSDK.exe -o ./bin diff --git a/extensions/inference-nitro-extension/package.json b/extensions/inference-nitro-extension/package.json index 8ad516ad9..ba6b473eb 100644 --- a/extensions/inference-nitro-extension/package.json +++ b/extensions/inference-nitro-extension/package.json @@ -8,13 +8,13 @@ "license": "AGPL-3.0", "scripts": { "build": "tsc --module commonjs && rollup -c rollup.config.ts", - "downloadnitro:linux": "NITRO_VERSION=$(cat ./bin/version.txt) && download https://github.com/janhq/nitro/releases/download/v${NITRO_VERSION}/nitro-${NITRO_VERSION}-linux-amd64.tar.gz -e --strip 1 -o ./bin/linux-cpu && chmod +x ./bin/linux-cpu/nitro && download https://github.com/janhq/nitro/releases/download/v${NITRO_VERSION}/nitro-${NITRO_VERSION}-linux-amd64-cuda-12-0.tar.gz -e --strip 1 -o ./bin/linux-cuda-12-0 && chmod +x ./bin/linux-cuda-12-0/nitro && download https://github.com/janhq/nitro/releases/download/v${NITRO_VERSION}/nitro-${NITRO_VERSION}-linux-amd64-cuda-11-7.tar.gz -e --strip 1 -o ./bin/linux-cuda-11-7 && chmod +x ./bin/linux-cuda-11-7/nitro", + "downloadnitro:linux": 
"NITRO_VERSION=$(cat ./bin/version.txt) && download https://github.com/janhq/nitro/releases/download/v${NITRO_VERSION}/nitro-${NITRO_VERSION}-linux-amd64.tar.gz -e --strip 1 -o ./bin/linux-cpu && chmod +x ./bin/linux-cpu/nitro && download https://github.com/janhq/nitro/releases/download/v${NITRO_VERSION}/nitro-${NITRO_VERSION}-linux-amd64-cuda-12-0.tar.gz -e --strip 1 -o ./bin/linux-cuda-12-0 && chmod +x ./bin/linux-cuda-12-0/nitro && download https://github.com/janhq/nitro/releases/download/v${NITRO_VERSION}/nitro-${NITRO_VERSION}-linux-amd64-cuda-11-7.tar.gz -e --strip 1 -o ./bin/linux-cuda-11-7 && chmod +x ./bin/linux-cuda-11-7/nitro && download https://github.com/janhq/nitro/releases/download/v${NITRO_VERSION}/nitro-${NITRO_VERSION}-linux-amd64-vulkan.tar.gz -e --strip 1 -o ./bin/linux-vulkan && chmod +x ./bin/linux-vulkan/nitro && download https://delta.jan.ai/vulkaninfo -o ./bin && chmod +x ./bin/vulkaninfo", "downloadnitro:darwin": "NITRO_VERSION=$(cat ./bin/version.txt) && download https://github.com/janhq/nitro/releases/download/v${NITRO_VERSION}/nitro-${NITRO_VERSION}-mac-arm64.tar.gz -e --strip 1 -o ./bin/mac-arm64 && chmod +x ./bin/mac-arm64/nitro && download https://github.com/janhq/nitro/releases/download/v${NITRO_VERSION}/nitro-${NITRO_VERSION}-mac-amd64.tar.gz -e --strip 1 -o ./bin/mac-x64 && chmod +x ./bin/mac-x64/nitro", "downloadnitro:win32": "download.bat", "downloadnitro": "run-script-os", - "build:publish:darwin": "rimraf *.tgz --glob && npm run build && npm run downloadnitro && ../../.github/scripts/auto-sign.sh && cpx \"bin/**\" \"dist/bin\" && npm pack && cpx *.tgz ../../electron/pre-install", - "build:publish:win32": "rimraf *.tgz --glob && npm run build && npm run downloadnitro && cpx \"bin/**\" \"dist/bin\" && npm pack && cpx *.tgz ../../electron/pre-install", - "build:publish:linux": "rimraf *.tgz --glob && npm run build && npm run downloadnitro && cpx \"bin/**\" \"dist/bin\" && npm pack && cpx *.tgz ../../electron/pre-install", + 
"build:publish:darwin": "rimraf *.tgz --glob && npm run build && npm run downloadnitro && ../../.github/scripts/auto-sign.sh && cpx \"bin/**\" \"dist/bin\" && npm pack && cpx *.tgz ../../pre-install", + "build:publish:win32": "rimraf *.tgz --glob && npm run build && npm run downloadnitro && cpx \"bin/**\" \"dist/bin\" && npm pack && cpx *.tgz ../../pre-install", + "build:publish:linux": "rimraf *.tgz --glob && npm run build && npm run downloadnitro && cpx \"bin/**\" \"dist/bin\" && npm pack && cpx *.tgz ../../pre-install", "build:publish": "run-script-os" }, "exports": { @@ -35,12 +35,12 @@ "rollup-plugin-sourcemaps": "^0.6.3", "rollup-plugin-typescript2": "^0.36.0", "run-script-os": "^1.1.6", - "typescript": "^5.2.2" + "typescript": "^5.2.2", + "@types/os-utils": "^0.0.4", + "@rollup/plugin-replace": "^5.0.5" }, "dependencies": { "@janhq/core": "file:../../core", - "@rollup/plugin-replace": "^5.0.5", - "@types/os-utils": "^0.0.4", "fetch-retry": "^5.0.6", "path-browserify": "^1.0.1", "rxjs": "^7.8.1", diff --git a/extensions/inference-nitro-extension/rollup.config.ts b/extensions/inference-nitro-extension/rollup.config.ts index 77a9fb208..ec8943f9c 100644 --- a/extensions/inference-nitro-extension/rollup.config.ts +++ b/extensions/inference-nitro-extension/rollup.config.ts @@ -1,34 +1,34 @@ -import resolve from "@rollup/plugin-node-resolve"; -import commonjs from "@rollup/plugin-commonjs"; -import sourceMaps from "rollup-plugin-sourcemaps"; -import typescript from "rollup-plugin-typescript2"; -import json from "@rollup/plugin-json"; -import replace from "@rollup/plugin-replace"; -const packageJson = require("./package.json"); +import resolve from '@rollup/plugin-node-resolve' +import commonjs from '@rollup/plugin-commonjs' +import sourceMaps from 'rollup-plugin-sourcemaps' +import typescript from 'rollup-plugin-typescript2' +import json from '@rollup/plugin-json' +import replace from '@rollup/plugin-replace' +const packageJson = require('./package.json') -const 
pkg = require("./package.json"); +const pkg = require('./package.json') export default [ { input: `src/index.ts`, - output: [{ file: pkg.main, format: "es", sourcemap: true }], + output: [{ file: pkg.main, format: 'es', sourcemap: true }], // Indicate here external modules you don't wanna include in your bundle (i.e.: 'lodash') external: [], watch: { - include: "src/**", + include: 'src/**', }, plugins: [ replace({ NODE: JSON.stringify(`${packageJson.name}/${packageJson.node}`), INFERENCE_URL: JSON.stringify( process.env.INFERENCE_URL || - "http://127.0.0.1:3928/inferences/llamacpp/chat_completion" + 'http://127.0.0.1:3928/inferences/llamacpp/chat_completion' ), TROUBLESHOOTING_URL: JSON.stringify( - "https://jan.ai/guides/troubleshooting" + 'https://jan.ai/guides/troubleshooting' ), JAN_SERVER_INFERENCE_URL: JSON.stringify( - "http://localhost:1337/v1/chat/completions" + 'http://localhost:1337/v1/chat/completions' ), }), // Allow json resolution @@ -42,7 +42,7 @@ export default [ // which external modules to include in the bundle // https://github.com/rollup/rollup-plugin-node-resolve#usage resolve({ - extensions: [".js", ".ts", ".svelte"], + extensions: ['.js', '.ts', '.svelte'], }), // Resolve source maps to the original source @@ -52,12 +52,12 @@ export default [ { input: `src/node/index.ts`, output: [ - { file: "dist/node/index.cjs.js", format: "cjs", sourcemap: true }, + { file: 'dist/node/index.cjs.js', format: 'cjs', sourcemap: true }, ], // Indicate here external modules you don't wanna include in your bundle (i.e.: 'lodash') - external: ["@janhq/core/node"], + external: ['@janhq/core/node'], watch: { - include: "src/node/**", + include: 'src/node/**', }, plugins: [ // Allow json resolution @@ -70,11 +70,11 @@ export default [ // which external modules to include in the bundle // https://github.com/rollup/rollup-plugin-node-resolve#usage resolve({ - extensions: [".ts", ".js", ".json"], + extensions: ['.ts', '.js', '.json'], }), // Resolve source maps to 
the original source sourceMaps(), ], }, -]; +] diff --git a/extensions/inference-nitro-extension/src/@types/global.d.ts b/extensions/inference-nitro-extension/src/@types/global.d.ts index 7a4fb4805..3a3d2aa32 100644 --- a/extensions/inference-nitro-extension/src/@types/global.d.ts +++ b/extensions/inference-nitro-extension/src/@types/global.d.ts @@ -1,13 +1,13 @@ -declare const NODE: string; -declare const INFERENCE_URL: string; -declare const TROUBLESHOOTING_URL: string; -declare const JAN_SERVER_INFERENCE_URL: string; +declare const NODE: string +declare const INFERENCE_URL: string +declare const TROUBLESHOOTING_URL: string +declare const JAN_SERVER_INFERENCE_URL: string /** * The response from the initModel function. * @property error - An error message if the model fails to load. */ interface ModelOperationResponse { - error?: any; - modelFile?: string; + error?: any + modelFile?: string } diff --git a/extensions/inference-nitro-extension/src/helpers/sse.ts b/extensions/inference-nitro-extension/src/helpers/sse.ts index aab260828..06176c9b9 100644 --- a/extensions/inference-nitro-extension/src/helpers/sse.ts +++ b/extensions/inference-nitro-extension/src/helpers/sse.ts @@ -1,5 +1,5 @@ -import { Model } from "@janhq/core"; -import { Observable } from "rxjs"; +import { Model } from '@janhq/core' +import { Observable } from 'rxjs' /** * Sends a request to the inference server to generate a response based on the recent messages. * @param recentMessages - An array of recent messages to use as context for the inference. @@ -17,50 +17,50 @@ export function requestInference( model: model.id, stream: true, ...model.parameters, - }); + }) fetch(inferenceUrl, { - method: "POST", + method: 'POST', headers: { - "Content-Type": "application/json", - "Access-Control-Allow-Origin": "*", - Accept: model.parameters.stream - ? 
"text/event-stream" - : "application/json", + 'Content-Type': 'application/json', + 'Access-Control-Allow-Origin': '*', + 'Accept': model.parameters.stream + ? 'text/event-stream' + : 'application/json', }, body: requestBody, signal: controller?.signal, }) .then(async (response) => { if (model.parameters.stream === false) { - const data = await response.json(); - subscriber.next(data.choices[0]?.message?.content ?? ""); + const data = await response.json() + subscriber.next(data.choices[0]?.message?.content ?? '') } else { - const stream = response.body; - const decoder = new TextDecoder("utf-8"); - const reader = stream?.getReader(); - let content = ""; + const stream = response.body + const decoder = new TextDecoder('utf-8') + const reader = stream?.getReader() + let content = '' while (true && reader) { - const { done, value } = await reader.read(); + const { done, value } = await reader.read() if (done) { - break; + break } - const text = decoder.decode(value); - const lines = text.trim().split("\n"); + const text = decoder.decode(value) + const lines = text.trim().split('\n') for (const line of lines) { - if (line.startsWith("data: ") && !line.includes("data: [DONE]")) { - const data = JSON.parse(line.replace("data: ", "")); - content += data.choices[0]?.delta?.content ?? ""; - if (content.startsWith("assistant: ")) { - content = content.replace("assistant: ", ""); + if (line.startsWith('data: ') && !line.includes('data: [DONE]')) { + const data = JSON.parse(line.replace('data: ', '')) + content += data.choices[0]?.delta?.content ?? 
'' + if (content.startsWith('assistant: ')) { + content = content.replace('assistant: ', '') } - subscriber.next(content); + subscriber.next(content) } } } } - subscriber.complete(); + subscriber.complete() }) - .catch((err) => subscriber.error(err)); - }); + .catch((err) => subscriber.error(err)) + }) } diff --git a/extensions/inference-nitro-extension/src/index.ts b/extensions/inference-nitro-extension/src/index.ts index 9e96ad93f..979b4cfac 100644 --- a/extensions/inference-nitro-extension/src/index.ts +++ b/extensions/inference-nitro-extension/src/index.ts @@ -10,6 +10,7 @@ import { ChatCompletionRole, ContentType, MessageRequest, + MessageRequestType, MessageStatus, ThreadContent, ThreadMessage, @@ -25,9 +26,10 @@ import { ModelEvent, InferenceEvent, ModelSettingParams, -} from "@janhq/core"; -import { requestInference } from "./helpers/sse"; -import { ulid } from "ulid"; + getJanDataFolderPath, +} from '@janhq/core' +import { requestInference } from './helpers/sse' +import { ulid } from 'ulid' /** * A class that implements the InferenceExtension interface from the @janhq/core package. @@ -35,16 +37,16 @@ import { ulid } from "ulid"; * It also subscribes to events emitted by the @janhq/core package and handles new message requests. */ export default class JanInferenceNitroExtension extends InferenceExtension { - private static readonly _homeDir = "file://engines"; - private static readonly _settingsDir = "file://settings"; - private static readonly _engineMetadataFileName = "nitro.json"; + private static readonly _homeDir = 'file://engines' + private static readonly _settingsDir = 'file://settings' + private static readonly _engineMetadataFileName = 'nitro.json' /** * Checking the health for Nitro's process each 5 secs. 
*/ - private static readonly _intervalHealthCheck = 5 * 1000; + private static readonly _intervalHealthCheck = 5 * 1000 - private _currentModel: Model | undefined; + private _currentModel: Model | undefined private _engineSettings: ModelSettingParams = { ctx_len: 2048, @@ -52,23 +54,22 @@ export default class JanInferenceNitroExtension extends InferenceExtension { cpu_threads: 1, cont_batching: false, embedding: true, - }; + } - controller = new AbortController(); - isCancelled = false; + controller = new AbortController() + isCancelled = false /** * The interval id for the health check. Used to stop the health check. */ - private getNitroProcesHealthIntervalId: NodeJS.Timeout | undefined = - undefined; + private getNitroProcesHealthIntervalId: NodeJS.Timeout | undefined = undefined /** * Tracking the current state of nitro process. */ - private nitroProcessInfo: any = undefined; + private nitroProcessInfo: any = undefined - private inferenceUrl = ""; + private inferenceUrl = '' /** * Subscribes to events emitted by the @janhq/core package. 
@@ -76,44 +77,40 @@ export default class JanInferenceNitroExtension extends InferenceExtension { async onLoad() { if (!(await fs.existsSync(JanInferenceNitroExtension._homeDir))) { try { - await fs.mkdirSync(JanInferenceNitroExtension._homeDir); + await fs.mkdirSync(JanInferenceNitroExtension._homeDir) } catch (e) { - console.debug(e); + console.debug(e) } } // init inference url // @ts-ignore - const electronApi = window?.electronAPI; - this.inferenceUrl = INFERENCE_URL; + const electronApi = window?.electronAPI + this.inferenceUrl = INFERENCE_URL if (!electronApi) { - this.inferenceUrl = JAN_SERVER_INFERENCE_URL; + this.inferenceUrl = `${window.core?.api?.baseApiUrl}/v1/chat/completions` } - console.debug("Inference url: ", this.inferenceUrl); + console.debug('Inference url: ', this.inferenceUrl) if (!(await fs.existsSync(JanInferenceNitroExtension._settingsDir))) - await fs.mkdirSync(JanInferenceNitroExtension._settingsDir); - this.writeDefaultEngineSettings(); + await fs.mkdirSync(JanInferenceNitroExtension._settingsDir) + this.writeDefaultEngineSettings() // Events subscription events.on(MessageEvent.OnMessageSent, (data: MessageRequest) => this.onMessageRequest(data) - ); + ) - events.on(ModelEvent.OnModelInit, (model: Model) => - this.onModelInit(model) - ); + events.on(ModelEvent.OnModelInit, (model: Model) => this.onModelInit(model)) - events.on(ModelEvent.OnModelStop, (model: Model) => - this.onModelStop(model) - ); + events.on(ModelEvent.OnModelStop, (model: Model) => this.onModelStop(model)) events.on(InferenceEvent.OnInferenceStopped, () => this.onInferenceStopped() - ); + ) // Attempt to fetch nvidia info - await executeOnMain(NODE, "updateNvidiaInfo", {}); + await executeOnMain(NODE, 'updateNvidiaInfo', {}) } /** @@ -126,56 +123,62 @@ export default class JanInferenceNitroExtension extends InferenceExtension { const engineFile = await joinPath([ JanInferenceNitroExtension._homeDir, JanInferenceNitroExtension._engineMetadataFileName, - ]); + ]) if 
(await fs.existsSync(engineFile)) { - const engine = await fs.readFileSync(engineFile, "utf-8"); + const engine = await fs.readFileSync(engineFile, 'utf-8') this._engineSettings = - typeof engine === "object" ? engine : JSON.parse(engine); + typeof engine === 'object' ? engine : JSON.parse(engine) } else { await fs.writeFileSync( engineFile, JSON.stringify(this._engineSettings, null, 2) - ); + ) } } catch (err) { - console.error(err); + console.error(err) } } private async onModelInit(model: Model) { - if (model.engine !== InferenceEngine.nitro) return; + if (model.engine !== InferenceEngine.nitro) return - const modelFullPath = await joinPath(["models", model.id]); - - this._currentModel = model; - const nitroInitResult = await executeOnMain(NODE, "runModel", { - modelFullPath, + const modelFolder = await joinPath([ + await getJanDataFolderPath(), + 'models', + model.id, + ]) + this._currentModel = model + const nitroInitResult = await executeOnMain(NODE, 'runModel', { + modelFolder, model, - }); + }) if (nitroInitResult?.error) { - events.emit(ModelEvent.OnModelFail, model); - return; + events.emit(ModelEvent.OnModelFail, { + ...model, + error: nitroInitResult.error, + }) + return } - events.emit(ModelEvent.OnModelReady, model); + events.emit(ModelEvent.OnModelReady, model) this.getNitroProcesHealthIntervalId = setInterval( () => this.periodicallyGetNitroHealth(), JanInferenceNitroExtension._intervalHealthCheck - ); + ) } private async onModelStop(model: Model) { - if (model.engine !== "nitro") return; + if (model.engine !== 'nitro') return - await executeOnMain(NODE, "stopModel"); - events.emit(ModelEvent.OnModelStopped, {}); + await executeOnMain(NODE, 'stopModel') + events.emit(ModelEvent.OnModelStopped, {}) // stop the periocally health check if (this.getNitroProcesHealthIntervalId) { - clearInterval(this.getNitroProcesHealthIntervalId); - this.getNitroProcesHealthIntervalId = undefined; + clearInterval(this.getNitroProcesHealthIntervalId) + 
this.getNitroProcesHealthIntervalId = undefined } } @@ -183,19 +186,19 @@ export default class JanInferenceNitroExtension extends InferenceExtension { * Periodically check for nitro process's health. */ private async periodicallyGetNitroHealth(): Promise { - const health = await executeOnMain(NODE, "getCurrentNitroProcessInfo"); + const health = await executeOnMain(NODE, 'getCurrentNitroProcessInfo') - const isRunning = this.nitroProcessInfo?.isRunning ?? false; + const isRunning = this.nitroProcessInfo?.isRunning ?? false if (isRunning && health.isRunning === false) { - console.debug("Nitro process is stopped"); - events.emit(ModelEvent.OnModelStopped, {}); + console.debug('Nitro process is stopped') + events.emit(ModelEvent.OnModelStopped, {}) } - this.nitroProcessInfo = health; + this.nitroProcessInfo = health } private async onInferenceStopped() { - this.isCancelled = true; - this.controller?.abort(); + this.isCancelled = true + this.controller?.abort() } /** @@ -204,20 +207,20 @@ export default class JanInferenceNitroExtension extends InferenceExtension { * @returns {Promise} A promise that resolves with the inference response. 
*/ async inference(data: MessageRequest): Promise { - const timestamp = Date.now(); + const timestamp = Date.now() const message: ThreadMessage = { thread_id: data.threadId, created: timestamp, updated: timestamp, status: MessageStatus.Ready, - id: "", + id: '', role: ChatCompletionRole.Assistant, - object: "thread.message", + object: 'thread.message', content: [], - }; + } return new Promise(async (resolve, reject) => { - if (!this._currentModel) return Promise.reject("No model loaded"); + if (!this._currentModel) return Promise.reject('No model loaded') requestInference( this.inferenceUrl, @@ -226,13 +229,13 @@ export default class JanInferenceNitroExtension extends InferenceExtension { ).subscribe({ next: (_content: any) => {}, complete: async () => { - resolve(message); + resolve(message) }, error: async (err: any) => { - reject(err); + reject(err) }, - }); - }); + }) + }) } /** @@ -243,31 +246,35 @@ export default class JanInferenceNitroExtension extends InferenceExtension { */ private async onMessageRequest(data: MessageRequest) { if (data.model?.engine !== InferenceEngine.nitro || !this._currentModel) { - return; + return } - const timestamp = Date.now(); + const timestamp = Date.now() const message: ThreadMessage = { id: ulid(), thread_id: data.threadId, + type: data.type, assistant_id: data.assistantId, role: ChatCompletionRole.Assistant, content: [], status: MessageStatus.Pending, created: timestamp, updated: timestamp, - object: "thread.message", - }; - events.emit(MessageEvent.OnMessageResponse, message); + object: 'thread.message', + } - this.isCancelled = false; - this.controller = new AbortController(); + if (data.type !== MessageRequestType.Summary) { + events.emit(MessageEvent.OnMessageResponse, message) + } + + this.isCancelled = false + this.controller = new AbortController() // @ts-ignore const model: Model = { ...(this._currentModel || {}), ...(data.model || {}), - }; + } requestInference( this.inferenceUrl, data.messages ?? 
[], @@ -281,26 +288,26 @@ export default class JanInferenceNitroExtension extends InferenceExtension { value: content.trim(), annotations: [], }, - }; - message.content = [messageContent]; - events.emit(MessageEvent.OnMessageUpdate, message); + } + message.content = [messageContent] + events.emit(MessageEvent.OnMessageUpdate, message) }, complete: async () => { message.status = message.content.length ? MessageStatus.Ready - : MessageStatus.Error; - events.emit(MessageEvent.OnMessageUpdate, message); + : MessageStatus.Error + events.emit(MessageEvent.OnMessageUpdate, message) }, error: async (err: any) => { if (this.isCancelled || message.content.length) { - message.status = MessageStatus.Stopped; - events.emit(MessageEvent.OnMessageUpdate, message); - return; + message.status = MessageStatus.Stopped + events.emit(MessageEvent.OnMessageUpdate, message) + return } - message.status = MessageStatus.Error; - events.emit(MessageEvent.OnMessageUpdate, message); - log(`[APP]::Error: ${err.message}`); + message.status = MessageStatus.Error + events.emit(MessageEvent.OnMessageUpdate, message) + log(`[APP]::Error: ${err.message}`) }, - }); + }) } } diff --git a/extensions/inference-nitro-extension/src/node/accelerator.ts b/extensions/inference-nitro-extension/src/node/accelerator.ts new file mode 100644 index 000000000..972f88681 --- /dev/null +++ b/extensions/inference-nitro-extension/src/node/accelerator.ts @@ -0,0 +1,240 @@ +import { writeFileSync, existsSync, readFileSync } from 'fs' +import { exec, spawn } from 'child_process' +import path from 'path' +import { getJanDataFolderPath, log } from '@janhq/core/node' + +/** + * Default GPU settings + * TODO: This needs to be refactored to support multiple accelerators + **/ +const DEFALT_SETTINGS = { + notify: true, + run_mode: 'cpu', + nvidia_driver: { + exist: false, + version: '', + }, + cuda: { + exist: false, + version: '', + }, + gpus: [], + gpu_highest_vram: '', + gpus_in_use: [], + is_initial: true, + // TODO: This 
needs to be set based on user toggle in settings + vulkan: { + enabled: true, + gpu_in_use: '1', + }, +} + +/** + * Path to the settings file + **/ +export const GPU_INFO_FILE = path.join( + getJanDataFolderPath(), + 'settings', + 'settings.json' +) + +/** + * Current nitro process + */ +let nitroProcessInfo: NitroProcessInfo | undefined = undefined + +/** + * Nitro process info + */ +export interface NitroProcessInfo { + isRunning: boolean +} + +/** + * This will retrive GPU informations and persist settings.json + * Will be called when the extension is loaded to turn on GPU acceleration if supported + */ +export async function updateNvidiaInfo() { + if (process.platform !== 'darwin') { + let data + try { + data = JSON.parse(readFileSync(GPU_INFO_FILE, 'utf-8')) + } catch (error) { + data = DEFALT_SETTINGS + writeFileSync(GPU_INFO_FILE, JSON.stringify(data, null, 2)) + } + updateNvidiaDriverInfo() + updateGpuInfo() + } +} + +/** + * Retrieve current nitro process + */ +export const getNitroProcessInfo = (subprocess: any): NitroProcessInfo => { + nitroProcessInfo = { + isRunning: subprocess != null, + } + return nitroProcessInfo +} + +/** + * Validate nvidia and cuda for linux and windows + */ +export async function updateNvidiaDriverInfo(): Promise { + exec( + 'nvidia-smi --query-gpu=driver_version --format=csv,noheader', + (error, stdout) => { + let data = JSON.parse(readFileSync(GPU_INFO_FILE, 'utf-8')) + + if (!error) { + const firstLine = stdout.split('\n')[0].trim() + data['nvidia_driver'].exist = true + data['nvidia_driver'].version = firstLine + } else { + data['nvidia_driver'].exist = false + } + + writeFileSync(GPU_INFO_FILE, JSON.stringify(data, null, 2)) + Promise.resolve() + } + ) +} + +/** + * Check if file exists in paths + */ +export function checkFileExistenceInPaths( + file: string, + paths: string[] +): boolean { + return paths.some((p) => existsSync(path.join(p, file))) +} + +/** + * Validate cuda for linux and windows + */ +export function 
updateCudaExistence( + data: Record = DEFALT_SETTINGS +): Record { + let filesCuda12: string[] + let filesCuda11: string[] + let paths: string[] + let cudaVersion: string = '' + + if (process.platform === 'win32') { + filesCuda12 = ['cublas64_12.dll', 'cudart64_12.dll', 'cublasLt64_12.dll'] + filesCuda11 = ['cublas64_11.dll', 'cudart64_11.dll', 'cublasLt64_11.dll'] + paths = process.env.PATH ? process.env.PATH.split(path.delimiter) : [] + } else { + filesCuda12 = ['libcudart.so.12', 'libcublas.so.12', 'libcublasLt.so.12'] + filesCuda11 = ['libcudart.so.11.0', 'libcublas.so.11', 'libcublasLt.so.11'] + paths = process.env.LD_LIBRARY_PATH + ? process.env.LD_LIBRARY_PATH.split(path.delimiter) + : [] + paths.push('/usr/lib/x86_64-linux-gnu/') + } + + let cudaExists = filesCuda12.every( + (file) => existsSync(file) || checkFileExistenceInPaths(file, paths) + ) + + if (!cudaExists) { + cudaExists = filesCuda11.every( + (file) => existsSync(file) || checkFileExistenceInPaths(file, paths) + ) + if (cudaExists) { + cudaVersion = '11' + } + } else { + cudaVersion = '12' + } + + data['cuda'].exist = cudaExists + data['cuda'].version = cudaVersion + console.log(data['is_initial'], data['gpus_in_use']) + if (cudaExists && data['is_initial'] && data['gpus_in_use'].length > 0) { + data.run_mode = 'gpu' + } + data.is_initial = false + return data +} + +/** + * Get GPU information + */ +export async function updateGpuInfo(): Promise { + let data = JSON.parse(readFileSync(GPU_INFO_FILE, 'utf-8')) + + // Cuda + if (data['vulkan'] === true) { + // Vulkan + exec( + process.platform === 'win32' + ? 
`${__dirname}\\..\\bin\\vulkaninfoSDK.exe --summary` + : `${__dirname}/../bin/vulkaninfo --summary`, + (error, stdout) => { + if (!error) { + const output = stdout.toString() + log(output) + const gpuRegex = /GPU(\d+):(?:[\s\S]*?)deviceName\s*=\s*(.*)/g + + let gpus = [] + let match + while ((match = gpuRegex.exec(output)) !== null) { + const id = match[1] + const name = match[2] + gpus.push({ id, vram: 0, name }) + } + data.gpus = gpus + + if (!data['gpus_in_use'] || data['gpus_in_use'].length === 0) { + data.gpus_in_use = [data.gpus.length > 1 ? '1' : '0'] + } + + data = updateCudaExistence(data) + writeFileSync(GPU_INFO_FILE, JSON.stringify(data, null, 2)) + } + Promise.resolve() + } + ) + } else { + exec( + 'nvidia-smi --query-gpu=index,memory.total,name --format=csv,noheader,nounits', + (error, stdout) => { + if (!error) { + log(stdout) + // Get GPU info and gpu has higher memory first + let highestVram = 0 + let highestVramId = '0' + let gpus = stdout + .trim() + .split('\n') + .map((line) => { + let [id, vram, name] = line.split(', ') + vram = vram.replace(/\r/g, '') + if (parseFloat(vram) > highestVram) { + highestVram = parseFloat(vram) + highestVramId = id + } + return { id, vram, name } + }) + + data.gpus = gpus + data.gpu_highest_vram = highestVramId + } else { + data.gpus = [] + data.gpu_highest_vram = '' + } + + if (!data['gpus_in_use'] || data['gpus_in_use'].length === 0) { + data.gpus_in_use = [data['gpu_highest_vram']] + } + + data = updateCudaExistence(data) + writeFileSync(GPU_INFO_FILE, JSON.stringify(data, null, 2)) + Promise.resolve() + } + ) + } +} diff --git a/extensions/inference-nitro-extension/src/node/execute.ts b/extensions/inference-nitro-extension/src/node/execute.ts index 83b5226d4..08baba0d5 100644 --- a/extensions/inference-nitro-extension/src/node/execute.ts +++ b/extensions/inference-nitro-extension/src/node/execute.ts @@ -1,65 +1,79 @@ -import { readFileSync } from "fs"; -import * as path from "path"; -import { NVIDIA_INFO_FILE 
} from "./nvidia"; +import { readFileSync } from 'fs' +import * as path from 'path' +import { GPU_INFO_FILE } from './accelerator' export interface NitroExecutableOptions { - executablePath: string; - cudaVisibleDevices: string; + executablePath: string + cudaVisibleDevices: string + vkVisibleDevices: string } /** * Find which executable file to run based on the current platform. * @returns The name of the executable file to run. */ export const executableNitroFile = (): NitroExecutableOptions => { - let binaryFolder = path.join(__dirname, "..", "bin"); // Current directory by default - let cudaVisibleDevices = ""; - let binaryName = "nitro"; + let binaryFolder = path.join(__dirname, '..', 'bin') // Current directory by default + let cudaVisibleDevices = '' + let vkVisibleDevices = '' + let binaryName = 'nitro' /** * The binary folder is different for each platform. */ - if (process.platform === "win32") { + if (process.platform === 'win32') { /** - * For Windows: win-cpu, win-cuda-11-7, win-cuda-12-0 + * For Windows: win-cpu, win-vulkan, win-cuda-11-7, win-cuda-12-0 */ - let nvidiaInfo = JSON.parse(readFileSync(NVIDIA_INFO_FILE, "utf-8")); - if (nvidiaInfo["run_mode"] === "cpu") { - binaryFolder = path.join(binaryFolder, "win-cpu"); + let gpuInfo = JSON.parse(readFileSync(GPU_INFO_FILE, 'utf-8')) + if (gpuInfo['run_mode'] === 'cpu') { + binaryFolder = path.join(binaryFolder, 'win-cpu') } else { - if (nvidiaInfo["cuda"].version === "11") { - binaryFolder = path.join(binaryFolder, "win-cuda-11-7"); + if (gpuInfo['cuda']?.version === '11') { + binaryFolder = path.join(binaryFolder, 'win-cuda-11-7') } else { - binaryFolder = path.join(binaryFolder, "win-cuda-12-0"); + binaryFolder = path.join(binaryFolder, 'win-cuda-12-0') } - cudaVisibleDevices = nvidiaInfo["gpus_in_use"].join(","); + cudaVisibleDevices = gpuInfo['gpus_in_use'].join(',') } - binaryName = "nitro.exe"; - } else if (process.platform === "darwin") { + if (gpuInfo['vulkan'] === true) { + binaryFolder = 
path.join(__dirname, '..', 'bin') + binaryFolder = path.join(binaryFolder, 'win-vulkan') + vkVisibleDevices = gpuInfo['gpus_in_use'].toString() + } + binaryName = 'nitro.exe' + } else if (process.platform === 'darwin') { /** * For MacOS: mac-arm64 (Silicon), mac-x64 (InteL) */ - if (process.arch === "arm64") { - binaryFolder = path.join(binaryFolder, "mac-arm64"); + if (process.arch === 'arm64') { + binaryFolder = path.join(binaryFolder, 'mac-arm64') } else { - binaryFolder = path.join(binaryFolder, "mac-x64"); + binaryFolder = path.join(binaryFolder, 'mac-x64') } } else { /** - * For Linux: linux-cpu, linux-cuda-11-7, linux-cuda-12-0 + * For Linux: linux-cpu, linux-vulkan, linux-cuda-11-7, linux-cuda-12-0 */ - let nvidiaInfo = JSON.parse(readFileSync(NVIDIA_INFO_FILE, "utf-8")); - if (nvidiaInfo["run_mode"] === "cpu") { - binaryFolder = path.join(binaryFolder, "linux-cpu"); + let gpuInfo = JSON.parse(readFileSync(GPU_INFO_FILE, 'utf-8')) + if (gpuInfo['run_mode'] === 'cpu') { + binaryFolder = path.join(binaryFolder, 'linux-cpu') } else { - if (nvidiaInfo["cuda"].version === "11") { - binaryFolder = path.join(binaryFolder, "linux-cuda-11-7"); + if (gpuInfo['cuda']?.version === '11') { + binaryFolder = path.join(binaryFolder, 'linux-cuda-11-7') } else { - binaryFolder = path.join(binaryFolder, "linux-cuda-12-0"); + binaryFolder = path.join(binaryFolder, 'linux-cuda-12-0') } - cudaVisibleDevices = nvidiaInfo["gpus_in_use"].join(","); + cudaVisibleDevices = gpuInfo['gpus_in_use'].join(',') + } + + if (gpuInfo['vulkan'] === true) { + binaryFolder = path.join(__dirname, '..', 'bin') + binaryFolder = path.join(binaryFolder, 'win-vulkan') + vkVisibleDevices = gpuInfo['gpus_in_use'].toString() } } return { executablePath: path.join(binaryFolder, binaryName), cudaVisibleDevices, - }; -}; + vkVisibleDevices, + } +} diff --git a/extensions/inference-nitro-extension/src/node/index.ts b/extensions/inference-nitro-extension/src/node/index.ts index 7ba90b556..9b2684a6c 100644 --- 
a/extensions/inference-nitro-extension/src/node/index.ts +++ b/extensions/inference-nitro-extension/src/node/index.ts @@ -1,55 +1,50 @@ -import fs from "fs"; -import path from "path"; -import { ChildProcessWithoutNullStreams, spawn } from "child_process"; -import tcpPortUsed from "tcp-port-used"; -import fetchRT from "fetch-retry"; -import { - log, - getJanDataFolderPath, - getSystemResourceInfo, -} from "@janhq/core/node"; -import { getNitroProcessInfo, updateNvidiaInfo } from "./nvidia"; +import fs from 'fs' +import path from 'path' +import { ChildProcessWithoutNullStreams, spawn } from 'child_process' +import tcpPortUsed from 'tcp-port-used' +import fetchRT from 'fetch-retry' +import { log, getSystemResourceInfo } from '@janhq/core/node' +import { getNitroProcessInfo, updateNvidiaInfo } from './accelerator' import { Model, InferenceEngine, ModelSettingParams, PromptTemplate, -} from "@janhq/core"; -import { executableNitroFile } from "./execute"; +} from '@janhq/core' +import { executableNitroFile } from './execute' // Polyfill fetch with retry -const fetchRetry = fetchRT(fetch); +const fetchRetry = fetchRT(fetch) /** * The response object for model init operation. 
*/ interface ModelInitOptions { - modelFullPath: string; - model: Model; + modelFolder: string + model: Model } // The PORT to use for the Nitro subprocess -const PORT = 3928; +const PORT = 3928 // The HOST address to use for the Nitro subprocess -const LOCAL_HOST = "127.0.0.1"; +const LOCAL_HOST = '127.0.0.1' // The URL for the Nitro subprocess -const NITRO_HTTP_SERVER_URL = `http://${LOCAL_HOST}:${PORT}`; +const NITRO_HTTP_SERVER_URL = `http://${LOCAL_HOST}:${PORT}` // The URL for the Nitro subprocess to load a model -const NITRO_HTTP_LOAD_MODEL_URL = `${NITRO_HTTP_SERVER_URL}/inferences/llamacpp/loadmodel`; +const NITRO_HTTP_LOAD_MODEL_URL = `${NITRO_HTTP_SERVER_URL}/inferences/llamacpp/loadmodel` // The URL for the Nitro subprocess to validate a model -const NITRO_HTTP_VALIDATE_MODEL_URL = `${NITRO_HTTP_SERVER_URL}/inferences/llamacpp/modelstatus`; +const NITRO_HTTP_VALIDATE_MODEL_URL = `${NITRO_HTTP_SERVER_URL}/inferences/llamacpp/modelstatus` // The URL for the Nitro subprocess to kill itself -const NITRO_HTTP_KILL_URL = `${NITRO_HTTP_SERVER_URL}/processmanager/destroy`; +const NITRO_HTTP_KILL_URL = `${NITRO_HTTP_SERVER_URL}/processmanager/destroy` // The supported model format // TODO: Should be an array to support more models -const SUPPORTED_MODEL_FORMAT = ".gguf"; +const SUPPORTED_MODEL_FORMAT = '.gguf' // The subprocess instance for Nitro -let subprocess: ChildProcessWithoutNullStreams | undefined = undefined; -// The current model file url -let currentModelFile: string = ""; +let subprocess: ChildProcessWithoutNullStreams | undefined = undefined + // The current model settings -let currentSettings: ModelSettingParams | undefined = undefined; +let currentSettings: ModelSettingParams | undefined = undefined /** * Stops a Nitro subprocess. 
@@ -57,7 +52,7 @@ let currentSettings: ModelSettingParams | undefined = undefined; * @returns A Promise that resolves when the subprocess is terminated successfully, or rejects with an error message if the subprocess fails to terminate. */ function stopModel(): Promise { - return killSubprocess(); + return killSubprocess() } /** @@ -67,62 +62,79 @@ function stopModel(): Promise { * TODO: Should pass absolute of the model file instead of just the name - So we can modurize the module.ts to npm package */ async function runModel( - wrapper: ModelInitOptions, + wrapper: ModelInitOptions ): Promise { if (wrapper.model.engine !== InferenceEngine.nitro) { // Not a nitro model - return Promise.resolve(); + return Promise.resolve() } - currentModelFile = wrapper.modelFullPath; - const janRoot = await getJanDataFolderPath(); - if (!currentModelFile.includes(janRoot)) { - currentModelFile = path.join(janRoot, currentModelFile); - } - const files: string[] = fs.readdirSync(currentModelFile); - - // Look for GGUF model file - const ggufBinFile = files.find( - (file) => - file === path.basename(currentModelFile) || - file.toLowerCase().includes(SUPPORTED_MODEL_FORMAT), - ); - - if (!ggufBinFile) return Promise.reject("No GGUF model file found"); - - currentModelFile = path.join(currentModelFile, ggufBinFile); - if (wrapper.model.engine !== InferenceEngine.nitro) { - return Promise.reject("Not a nitro model"); + return Promise.reject('Not a nitro model') } else { - const nitroResourceProbe = await getSystemResourceInfo(); + const nitroResourceProbe = await getSystemResourceInfo() // Convert settings.prompt_template to system_prompt, user_prompt, ai_prompt if (wrapper.model.settings.prompt_template) { - const promptTemplate = wrapper.model.settings.prompt_template; - const prompt = promptTemplateConverter(promptTemplate); + const promptTemplate = wrapper.model.settings.prompt_template + const prompt = promptTemplateConverter(promptTemplate) if (prompt?.error) { - return 
Promise.reject(prompt.error); + return Promise.reject(prompt.error) } - wrapper.model.settings.system_prompt = prompt.system_prompt; - wrapper.model.settings.user_prompt = prompt.user_prompt; - wrapper.model.settings.ai_prompt = prompt.ai_prompt; + wrapper.model.settings.system_prompt = prompt.system_prompt + wrapper.model.settings.user_prompt = prompt.user_prompt + wrapper.model.settings.ai_prompt = prompt.ai_prompt } - const modelFolderPath = path.join(janRoot, "models", wrapper.model.id); - const modelPath = wrapper.model.settings.llama_model_path - ? path.join(modelFolderPath, wrapper.model.settings.llama_model_path) - : currentModelFile; + // modelFolder is the absolute path to the running model folder + // e.g. ~/jan/models/llama-2 + let modelFolder = wrapper.modelFolder + + let llama_model_path = wrapper.model.settings.llama_model_path + + // Absolute model path support + if ( + wrapper.model?.sources.length && + wrapper.model.sources.every((e) => fs.existsSync(e.url)) + ) { + llama_model_path = + wrapper.model.sources.length === 1 + ? wrapper.model.sources[0].url + : wrapper.model.sources.find((e) => + e.url.includes(llama_model_path ?? wrapper.model.id) + )?.url + } + + if (!llama_model_path || !path.isAbsolute(llama_model_path)) { + // Look for GGUF model file + const modelFiles: string[] = fs.readdirSync(modelFolder) + const ggufBinFile = modelFiles.find( + (file) => + // 1. Prioritize llama_model_path (predefined) + (llama_model_path && file === llama_model_path) || + // 2. Prioritize GGUF File (manual import) + file.toLowerCase().includes(SUPPORTED_MODEL_FORMAT) || + // 3. 
Fallback Model ID (for backward compatibility) + file === wrapper.model.id + ) + if (ggufBinFile) llama_model_path = path.join(modelFolder, ggufBinFile) + } + + // Look for absolute source path for single model + + if (!llama_model_path) return Promise.reject('No GGUF model file found') currentSettings = { ...wrapper.model.settings, - llama_model_path: modelPath, + llama_model_path, // This is critical and requires real CPU physical core count (or performance core) cpu_threads: Math.max(1, nitroResourceProbe.numCpuPhysicalCore), ...(wrapper.model.settings.mmproj && { - mmproj: path.join(modelFolderPath, wrapper.model.settings.mmproj), + mmproj: path.isAbsolute(wrapper.model.settings.mmproj) + ? wrapper.model.settings.mmproj + : path.join(modelFolder, wrapper.model.settings.mmproj), }), - }; - return runNitroAndLoadModel(); + } + return runNitroAndLoadModel() } } @@ -142,10 +154,10 @@ async function runNitroAndLoadModel() { * Should wait for awhile to make sure the port is free and subprocess is killed * The tested threshold is 500ms **/ - if (process.platform === "win32") { - return new Promise((resolve) => setTimeout(resolve, 500)); + if (process.platform === 'win32') { + return new Promise((resolve) => setTimeout(resolve, 500)) } else { - return Promise.resolve(); + return Promise.resolve() } }) .then(spawnNitroProcess) @@ -153,9 +165,9 @@ async function runNitroAndLoadModel() { .then(validateModelStatus) .catch((err) => { // TODO: Broadcast error so app could display proper error message - log(`[NITRO]::Error: ${err}`); - return { error: err }; - }); + log(`[NITRO]::Error: ${err}`) + return { error: err } + }) } /** @@ -165,43 +177,43 @@ async function runNitroAndLoadModel() { */ function promptTemplateConverter(promptTemplate: string): PromptTemplate { // Split the string using the markers - const systemMarker = "{system_message}"; - const promptMarker = "{prompt}"; + const systemMarker = '{system_message}' + const promptMarker = '{prompt}' if ( 
promptTemplate.includes(systemMarker) && promptTemplate.includes(promptMarker) ) { // Find the indices of the markers - const systemIndex = promptTemplate.indexOf(systemMarker); - const promptIndex = promptTemplate.indexOf(promptMarker); + const systemIndex = promptTemplate.indexOf(systemMarker) + const promptIndex = promptTemplate.indexOf(promptMarker) // Extract the parts of the string - const system_prompt = promptTemplate.substring(0, systemIndex); + const system_prompt = promptTemplate.substring(0, systemIndex) const user_prompt = promptTemplate.substring( systemIndex + systemMarker.length, - promptIndex, - ); + promptIndex + ) const ai_prompt = promptTemplate.substring( - promptIndex + promptMarker.length, - ); + promptIndex + promptMarker.length + ) // Return the split parts - return { system_prompt, user_prompt, ai_prompt }; + return { system_prompt, user_prompt, ai_prompt } } else if (promptTemplate.includes(promptMarker)) { // Extract the parts of the string for the case where only promptMarker is present - const promptIndex = promptTemplate.indexOf(promptMarker); - const user_prompt = promptTemplate.substring(0, promptIndex); + const promptIndex = promptTemplate.indexOf(promptMarker) + const user_prompt = promptTemplate.substring(0, promptIndex) const ai_prompt = promptTemplate.substring( - promptIndex + promptMarker.length, - ); + promptIndex + promptMarker.length + ) // Return the split parts - return { user_prompt, ai_prompt }; + return { user_prompt, ai_prompt } } // Return an error if none of the conditions are met - return { error: "Cannot split prompt template" }; + return { error: 'Cannot split prompt template' } } /** @@ -210,13 +222,13 @@ function promptTemplateConverter(promptTemplate: string): PromptTemplate { */ function loadLLMModel(settings: any): Promise { if (!settings?.ngl) { - settings.ngl = 100; + settings.ngl = 100 } - log(`[NITRO]::Debug: Loading model with params ${JSON.stringify(settings)}`); + log(`[NITRO]::Debug: Loading model 
with params ${JSON.stringify(settings)}`) return fetchRetry(NITRO_HTTP_LOAD_MODEL_URL, { - method: "POST", + method: 'POST', headers: { - "Content-Type": "application/json", + 'Content-Type': 'application/json', }, body: JSON.stringify(settings), retries: 3, @@ -225,15 +237,15 @@ function loadLLMModel(settings: any): Promise { .then((res) => { log( `[NITRO]::Debug: Load model success with response ${JSON.stringify( - res, - )}`, - ); - return Promise.resolve(res); + res + )}` + ) + return Promise.resolve(res) }) .catch((err) => { - log(`[NITRO]::Error: Load model failed with error ${err}`); - return Promise.reject(err); - }); + log(`[NITRO]::Error: Load model failed with error ${err}`) + return Promise.reject(err) + }) } /** @@ -246,9 +258,9 @@ async function validateModelStatus(): Promise { // Send a GET request to the validation URL. // Retry the request up to 3 times if it fails, with a delay of 500 milliseconds between retries. return fetchRetry(NITRO_HTTP_VALIDATE_MODEL_URL, { - method: "GET", + method: 'GET', headers: { - "Content-Type": "application/json", + 'Content-Type': 'application/json', }, retries: 5, retryDelay: 500, @@ -257,10 +269,10 @@ async function validateModelStatus(): Promise { `[NITRO]::Debug: Validate model state with response ${JSON.stringify( res.status )}` - ); + ) // If the response is OK, check model_loaded status. if (res.ok) { - const body = await res.json(); + const body = await res.json() // If the model is loaded, return an empty object. // Otherwise, return an object with an error message. 
if (body.model_loaded) { @@ -268,17 +280,17 @@ async function validateModelStatus(): Promise { `[NITRO]::Debug: Validate model state success with response ${JSON.stringify( body )}` - ); - return Promise.resolve(); + ) + return Promise.resolve() } } log( `[NITRO]::Debug: Validate model state failed with response ${JSON.stringify( res.statusText )}` - ); - return Promise.reject("Validate model status failed"); - }); + ) + return Promise.reject('Validate model status failed') + }) } /** @@ -286,21 +298,27 @@ async function validateModelStatus(): Promise { * @returns A Promise that resolves when the subprocess is terminated successfully, or rejects with an error message if the subprocess fails to terminate. */ async function killSubprocess(): Promise { - const controller = new AbortController(); - setTimeout(() => controller.abort(), 5000); - log(`[NITRO]::Debug: Request to kill Nitro`); + const controller = new AbortController() + setTimeout(() => controller.abort(), 5000) + log(`[NITRO]::Debug: Request to kill Nitro`) return fetch(NITRO_HTTP_KILL_URL, { - method: "DELETE", + method: 'DELETE', signal: controller.signal, }) .then(() => { - subprocess?.kill(); - subprocess = undefined; + subprocess?.kill() + subprocess = undefined }) - .catch(() => {}) + .catch(() => {}) // Do nothing with this attempt .then(() => tcpPortUsed.waitUntilFree(PORT, 300, 5000)) - .then(() => log(`[NITRO]::Debug: Nitro process is terminated`)); + .then(() => log(`[NITRO]::Debug: Nitro process is terminated`)) + .catch((err) => { + log( + `[NITRO]::Debug: Could not kill running process on port ${PORT}. Might be another process running on the same port? ${err}` + ) + throw 'PORT_NOT_AVAILABLE' + }) } /** @@ -308,49 +326,53 @@ async function killSubprocess(): Promise { * @returns A promise that resolves when the Nitro subprocess is started. 
*/ function spawnNitroProcess(): Promise { - log(`[NITRO]::Debug: Spawning Nitro subprocess...`); + log(`[NITRO]::Debug: Spawning Nitro subprocess...`) return new Promise(async (resolve, reject) => { - let binaryFolder = path.join(__dirname, "..", "bin"); // Current directory by default - let executableOptions = executableNitroFile(); + let binaryFolder = path.join(__dirname, '..', 'bin') // Current directory by default + let executableOptions = executableNitroFile() - const args: string[] = ["1", LOCAL_HOST, PORT.toString()]; + const args: string[] = ['1', LOCAL_HOST, PORT.toString()] // Execute the binary log( - `[NITRO]::Debug: Spawn nitro at path: ${executableOptions.executablePath}, and args: ${args}`, - ); + `[NITRO]::Debug: Spawn nitro at path: ${executableOptions.executablePath}, and args: ${args}` + ) subprocess = spawn( executableOptions.executablePath, - ["1", LOCAL_HOST, PORT.toString()], + ['1', LOCAL_HOST, PORT.toString()], { cwd: binaryFolder, env: { ...process.env, CUDA_VISIBLE_DEVICES: executableOptions.cudaVisibleDevices, + // Vulkan - Support 1 device at a time for now + ...(executableOptions.vkVisibleDevices?.length > 0 && { + GGML_VULKAN_DEVICE: executableOptions.vkVisibleDevices[0], + }), }, - }, - ); + } + ) // Handle subprocess output - subprocess.stdout.on("data", (data: any) => { - log(`[NITRO]::Debug: ${data}`); - }); + subprocess.stdout.on('data', (data: any) => { + log(`[NITRO]::Debug: ${data}`) + }) - subprocess.stderr.on("data", (data: any) => { - log(`[NITRO]::Error: ${data}`); - }); + subprocess.stderr.on('data', (data: any) => { + log(`[NITRO]::Error: ${data}`) + }) - subprocess.on("close", (code: any) => { - log(`[NITRO]::Debug: Nitro exited with code: ${code}`); - subprocess = undefined; - reject(`child process exited with code ${code}`); - }); + subprocess.on('close', (code: any) => { + log(`[NITRO]::Debug: Nitro exited with code: ${code}`) + subprocess = undefined + reject(`child process exited with code ${code}`) + }) 
tcpPortUsed.waitUntilUsed(PORT, 300, 30000).then(() => { - log(`[NITRO]::Debug: Nitro is ready`); - resolve(); - }); - }); + log(`[NITRO]::Debug: Nitro is ready`) + resolve() + }) + }) } /** @@ -360,7 +382,7 @@ function spawnNitroProcess(): Promise { */ function dispose() { // clean other registered resources here - killSubprocess(); + killSubprocess() } export default { @@ -370,4 +392,4 @@ export default { dispose, updateNvidiaInfo, getCurrentNitroProcessInfo: () => getNitroProcessInfo(subprocess), -}; +} diff --git a/extensions/inference-nitro-extension/src/node/nvidia.ts b/extensions/inference-nitro-extension/src/node/nvidia.ts deleted file mode 100644 index bed2856a1..000000000 --- a/extensions/inference-nitro-extension/src/node/nvidia.ts +++ /dev/null @@ -1,197 +0,0 @@ -import { writeFileSync, existsSync, readFileSync } from "fs"; -import { exec } from "child_process"; -import path from "path"; -import { getJanDataFolderPath } from "@janhq/core/node"; - -/** - * Default GPU settings - **/ -const DEFALT_SETTINGS = { - notify: true, - run_mode: "cpu", - nvidia_driver: { - exist: false, - version: "", - }, - cuda: { - exist: false, - version: "", - }, - gpus: [], - gpu_highest_vram: "", - gpus_in_use: [], - is_initial: true, -}; - -/** - * Path to the settings file - **/ -export const NVIDIA_INFO_FILE = path.join( - getJanDataFolderPath(), - "settings", - "settings.json" -); - -/** - * Current nitro process - */ -let nitroProcessInfo: NitroProcessInfo | undefined = undefined; - -/** - * Nitro process info - */ -export interface NitroProcessInfo { - isRunning: boolean; -} - -/** - * This will retrive GPU informations and persist settings.json - * Will be called when the extension is loaded to turn on GPU acceleration if supported - */ -export async function updateNvidiaInfo() { - if (process.platform !== "darwin") { - let data; - try { - data = JSON.parse(readFileSync(NVIDIA_INFO_FILE, "utf-8")); - } catch (error) { - data = DEFALT_SETTINGS; - 
writeFileSync(NVIDIA_INFO_FILE, JSON.stringify(data, null, 2)); - } - updateNvidiaDriverInfo(); - updateGpuInfo(); - } -} - -/** - * Retrieve current nitro process - */ -export const getNitroProcessInfo = (subprocess: any): NitroProcessInfo => { - nitroProcessInfo = { - isRunning: subprocess != null, - }; - return nitroProcessInfo; -}; - -/** - * Validate nvidia and cuda for linux and windows - */ -export async function updateNvidiaDriverInfo(): Promise { - exec( - "nvidia-smi --query-gpu=driver_version --format=csv,noheader", - (error, stdout) => { - let data = JSON.parse(readFileSync(NVIDIA_INFO_FILE, "utf-8")); - - if (!error) { - const firstLine = stdout.split("\n")[0].trim(); - data["nvidia_driver"].exist = true; - data["nvidia_driver"].version = firstLine; - } else { - data["nvidia_driver"].exist = false; - } - - writeFileSync(NVIDIA_INFO_FILE, JSON.stringify(data, null, 2)); - Promise.resolve(); - } - ); -} - -/** - * Check if file exists in paths - */ -export function checkFileExistenceInPaths( - file: string, - paths: string[] -): boolean { - return paths.some((p) => existsSync(path.join(p, file))); -} - -/** - * Validate cuda for linux and windows - */ -export function updateCudaExistence(data: Record = DEFALT_SETTINGS): Record { - let filesCuda12: string[]; - let filesCuda11: string[]; - let paths: string[]; - let cudaVersion: string = ""; - - if (process.platform === "win32") { - filesCuda12 = ["cublas64_12.dll", "cudart64_12.dll", "cublasLt64_12.dll"]; - filesCuda11 = ["cublas64_11.dll", "cudart64_11.dll", "cublasLt64_11.dll"]; - paths = process.env.PATH ? process.env.PATH.split(path.delimiter) : []; - } else { - filesCuda12 = ["libcudart.so.12", "libcublas.so.12", "libcublasLt.so.12"]; - filesCuda11 = ["libcudart.so.11.0", "libcublas.so.11", "libcublasLt.so.11"]; - paths = process.env.LD_LIBRARY_PATH - ? 
process.env.LD_LIBRARY_PATH.split(path.delimiter) - : []; - paths.push("/usr/lib/x86_64-linux-gnu/"); - } - - let cudaExists = filesCuda12.every( - (file) => existsSync(file) || checkFileExistenceInPaths(file, paths) - ); - - if (!cudaExists) { - cudaExists = filesCuda11.every( - (file) => existsSync(file) || checkFileExistenceInPaths(file, paths) - ); - if (cudaExists) { - cudaVersion = "11"; - } - } else { - cudaVersion = "12"; - } - - data["cuda"].exist = cudaExists; - data["cuda"].version = cudaVersion; - console.log(data["is_initial"], data["gpus_in_use"]); - if (cudaExists && data["is_initial"] && data["gpus_in_use"].length > 0) { - data.run_mode = "gpu"; - } - data.is_initial = false; - return data; -} - -/** - * Get GPU information - */ -export async function updateGpuInfo(): Promise { - exec( - "nvidia-smi --query-gpu=index,memory.total,name --format=csv,noheader,nounits", - (error, stdout) => { - let data = JSON.parse(readFileSync(NVIDIA_INFO_FILE, "utf-8")); - - if (!error) { - // Get GPU info and gpu has higher memory first - let highestVram = 0; - let highestVramId = "0"; - let gpus = stdout - .trim() - .split("\n") - .map((line) => { - let [id, vram, name] = line.split(", "); - vram = vram.replace(/\r/g, ""); - if (parseFloat(vram) > highestVram) { - highestVram = parseFloat(vram); - highestVramId = id; - } - return { id, vram, name }; - }); - - data.gpus = gpus; - data.gpu_highest_vram = highestVramId; - } else { - data.gpus = []; - data.gpu_highest_vram = ""; - } - - if (!data["gpus_in_use"] || data["gpus_in_use"].length === 0) { - data.gpus_in_use = [data["gpu_highest_vram"]]; - } - - data = updateCudaExistence(data); - writeFileSync(NVIDIA_INFO_FILE, JSON.stringify(data, null, 2)); - Promise.resolve(); - } - ); -} diff --git a/extensions/inference-openai-extension/package.json b/extensions/inference-openai-extension/package.json index 5fa0ce974..5efdbf874 100644 --- a/extensions/inference-openai-extension/package.json +++ 
b/extensions/inference-openai-extension/package.json @@ -8,7 +8,7 @@ "license": "AGPL-3.0", "scripts": { "build": "tsc -b . && webpack --config webpack.config.js", - "build:publish": "rimraf *.tgz --glob && npm run build && npm pack && cpx *.tgz ../../electron/pre-install" + "build:publish": "rimraf *.tgz --glob && npm run build && npm pack && cpx *.tgz ../../pre-install" }, "exports": { ".": "./dist/index.js", @@ -18,13 +18,13 @@ "cpx": "^1.5.0", "rimraf": "^3.0.2", "webpack": "^5.88.2", - "webpack-cli": "^5.1.4" + "webpack-cli": "^5.1.4", + "ts-loader": "^9.5.0" }, "dependencies": { "@janhq/core": "file:../../core", "fetch-retry": "^5.0.6", "path-browserify": "^1.0.1", - "ts-loader": "^9.5.0", "ulid": "^2.3.0" }, "engines": { diff --git a/extensions/inference-openai-extension/src/@types/global.d.ts b/extensions/inference-openai-extension/src/@types/global.d.ts index 84f86c145..a49bb5a2f 100644 --- a/extensions/inference-openai-extension/src/@types/global.d.ts +++ b/extensions/inference-openai-extension/src/@types/global.d.ts @@ -1,26 +1,26 @@ -declare const MODULE: string; -declare const OPENAI_DOMAIN: string; +declare const MODULE: string +declare const OPENAI_DOMAIN: string declare interface EngineSettings { - full_url?: string; - api_key?: string; + full_url?: string + api_key?: string } enum OpenAIChatCompletionModelName { - "gpt-3.5-turbo-instruct" = "gpt-3.5-turbo-instruct", - "gpt-3.5-turbo-instruct-0914" = "gpt-3.5-turbo-instruct-0914", - "gpt-4-1106-preview" = "gpt-4-1106-preview", - "gpt-3.5-turbo-0613" = "gpt-3.5-turbo-0613", - "gpt-3.5-turbo-0301" = "gpt-3.5-turbo-0301", - "gpt-3.5-turbo" = "gpt-3.5-turbo", - "gpt-3.5-turbo-16k-0613" = "gpt-3.5-turbo-16k-0613", - "gpt-3.5-turbo-1106" = "gpt-3.5-turbo-1106", - "gpt-4-vision-preview" = "gpt-4-vision-preview", - "gpt-4" = "gpt-4", - "gpt-4-0314" = "gpt-4-0314", - "gpt-4-0613" = "gpt-4-0613", + 'gpt-3.5-turbo-instruct' = 'gpt-3.5-turbo-instruct', + 'gpt-3.5-turbo-instruct-0914' = 
'gpt-3.5-turbo-instruct-0914', + 'gpt-4-1106-preview' = 'gpt-4-1106-preview', + 'gpt-3.5-turbo-0613' = 'gpt-3.5-turbo-0613', + 'gpt-3.5-turbo-0301' = 'gpt-3.5-turbo-0301', + 'gpt-3.5-turbo' = 'gpt-3.5-turbo', + 'gpt-3.5-turbo-16k-0613' = 'gpt-3.5-turbo-16k-0613', + 'gpt-3.5-turbo-1106' = 'gpt-3.5-turbo-1106', + 'gpt-4-vision-preview' = 'gpt-4-vision-preview', + 'gpt-4' = 'gpt-4', + 'gpt-4-0314' = 'gpt-4-0314', + 'gpt-4-0613' = 'gpt-4-0613', } -declare type OpenAIModel = Omit & { - id: OpenAIChatCompletionModelName; -}; +declare type OpenAIModel = Omit & { + id: OpenAIChatCompletionModelName +} diff --git a/extensions/inference-openai-extension/src/helpers/sse.ts b/extensions/inference-openai-extension/src/helpers/sse.ts index fb75816e7..11db38282 100644 --- a/extensions/inference-openai-extension/src/helpers/sse.ts +++ b/extensions/inference-openai-extension/src/helpers/sse.ts @@ -1,4 +1,4 @@ -import { Observable } from "rxjs"; +import { Observable } from 'rxjs' /** * Sends a request to the inference server to generate a response based on the recent messages. @@ -14,26 +14,26 @@ export function requestInference( controller?: AbortController ): Observable { return new Observable((subscriber) => { - let model_id: string = model.id; + let model_id: string = model.id if (engine.full_url.includes(OPENAI_DOMAIN)) { - model_id = engine.full_url.split("/")[5]; + model_id = engine.full_url.split('/')[5] } const requestBody = JSON.stringify({ messages: recentMessages, stream: true, model: model_id, ...model.parameters, - }); + }) fetch(`${engine.full_url}`, { - method: "POST", + method: 'POST', headers: { - "Content-Type": "application/json", - Accept: model.parameters.stream - ? "text/event-stream" - : "application/json", - "Access-Control-Allow-Origin": "*", - Authorization: `Bearer ${engine.api_key}`, - "api-key": `${engine.api_key}`, + 'Content-Type': 'application/json', + 'Accept': model.parameters.stream + ? 
'text/event-stream' + : 'application/json', + 'Access-Control-Allow-Origin': '*', + 'Authorization': `Bearer ${engine.api_key}`, + 'api-key': `${engine.api_key}`, }, body: requestBody, signal: controller?.signal, @@ -41,41 +41,41 @@ export function requestInference( .then(async (response) => { if (!response.ok) { subscriber.next( - (await response.json()).error?.message ?? "Error occured" - ); - subscriber.complete(); - return; + (await response.json()).error?.message ?? 'Error occurred.' + ) + subscriber.complete() + return } if (model.parameters.stream === false) { - const data = await response.json(); - subscriber.next(data.choices[0]?.message?.content ?? ""); + const data = await response.json() + subscriber.next(data.choices[0]?.message?.content ?? '') } else { - const stream = response.body; - const decoder = new TextDecoder("utf-8"); - const reader = stream?.getReader(); - let content = ""; + const stream = response.body + const decoder = new TextDecoder('utf-8') + const reader = stream?.getReader() + let content = '' while (true && reader) { - const { done, value } = await reader.read(); + const { done, value } = await reader.read() if (done) { - break; + break } - const text = decoder.decode(value); - const lines = text.trim().split("\n"); + const text = decoder.decode(value) + const lines = text.trim().split('\n') for (const line of lines) { - if (line.startsWith("data: ") && !line.includes("data: [DONE]")) { - const data = JSON.parse(line.replace("data: ", "")); - content += data.choices[0]?.delta?.content ?? ""; - if (content.startsWith("assistant: ")) { - content = content.replace("assistant: ", ""); + if (line.startsWith('data: ') && !line.includes('data: [DONE]')) { + const data = JSON.parse(line.replace('data: ', '')) + content += data.choices[0]?.delta?.content ?? 
'' + if (content.startsWith('assistant: ')) { + content = content.replace('assistant: ', '') } - subscriber.next(content); + subscriber.next(content) } } } } - subscriber.complete(); + subscriber.complete() }) - .catch((err) => subscriber.error(err)); - }); + .catch((err) => subscriber.error(err)) + }) } diff --git a/extensions/inference-openai-extension/src/index.ts b/extensions/inference-openai-extension/src/index.ts index fd1230bc7..481171742 100644 --- a/extensions/inference-openai-extension/src/index.ts +++ b/extensions/inference-openai-extension/src/index.ts @@ -18,14 +18,15 @@ import { InferenceEngine, BaseExtension, MessageEvent, + MessageRequestType, ModelEvent, InferenceEvent, AppConfigurationEventName, joinPath, -} from "@janhq/core"; -import { requestInference } from "./helpers/sse"; -import { ulid } from "ulid"; -import { join } from "path"; +} from '@janhq/core' +import { requestInference } from './helpers/sse' +import { ulid } from 'ulid' +import { join } from 'path' /** * A class that implements the InferenceExtension interface from the @janhq/core package. @@ -33,18 +34,18 @@ import { join } from "path"; * It also subscribes to events emitted by the @janhq/core package and handles new message requests. 
*/ export default class JanInferenceOpenAIExtension extends BaseExtension { - private static readonly _engineDir = "file://engines"; - private static readonly _engineMetadataFileName = "openai.json"; + private static readonly _engineDir = 'file://engines' + private static readonly _engineMetadataFileName = 'openai.json' - private static _currentModel: OpenAIModel; + private static _currentModel: OpenAIModel private static _engineSettings: EngineSettings = { - full_url: "https://api.openai.com/v1/chat/completions", - api_key: "sk-", - }; + full_url: 'https://api.openai.com/v1/chat/completions', + api_key: 'sk-', + } - controller = new AbortController(); - isCancelled = false; + controller = new AbortController() + isCancelled = false /** * Subscribes to events emitted by the @janhq/core package. @@ -53,40 +54,40 @@ export default class JanInferenceOpenAIExtension extends BaseExtension { if (!(await fs.existsSync(JanInferenceOpenAIExtension._engineDir))) { await fs .mkdirSync(JanInferenceOpenAIExtension._engineDir) - .catch((err) => console.debug(err)); + .catch((err) => console.debug(err)) } - JanInferenceOpenAIExtension.writeDefaultEngineSettings(); + JanInferenceOpenAIExtension.writeDefaultEngineSettings() // Events subscription events.on(MessageEvent.OnMessageSent, (data) => - JanInferenceOpenAIExtension.handleMessageRequest(data, this), - ); + JanInferenceOpenAIExtension.handleMessageRequest(data, this) + ) events.on(ModelEvent.OnModelInit, (model: OpenAIModel) => { - JanInferenceOpenAIExtension.handleModelInit(model); - }); + JanInferenceOpenAIExtension.handleModelInit(model) + }) events.on(ModelEvent.OnModelStop, (model: OpenAIModel) => { - JanInferenceOpenAIExtension.handleModelStop(model); - }); + JanInferenceOpenAIExtension.handleModelStop(model) + }) events.on(InferenceEvent.OnInferenceStopped, () => { - JanInferenceOpenAIExtension.handleInferenceStopped(this); - }); + JanInferenceOpenAIExtension.handleInferenceStopped(this) + }) const settingsFilePath = 
await joinPath([ JanInferenceOpenAIExtension._engineDir, JanInferenceOpenAIExtension._engineMetadataFileName, - ]); + ]) events.on( AppConfigurationEventName.OnConfigurationUpdate, (settingsKey: string) => { // Update settings on changes if (settingsKey === settingsFilePath) - JanInferenceOpenAIExtension.writeDefaultEngineSettings(); - }, - ); + JanInferenceOpenAIExtension.writeDefaultEngineSettings() + } + ) } /** @@ -98,45 +99,45 @@ export default class JanInferenceOpenAIExtension extends BaseExtension { try { const engineFile = join( JanInferenceOpenAIExtension._engineDir, - JanInferenceOpenAIExtension._engineMetadataFileName, - ); + JanInferenceOpenAIExtension._engineMetadataFileName + ) if (await fs.existsSync(engineFile)) { - const engine = await fs.readFileSync(engineFile, "utf-8"); + const engine = await fs.readFileSync(engineFile, 'utf-8') JanInferenceOpenAIExtension._engineSettings = - typeof engine === "object" ? engine : JSON.parse(engine); + typeof engine === 'object' ? engine : JSON.parse(engine) } else { await fs.writeFileSync( engineFile, - JSON.stringify(JanInferenceOpenAIExtension._engineSettings, null, 2), - ); + JSON.stringify(JanInferenceOpenAIExtension._engineSettings, null, 2) + ) } } catch (err) { - console.error(err); + console.error(err) } } private static async handleModelInit(model: OpenAIModel) { if (model.engine !== InferenceEngine.openai) { - return; + return } else { - JanInferenceOpenAIExtension._currentModel = model; - JanInferenceOpenAIExtension.writeDefaultEngineSettings(); + JanInferenceOpenAIExtension._currentModel = model + JanInferenceOpenAIExtension.writeDefaultEngineSettings() // Todo: Check model list with API key - events.emit(ModelEvent.OnModelReady, model); + events.emit(ModelEvent.OnModelReady, model) } } private static async handleModelStop(model: OpenAIModel) { - if (model.engine !== "openai") { - return; + if (model.engine !== 'openai') { + return } - events.emit(ModelEvent.OnModelStopped, model); + 
events.emit(ModelEvent.OnModelStopped, model) } private static async handleInferenceStopped( - instance: JanInferenceOpenAIExtension, + instance: JanInferenceOpenAIExtension ) { - instance.isCancelled = true; - instance.controller?.abort(); + instance.isCancelled = true + instance.controller?.abort() } /** @@ -147,28 +148,32 @@ export default class JanInferenceOpenAIExtension extends BaseExtension { */ private static async handleMessageRequest( data: MessageRequest, - instance: JanInferenceOpenAIExtension, + instance: JanInferenceOpenAIExtension ) { - if (data.model.engine !== "openai") { - return; + if (data.model.engine !== 'openai') { + return } - const timestamp = Date.now(); + const timestamp = Date.now() const message: ThreadMessage = { id: ulid(), thread_id: data.threadId, + type: data.type, assistant_id: data.assistantId, role: ChatCompletionRole.Assistant, content: [], status: MessageStatus.Pending, created: timestamp, updated: timestamp, - object: "thread.message", - }; - events.emit(MessageEvent.OnMessageResponse, message); + object: 'thread.message', + } - instance.isCancelled = false; - instance.controller = new AbortController(); + if (data.type !== MessageRequestType.Summary) { + events.emit(MessageEvent.OnMessageResponse, message) + } + + instance.isCancelled = false + instance.controller = new AbortController() requestInference( data?.messages ?? 
[], @@ -177,7 +182,7 @@ export default class JanInferenceOpenAIExtension extends BaseExtension { ...JanInferenceOpenAIExtension._currentModel, parameters: data.model.parameters, }, - instance.controller, + instance.controller ).subscribe({ next: (content) => { const messageContent: ThreadContent = { @@ -186,33 +191,33 @@ export default class JanInferenceOpenAIExtension extends BaseExtension { value: content.trim(), annotations: [], }, - }; - message.content = [messageContent]; - events.emit(MessageEvent.OnMessageUpdate, message); + } + message.content = [messageContent] + events.emit(MessageEvent.OnMessageUpdate, message) }, complete: async () => { message.status = message.content.length ? MessageStatus.Ready - : MessageStatus.Error; - events.emit(MessageEvent.OnMessageUpdate, message); + : MessageStatus.Error + events.emit(MessageEvent.OnMessageUpdate, message) }, error: async (err) => { if (instance.isCancelled || message.content.length > 0) { - message.status = MessageStatus.Stopped; - events.emit(MessageEvent.OnMessageUpdate, message); - return; + message.status = MessageStatus.Stopped + events.emit(MessageEvent.OnMessageUpdate, message) + return } const messageContent: ThreadContent = { type: ContentType.Text, text: { - value: "Error occurred: " + err.message, + value: 'Error occurred: ' + err.message, annotations: [], }, - }; - message.content = [messageContent]; - message.status = MessageStatus.Error; - events.emit(MessageEvent.OnMessageUpdate, message); + } + message.content = [messageContent] + message.status = MessageStatus.Error + events.emit(MessageEvent.OnMessageUpdate, message) }, - }); + }) } } diff --git a/extensions/inference-openai-extension/tsconfig.json b/extensions/inference-openai-extension/tsconfig.json index 7bfdd9009..2477d58ce 100644 --- a/extensions/inference-openai-extension/tsconfig.json +++ b/extensions/inference-openai-extension/tsconfig.json @@ -8,7 +8,7 @@ "forceConsistentCasingInFileNames": true, "strict": false, "skipLibCheck": 
true, - "rootDir": "./src", + "rootDir": "./src" }, - "include": ["./src"], + "include": ["./src"] } diff --git a/extensions/inference-openai-extension/webpack.config.js b/extensions/inference-openai-extension/webpack.config.js index 72b7d90c1..ee2e3b624 100644 --- a/extensions/inference-openai-extension/webpack.config.js +++ b/extensions/inference-openai-extension/webpack.config.js @@ -1,16 +1,16 @@ -const path = require("path"); -const webpack = require("webpack"); -const packageJson = require("./package.json"); +const path = require('path') +const webpack = require('webpack') +const packageJson = require('./package.json') module.exports = { experiments: { outputModule: true }, - entry: "./src/index.ts", // Adjust the entry point to match your project's main file - mode: "production", + entry: './src/index.ts', // Adjust the entry point to match your project's main file + mode: 'production', module: { rules: [ { test: /\.tsx?$/, - use: "ts-loader", + use: 'ts-loader', exclude: /node_modules/, }, ], @@ -18,22 +18,22 @@ module.exports = { plugins: [ new webpack.DefinePlugin({ MODULE: JSON.stringify(`${packageJson.name}/${packageJson.module}`), - OPENAI_DOMAIN: JSON.stringify("openai.azure.com"), + OPENAI_DOMAIN: JSON.stringify('openai.azure.com'), }), ], output: { - filename: "index.js", // Adjust the output file name as needed - path: path.resolve(__dirname, "dist"), - library: { type: "module" }, // Specify ESM output format + filename: 'index.js', // Adjust the output file name as needed + path: path.resolve(__dirname, 'dist'), + library: { type: 'module' }, // Specify ESM output format }, resolve: { - extensions: [".ts", ".js"], + extensions: ['.ts', '.js'], fallback: { - path: require.resolve("path-browserify"), + path: require.resolve('path-browserify'), }, }, optimization: { minimize: false, }, // Add loaders and other configuration as needed for your project -}; +} diff --git a/extensions/inference-triton-trtllm-extension/package.json 
b/extensions/inference-triton-trtllm-extension/package.json index 1d27f9f18..455f8030e 100644 --- a/extensions/inference-triton-trtllm-extension/package.json +++ b/extensions/inference-triton-trtllm-extension/package.json @@ -8,7 +8,7 @@ "license": "AGPL-3.0", "scripts": { "build": "tsc -b . && webpack --config webpack.config.js", - "build:publish": "rimraf *.tgz --glob && npm run build && npm pack && cpx *.tgz ../../electron/pre-install" + "build:publish": "rimraf *.tgz --glob && npm run build && npm pack && cpx *.tgz ../../pre-install" }, "exports": { ".": "./dist/index.js", @@ -18,13 +18,13 @@ "cpx": "^1.5.0", "rimraf": "^3.0.2", "webpack": "^5.88.2", - "webpack-cli": "^5.1.4" + "webpack-cli": "^5.1.4", + "ts-loader": "^9.5.0" }, "dependencies": { "@janhq/core": "file:../../core", "fetch-retry": "^5.0.6", "path-browserify": "^1.0.1", - "ts-loader": "^9.5.0", "ulid": "^2.3.0", "rxjs": "^7.8.1" }, diff --git a/extensions/inference-triton-trtllm-extension/src/@types/global.d.ts b/extensions/inference-triton-trtllm-extension/src/@types/global.d.ts index 6224b8e68..c834feba0 100644 --- a/extensions/inference-triton-trtllm-extension/src/@types/global.d.ts +++ b/extensions/inference-triton-trtllm-extension/src/@types/global.d.ts @@ -1,5 +1,5 @@ -import { Model } from "@janhq/core"; +import { Model } from '@janhq/core' declare interface EngineSettings { - base_url?: string; + base_url?: string } diff --git a/extensions/inference-triton-trtllm-extension/src/helpers/sse.ts b/extensions/inference-triton-trtllm-extension/src/helpers/sse.ts index da20fa32d..9aff61265 100644 --- a/extensions/inference-triton-trtllm-extension/src/helpers/sse.ts +++ b/extensions/inference-triton-trtllm-extension/src/helpers/sse.ts @@ -1,6 +1,6 @@ -import { Observable } from "rxjs"; -import { EngineSettings } from "../@types/global"; -import { Model } from "@janhq/core"; +import { Observable } from 'rxjs' +import { EngineSettings } from '../@types/global' +import { Model } from '@janhq/core' /** 
* Sends a request to the inference server to generate a response based on the recent messages. @@ -16,48 +16,48 @@ export function requestInference( controller?: AbortController ): Observable { return new Observable((subscriber) => { - const text_input = recentMessages.map((message) => message.text).join("\n"); + const text_input = recentMessages.map((message) => message.text).join('\n') const requestBody = JSON.stringify({ text_input: text_input, max_tokens: 4096, temperature: 0, - bad_words: "", - stop_words: "[DONE]", - stream: true - }); + bad_words: '', + stop_words: '[DONE]', + stream: true, + }) fetch(`${engine.base_url}/v2/models/ensemble/generate_stream`, { - method: "POST", + method: 'POST', headers: { - "Content-Type": "application/json", - Accept: "text/event-stream", - "Access-Control-Allow-Origin": "*", + 'Content-Type': 'application/json', + 'Accept': 'text/event-stream', + 'Access-Control-Allow-Origin': '*', }, body: requestBody, signal: controller?.signal, }) .then(async (response) => { - const stream = response.body; - const decoder = new TextDecoder("utf-8"); - const reader = stream?.getReader(); - let content = ""; + const stream = response.body + const decoder = new TextDecoder('utf-8') + const reader = stream?.getReader() + let content = '' while (true && reader) { - const { done, value } = await reader.read(); + const { done, value } = await reader.read() if (done) { - break; + break } - const text = decoder.decode(value); - const lines = text.trim().split("\n"); + const text = decoder.decode(value) + const lines = text.trim().split('\n') for (const line of lines) { - if (line.startsWith("data: ") && !line.includes("data: [DONE]")) { - const data = JSON.parse(line.replace("data: ", "")); - content += data.choices[0]?.delta?.content ?? ""; - subscriber.next(content); + if (line.startsWith('data: ') && !line.includes('data: [DONE]')) { + const data = JSON.parse(line.replace('data: ', '')) + content += data.choices[0]?.delta?.content ?? 
'' + subscriber.next(content) } } } - subscriber.complete(); + subscriber.complete() }) - .catch((err) => subscriber.error(err)); - }); + .catch((err) => subscriber.error(err)) + }) } diff --git a/extensions/inference-triton-trtllm-extension/src/index.ts b/extensions/inference-triton-trtllm-extension/src/index.ts index 11ddf7893..f009a81e0 100644 --- a/extensions/inference-triton-trtllm-extension/src/index.ts +++ b/extensions/inference-triton-trtllm-extension/src/index.ts @@ -20,51 +20,49 @@ import { BaseExtension, MessageEvent, ModelEvent, -} from "@janhq/core"; -import { requestInference } from "./helpers/sse"; -import { ulid } from "ulid"; -import { join } from "path"; -import { EngineSettings } from "./@types/global"; +} from '@janhq/core' +import { requestInference } from './helpers/sse' +import { ulid } from 'ulid' +import { join } from 'path' +import { EngineSettings } from './@types/global' /** * A class that implements the InferenceExtension interface from the @janhq/core package. * The class provides methods for initializing and stopping a model, and for making inference requests. * It also subscribes to events emitted by the @janhq/core package and handles new message requests. */ -export default class JanInferenceTritonTrtLLMExtension - extends BaseExtension -{ - private static readonly _homeDir = "file://engines"; - private static readonly _engineMetadataFileName = "triton_trtllm.json"; +export default class JanInferenceTritonTrtLLMExtension extends BaseExtension { + private static readonly _homeDir = 'file://engines' + private static readonly _engineMetadataFileName = 'triton_trtllm.json' - static _currentModel: Model; + static _currentModel: Model static _engineSettings: EngineSettings = { - base_url: "", - }; + base_url: '', + } - controller = new AbortController(); - isCancelled = false; + controller = new AbortController() + isCancelled = false /** * Subscribes to events emitted by the @janhq/core package. 
*/ async onLoad() { if (!(await fs.existsSync(JanInferenceTritonTrtLLMExtension._homeDir))) - JanInferenceTritonTrtLLMExtension.writeDefaultEngineSettings(); + JanInferenceTritonTrtLLMExtension.writeDefaultEngineSettings() // Events subscription events.on(MessageEvent.OnMessageSent, (data) => JanInferenceTritonTrtLLMExtension.handleMessageRequest(data, this) - ); + ) events.on(ModelEvent.OnModelInit, (model: Model) => { - JanInferenceTritonTrtLLMExtension.handleModelInit(model); - }); + JanInferenceTritonTrtLLMExtension.handleModelInit(model) + }) events.on(ModelEvent.OnModelStop, (model: Model) => { - JanInferenceTritonTrtLLMExtension.handleModelStop(model); - }); + JanInferenceTritonTrtLLMExtension.handleModelStop(model) + }) } /** @@ -81,7 +79,7 @@ export default class JanInferenceTritonTrtLLMExtension modelId: string, settings?: ModelSettingParams ): Promise { - return; + return } static async writeDefaultEngineSettings() { @@ -89,11 +87,11 @@ export default class JanInferenceTritonTrtLLMExtension const engine_json = join( JanInferenceTritonTrtLLMExtension._homeDir, JanInferenceTritonTrtLLMExtension._engineMetadataFileName - ); + ) if (await fs.existsSync(engine_json)) { - const engine = await fs.readFileSync(engine_json, "utf-8"); + const engine = await fs.readFileSync(engine_json, 'utf-8') JanInferenceTritonTrtLLMExtension._engineSettings = - typeof engine === "object" ? engine : JSON.parse(engine); + typeof engine === 'object' ? engine : JSON.parse(engine) } else { await fs.writeFileSync( engine_json, @@ -102,10 +100,10 @@ export default class JanInferenceTritonTrtLLMExtension null, 2 ) - ); + ) } } catch (err) { - console.error(err); + console.error(err) } } /** @@ -119,26 +117,26 @@ export default class JanInferenceTritonTrtLLMExtension * @returns {Promise} A promise that resolves when the streaming is stopped. 
*/ async stopInference(): Promise { - this.isCancelled = true; - this.controller?.abort(); + this.isCancelled = true + this.controller?.abort() } private static async handleModelInit(model: Model) { - if (model.engine !== "triton_trtllm") { - return; + if (model.engine !== 'triton_trtllm') { + return } else { - JanInferenceTritonTrtLLMExtension._currentModel = model; - JanInferenceTritonTrtLLMExtension.writeDefaultEngineSettings(); + JanInferenceTritonTrtLLMExtension._currentModel = model + JanInferenceTritonTrtLLMExtension.writeDefaultEngineSettings() // Todo: Check model list with API key - events.emit(ModelEvent.OnModelReady, model); + events.emit(ModelEvent.OnModelReady, model) } } private static async handleModelStop(model: Model) { - if (model.engine !== "triton_trtllm") { - return; + if (model.engine !== 'triton_trtllm') { + return } - events.emit(ModelEvent.OnModelStopped, model); + events.emit(ModelEvent.OnModelStopped, model) } /** @@ -151,11 +149,11 @@ export default class JanInferenceTritonTrtLLMExtension data: MessageRequest, instance: JanInferenceTritonTrtLLMExtension ) { - if (data.model.engine !== "triton_trtllm") { - return; + if (data.model.engine !== 'triton_trtllm') { + return } - const timestamp = Date.now(); + const timestamp = Date.now() const message: ThreadMessage = { id: ulid(), thread_id: data.threadId, @@ -165,12 +163,12 @@ export default class JanInferenceTritonTrtLLMExtension status: MessageStatus.Pending, created: timestamp, updated: timestamp, - object: "thread.message", - }; - events.emit(MessageEvent.OnMessageResponse, message); + object: 'thread.message', + } + events.emit(MessageEvent.OnMessageResponse, message) - instance.isCancelled = false; - instance.controller = new AbortController(); + instance.isCancelled = false + instance.controller = new AbortController() requestInference( data?.messages ?? 
[], @@ -188,33 +186,33 @@ export default class JanInferenceTritonTrtLLMExtension value: content.trim(), annotations: [], }, - }; - message.content = [messageContent]; - events.emit(MessageEvent.OnMessageUpdate, message); + } + message.content = [messageContent] + events.emit(MessageEvent.OnMessageUpdate, message) }, complete: async () => { message.status = message.content.length ? MessageStatus.Ready - : MessageStatus.Error; - events.emit(MessageEvent.OnMessageUpdate, message); + : MessageStatus.Error + events.emit(MessageEvent.OnMessageUpdate, message) }, error: async (err) => { if (instance.isCancelled || message.content.length) { - message.status = MessageStatus.Error; - events.emit(MessageEvent.OnMessageUpdate, message); - return; + message.status = MessageStatus.Error + events.emit(MessageEvent.OnMessageUpdate, message) + return } const messageContent: ThreadContent = { type: ContentType.Text, text: { - value: "Error occurred: " + err.message, + value: 'Error occurred: ' + err.message, annotations: [], }, - }; - message.content = [messageContent]; - message.status = MessageStatus.Ready; - events.emit(MessageEvent.OnMessageUpdate, message); + } + message.content = [messageContent] + message.status = MessageStatus.Ready + events.emit(MessageEvent.OnMessageUpdate, message) }, - }); + }) } } diff --git a/extensions/inference-triton-trtllm-extension/tsconfig.json b/extensions/inference-triton-trtllm-extension/tsconfig.json index 7bfdd9009..2477d58ce 100644 --- a/extensions/inference-triton-trtllm-extension/tsconfig.json +++ b/extensions/inference-triton-trtllm-extension/tsconfig.json @@ -8,7 +8,7 @@ "forceConsistentCasingInFileNames": true, "strict": false, "skipLibCheck": true, - "rootDir": "./src", + "rootDir": "./src" }, - "include": ["./src"], + "include": ["./src"] } diff --git a/extensions/inference-triton-trtllm-extension/webpack.config.js b/extensions/inference-triton-trtllm-extension/webpack.config.js index 57a0adb0a..e83370a1a 100644 --- 
a/extensions/inference-triton-trtllm-extension/webpack.config.js +++ b/extensions/inference-triton-trtllm-extension/webpack.config.js @@ -1,16 +1,16 @@ -const path = require("path"); -const webpack = require("webpack"); -const packageJson = require("./package.json"); +const path = require('path') +const webpack = require('webpack') +const packageJson = require('./package.json') module.exports = { experiments: { outputModule: true }, - entry: "./src/index.ts", // Adjust the entry point to match your project's main file - mode: "production", + entry: './src/index.ts', // Adjust the entry point to match your project's main file + mode: 'production', module: { rules: [ { test: /\.tsx?$/, - use: "ts-loader", + use: 'ts-loader', exclude: /node_modules/, }, ], @@ -21,18 +21,18 @@ module.exports = { }), ], output: { - filename: "index.js", // Adjust the output file name as needed - path: path.resolve(__dirname, "dist"), - library: { type: "module" }, // Specify ESM output format + filename: 'index.js', // Adjust the output file name as needed + path: path.resolve(__dirname, 'dist'), + library: { type: 'module' }, // Specify ESM output format }, resolve: { - extensions: [".ts", ".js"], + extensions: ['.ts', '.js'], fallback: { - path: require.resolve("path-browserify"), + path: require.resolve('path-browserify'), }, }, optimization: { minimize: false, }, // Add loaders and other configuration as needed for your project -}; +} diff --git a/extensions/model-extension/.prettierrc b/extensions/model-extension/.prettierrc deleted file mode 100644 index 46f1abcb0..000000000 --- a/extensions/model-extension/.prettierrc +++ /dev/null @@ -1,8 +0,0 @@ -{ - "semi": false, - "singleQuote": true, - "quoteProps": "consistent", - "trailingComma": "es5", - "endOfLine": "auto", - "plugins": ["prettier-plugin-tailwindcss"] -} diff --git a/extensions/model-extension/package.json b/extensions/model-extension/package.json index 86f177d14..e99122bcf 100644 --- 
a/extensions/model-extension/package.json +++ b/extensions/model-extension/package.json @@ -1,6 +1,6 @@ { "name": "@janhq/model-extension", - "version": "1.0.23", + "version": "1.0.25", "description": "Model Management Extension provides model exploration and seamless downloads", "main": "dist/index.js", "module": "dist/module.js", @@ -8,13 +8,14 @@ "license": "AGPL-3.0", "scripts": { "build": "tsc -b . && webpack --config webpack.config.js", - "build:publish": "rimraf *.tgz --glob && npm run build && npm pack && cpx *.tgz ../../electron/pre-install" + "build:publish": "rimraf *.tgz --glob && npm run build && npm pack && cpx *.tgz ../../pre-install" }, "devDependencies": { "cpx": "^1.5.0", "rimraf": "^3.0.2", "webpack": "^5.88.2", - "webpack-cli": "^5.1.4" + "webpack-cli": "^5.1.4", + "ts-loader": "^9.5.0" }, "files": [ "dist/*", @@ -23,7 +24,6 @@ ], "dependencies": { "@janhq/core": "file:../../core", - "path-browserify": "^1.0.1", - "ts-loader": "^9.5.0" + "path-browserify": "^1.0.1" } } diff --git a/extensions/model-extension/src/@types/global.d.ts b/extensions/model-extension/src/@types/global.d.ts index e998455f2..7a9202a62 100644 --- a/extensions/model-extension/src/@types/global.d.ts +++ b/extensions/model-extension/src/@types/global.d.ts @@ -1,3 +1,15 @@ -declare const EXTENSION_NAME: string -declare const MODULE_PATH: string -declare const VERSION: stringå +export {} +declare global { + declare const EXTENSION_NAME: string + declare const MODULE_PATH: string + declare const VERSION: string + + interface Core { + api: APIFunctions + events: EventEmitter + } + interface Window { + core?: Core | undefined + electronAPI?: any | undefined + } +} diff --git a/extensions/model-extension/src/helpers/path.ts b/extensions/model-extension/src/helpers/path.ts new file mode 100644 index 000000000..cbb151aa6 --- /dev/null +++ b/extensions/model-extension/src/helpers/path.ts @@ -0,0 +1,11 @@ +/** + * try to retrieve the download file name from the source url + */ + 
+export function extractFileName(url: string, fileExtension: string): string { + const extractedFileName = url.split('/').pop() + const fileName = extractedFileName.toLowerCase().endsWith(fileExtension) + ? extractedFileName + : extractedFileName + fileExtension + return fileName +} diff --git a/extensions/model-extension/src/index.ts b/extensions/model-extension/src/index.ts index b9fa7731e..926e65ee5 100644 --- a/extensions/model-extension/src/index.ts +++ b/extensions/model-extension/src/index.ts @@ -8,8 +8,15 @@ import { ModelExtension, Model, getJanDataFolderPath, + events, + DownloadEvent, + DownloadRoute, + ModelEvent, + DownloadState, } from '@janhq/core' +import { extractFileName } from './helpers/path' + /** * A extension for models */ @@ -29,6 +36,8 @@ export default class JanModelExtension extends ModelExtension { */ async onLoad() { this.copyModelsToHomeDir() + // Handle Desktop Events + this.handleDesktopEvents() } /** @@ -61,6 +70,8 @@ export default class JanModelExtension extends ModelExtension { // Finished migration localStorage.setItem(`${EXTENSION_NAME}-version`, VERSION) + + events.emit(ModelEvent.OnModelsUpdate, {}) } catch (err) { console.error(err) } @@ -83,31 +94,66 @@ export default class JanModelExtension extends ModelExtension { if (model.sources.length > 1) { // path to model binaries for (const source of model.sources) { - let path = this.extractFileName(source.url) + let path = extractFileName( + source.url, + JanModelExtension._supportedModelFormat + ) if (source.filename) { path = await joinPath([modelDirPath, source.filename]) } downloadFile(source.url, path, network) } + // TODO: handle multiple binaries for web later } else { - const fileName = this.extractFileName(model.sources[0]?.url) + const fileName = extractFileName( + model.sources[0]?.url, + JanModelExtension._supportedModelFormat + ) const path = await joinPath([modelDirPath, fileName]) downloadFile(model.sources[0]?.url, path, network) + + if (window && 
window.core?.api && window.core.api.baseApiUrl) { + this.startPollingDownloadProgress(model.id) + } } } /** - * try to retrieve the download file name from the source url + * Specifically for Jan server. */ - private extractFileName(url: string): string { - const extractedFileName = url.split('/').pop() - const fileName = extractedFileName - .toLowerCase() - .endsWith(JanModelExtension._supportedModelFormat) - ? extractedFileName - : extractedFileName + JanModelExtension._supportedModelFormat - return fileName + private async startPollingDownloadProgress(modelId: string): Promise { + // wait for some seconds before polling + await new Promise((resolve) => setTimeout(resolve, 3000)) + + return new Promise((resolve) => { + const interval = setInterval(async () => { + fetch( + `${window.core.api.baseApiUrl}/v1/download/${DownloadRoute.getDownloadProgress}/${modelId}`, + { + method: 'GET', + headers: { contentType: 'application/json' }, + } + ).then(async (res) => { + const state: DownloadState = await res.json() + if (state.downloadState === 'end') { + events.emit(DownloadEvent.onFileDownloadSuccess, state) + clearInterval(interval) + resolve() + return + } + + if (state.downloadState === 'error') { + events.emit(DownloadEvent.onFileDownloadError, state) + clearInterval(interval) + resolve() + return + } + + events.emit(DownloadEvent.onFileDownloadUpdate, state) + }) + }, 1000) + }) } /** @@ -174,15 +220,20 @@ export default class JanModelExtension extends ModelExtension { async getDownloadedModels(): Promise { return await this.getModelsMetadata( async (modelDir: string, model: Model) => { - if (model.engine !== JanModelExtension._offlineInferenceEngine) { + if (model.engine !== JanModelExtension._offlineInferenceEngine) return true - } + + // model binaries (sources) are absolute path & exist + const existFiles = await Promise.all( + model.sources.map((source) => fs.existsSync(source.url)) + ) + if (existFiles.every((exist) => exist)) return true + return await fs 
.readdirSync(await joinPath([JanModelExtension._homeDir, modelDir])) .then((files: string[]) => { - // or model binary exists in the directory - // model binary name can match model ID or be a .gguf file and not be an incompleted model file - // TODO: Check diff between urls, filenames + // Model binary exists in the directory + // Model binary name can match model ID or be a .gguf file and not be an incompleted model file return ( files.includes(modelDir) || files.filter( @@ -228,8 +279,19 @@ export default class JanModelExtension extends ModelExtension { if (await fs.existsSync(jsonPath)) { // if we have the model.json file, read it let model = await this.readModelMetadata(jsonPath) + model = typeof model === 'object' ? model : JSON.parse(model) + // This to ensure backward compatibility with `model.json` with `source_url` + if (model['source_url'] != null) { + model['sources'] = [ + { + filename: model.id, + url: model['source_url'], + }, + ] + } + if (selector && !(await selector?.(dirName, model))) { return } @@ -243,31 +305,18 @@ export default class JanModelExtension extends ModelExtension { }) const results = await Promise.allSettled(readJsonPromises) const modelData = results.map((result) => { - if (result.status === 'fulfilled') { + if (result.status === 'fulfilled' && result.value) { try { - // This to ensure backward compatibility with `model.json` with `source_url` - const tmpModel = + const model = typeof result.value === 'object' ? 
result.value : JSON.parse(result.value) - if (tmpModel['source_url'] != null) { - tmpModel['source'] = [ - { - filename: tmpModel.id, - url: tmpModel['source_url'], - }, - ] - } - - return tmpModel as Model + return model as Model } catch { console.debug(`Unable to parse model metadata: ${result.value}`) - return undefined } - } else { - console.error(result.reason) - return undefined } + return undefined }) return modelData.filter((e) => !!e) @@ -318,7 +367,7 @@ export default class JanModelExtension extends ModelExtension { return } - const defaultModel = await this.getDefaultModel() as Model + const defaultModel = (await this.getDefaultModel()) as Model if (!defaultModel) { console.error('Unable to find default model') return @@ -382,4 +431,28 @@ export default class JanModelExtension extends ModelExtension { async getConfiguredModels(): Promise { return this.getModelsMetadata() } + + handleDesktopEvents() { + if (window && window.electronAPI) { + window.electronAPI.onFileDownloadUpdate( + async (_event: string, state: DownloadState | undefined) => { + if (!state) return + state.downloadState = 'downloading' + events.emit(DownloadEvent.onFileDownloadUpdate, state) + } + ) + window.electronAPI.onFileDownloadError( + async (_event: string, state: DownloadState) => { + state.downloadState = 'error' + events.emit(DownloadEvent.onFileDownloadError, state) + } + ) + window.electronAPI.onFileDownloadSuccess( + async (_event: string, state: DownloadState) => { + state.downloadState = 'end' + events.emit(DownloadEvent.onFileDownloadSuccess, state) + } + ) + } + } } diff --git a/extensions/monitoring-extension/package.json b/extensions/monitoring-extension/package.json index 20d3c485f..582f7cd7b 100644 --- a/extensions/monitoring-extension/package.json +++ b/extensions/monitoring-extension/package.json @@ -8,17 +8,17 @@ "license": "AGPL-3.0", "scripts": { "build": "tsc -b . 
&& webpack --config webpack.config.js", - "build:publish": "rimraf *.tgz --glob && npm run build && npm pack && cpx *.tgz ../../electron/pre-install" + "build:publish": "rimraf *.tgz --glob && npm run build && npm pack && cpx *.tgz ../../pre-install" }, "devDependencies": { "rimraf": "^3.0.2", "webpack": "^5.88.2", - "webpack-cli": "^5.1.4" + "webpack-cli": "^5.1.4", + "ts-loader": "^9.5.0" }, "dependencies": { "@janhq/core": "file:../../core", - "node-os-utils": "^1.3.7", - "ts-loader": "^9.5.0" + "node-os-utils": "^1.3.7" }, "files": [ "dist/*", diff --git a/extensions/monitoring-extension/src/@types/global.d.ts b/extensions/monitoring-extension/src/@types/global.d.ts index 3b45ccc5a..8106353cf 100644 --- a/extensions/monitoring-extension/src/@types/global.d.ts +++ b/extensions/monitoring-extension/src/@types/global.d.ts @@ -1 +1 @@ -declare const MODULE: string; +declare const MODULE: string diff --git a/extensions/monitoring-extension/src/index.ts b/extensions/monitoring-extension/src/index.ts index 9297a770f..ce9b2fc14 100644 --- a/extensions/monitoring-extension/src/index.ts +++ b/extensions/monitoring-extension/src/index.ts @@ -1,4 +1,4 @@ -import { MonitoringExtension, executeOnMain } from "@janhq/core"; +import { MonitoringExtension, executeOnMain } from '@janhq/core' /** * JanMonitoringExtension is a extension that provides system monitoring functionality. @@ -20,7 +20,7 @@ export default class JanMonitoringExtension extends MonitoringExtension { * @returns A Promise that resolves to an object containing information about the system resources. */ getResourcesInfo(): Promise { - return executeOnMain(MODULE, "getResourcesInfo"); + return executeOnMain(MODULE, 'getResourcesInfo') } /** @@ -28,6 +28,6 @@ export default class JanMonitoringExtension extends MonitoringExtension { * @returns A Promise that resolves to an object containing information about the current system load. 
*/ getCurrentLoad(): Promise { - return executeOnMain(MODULE, "getCurrentLoad"); + return executeOnMain(MODULE, 'getCurrentLoad') } } diff --git a/extensions/monitoring-extension/src/module.ts b/extensions/monitoring-extension/src/module.ts index 2c1b14343..27781a5d6 100644 --- a/extensions/monitoring-extension/src/module.ts +++ b/extensions/monitoring-extension/src/module.ts @@ -1,73 +1,92 @@ -const nodeOsUtils = require("node-os-utils"); -const getJanDataFolderPath = require("@janhq/core/node").getJanDataFolderPath; -const path = require("path"); -const { readFileSync } = require("fs"); -const exec = require("child_process").exec; +const nodeOsUtils = require('node-os-utils') +const getJanDataFolderPath = require('@janhq/core/node').getJanDataFolderPath +const path = require('path') +const { readFileSync } = require('fs') +const exec = require('child_process').exec const NVIDIA_INFO_FILE = path.join( getJanDataFolderPath(), - "settings", - "settings.json" -); + 'settings', + 'settings.json' +) const getResourcesInfo = () => new Promise((resolve) => { nodeOsUtils.mem.used().then((ramUsedInfo) => { - const totalMemory = ramUsedInfo.totalMemMb * 1024 * 1024; - const usedMemory = ramUsedInfo.usedMemMb * 1024 * 1024; + const totalMemory = ramUsedInfo.totalMemMb * 1024 * 1024 + const usedMemory = ramUsedInfo.usedMemMb * 1024 * 1024 const response = { mem: { totalMemory, usedMemory, }, - }; - resolve(response); - }); - }); + } + resolve(response) + }) + }) const getCurrentLoad = () => new Promise((resolve, reject) => { nodeOsUtils.cpu.usage().then((cpuPercentage) => { let data = { - run_mode: "cpu", + run_mode: 'cpu', gpus_in_use: [], - }; - if (process.platform !== "darwin") { - data = JSON.parse(readFileSync(NVIDIA_INFO_FILE, "utf-8")); } - if (data.run_mode === "gpu" && data.gpus_in_use.length > 0) { - const gpuIds = data["gpus_in_use"].join(","); - if (gpuIds !== "") { + if (process.platform !== 'darwin') { + data = JSON.parse(readFileSync(NVIDIA_INFO_FILE, 
'utf-8')) + } + if (data.run_mode === 'gpu' && data.gpus_in_use.length > 0) { + const gpuIds = data['gpus_in_use'].join(',') + if (gpuIds !== '' && data['vulkan'] !== true) { exec( `nvidia-smi --query-gpu=index,name,temperature.gpu,utilization.gpu,memory.total,memory.free,utilization.memory --format=csv,noheader,nounits --id=${gpuIds}`, - (error, stdout, stderr) => { + (error, stdout, _) => { if (error) { - console.error(`exec error: ${error}`); - reject(error); - return; + console.error(`exec error: ${error}`) + reject(error) + return } - const gpuInfo = stdout.trim().split("\n").map((line) => { - const [id, name, temperature, utilization, memoryTotal, memoryFree, memoryUtilization] = line.split(", ").map(item => item.replace(/\r/g, "")); - return { id, name, temperature, utilization, memoryTotal, memoryFree, memoryUtilization }; - }); + const gpuInfo = stdout + .trim() + .split('\n') + .map((line) => { + const [ + id, + name, + temperature, + utilization, + memoryTotal, + memoryFree, + memoryUtilization, + ] = line.split(', ').map((item) => item.replace(/\r/g, '')) + return { + id, + name, + temperature, + utilization, + memoryTotal, + memoryFree, + memoryUtilization, + } + }) resolve({ cpu: { usage: cpuPercentage }, - gpu: gpuInfo - }); + gpu: gpuInfo, + }) } - ); + ) } else { // Handle the case where gpuIds is empty - resolve({ cpu: { usage: cpuPercentage }, gpu: [] }); + resolve({ cpu: { usage: cpuPercentage }, gpu: [] }) } } else { // Handle the case where run_mode is not 'gpu' or no GPUs are in use - resolve({ cpu: { usage: cpuPercentage }, gpu: [] }); + resolve({ cpu: { usage: cpuPercentage }, gpu: [] }) } - }); - }); + }) + }) module.exports = { getResourcesInfo, getCurrentLoad, -}; \ No newline at end of file +} diff --git a/extensions/monitoring-extension/webpack.config.js b/extensions/monitoring-extension/webpack.config.js index f54059222..c8c3a34f7 100644 --- a/extensions/monitoring-extension/webpack.config.js +++ 
b/extensions/monitoring-extension/webpack.config.js @@ -1,24 +1,24 @@ -const path = require("path"); -const webpack = require("webpack"); -const packageJson = require("./package.json"); +const path = require('path') +const webpack = require('webpack') +const packageJson = require('./package.json') module.exports = { experiments: { outputModule: true }, - entry: "./src/index.ts", // Adjust the entry point to match your project's main file - mode: "production", + entry: './src/index.ts', // Adjust the entry point to match your project's main file + mode: 'production', module: { rules: [ { test: /\.tsx?$/, - use: "ts-loader", + use: 'ts-loader', exclude: /node_modules/, }, ], }, output: { - filename: "index.js", // Adjust the output file name as needed - path: path.resolve(__dirname, "dist"), - library: { type: "module" }, // Specify ESM output format + filename: 'index.js', // Adjust the output file name as needed + path: path.resolve(__dirname, 'dist'), + library: { type: 'module' }, // Specify ESM output format }, plugins: [ new webpack.DefinePlugin({ @@ -26,10 +26,10 @@ module.exports = { }), ], resolve: { - extensions: [".ts", ".js"], + extensions: ['.ts', '.js'], }, optimization: { minimize: false, }, // Add loaders and other configuration as needed for your project -}; +} diff --git a/models/dolphin-phi-2/model.json b/models/dolphin-phi-2/model.json new file mode 100644 index 000000000..c25ff8f69 --- /dev/null +++ b/models/dolphin-phi-2/model.json @@ -0,0 +1,32 @@ +{ + "sources": [ + { + "url": "https://huggingface.co/TheBloke/dolphin-2_6-phi-2-GGUF/resolve/main/dolphin-2_6-phi-2.Q8_0.gguf", + "filename": "dolphin-2_6-phi-2.Q8_0.gguf" + } + ], + "id": "dolphin-phi-2", + "object": "model", + "name": "Dolphin Phi-2 2.7B Q8", + "version": "1.0", + "description": "Dolphin Phi-2 is a 2.7B model, fine-tuned for chat, excelling in common sense and logical reasoning benchmarks.", + "format": "gguf", + "settings": { + "ctx_len": 4096, + "prompt_template": 
"<|im_start|>system\n{system_message}<|im_end|>\n<|im_start|>user\n{prompt}<|im_end|>\n<|im_start|>assistant", + "llama_model_path": "dolphin-2_6-phi-2.Q8_0.gguf" + }, + "parameters": { + "max_tokens": 4096, + "stop": ["<|im_end|>"] + }, + "metadata": { + "author": "Cognitive Computations, Microsoft", + "tags": [ + "3B", + "Finetuned" + ], + "size": 2960000000 + }, + "engine": "nitro" + } diff --git a/models/llamacorn-1.1b/model.json b/models/llamacorn-1.1b/model.json new file mode 100644 index 000000000..056fb9050 --- /dev/null +++ b/models/llamacorn-1.1b/model.json @@ -0,0 +1,37 @@ +{ + "sources": [ + { + "url":"https://huggingface.co/janhq/llamacorn-1.1b-chat-GGUF/resolve/main/llamacorn-1.1b-chat.Q8_0.gguf", + "filename": "llamacorn-1.1b-chat.Q8_0.gguf" + } + ], + "id": "llamacorn-1.1b", + "object": "model", + "name": "LlamaCorn 1.1B Q8", + "version": "1.0", + "description": "LlamaCorn is designed to improve chat functionality from TinyLlama.", + "format": "gguf", + "settings": { + "ctx_len": 2048, + "prompt_template": "<|im_start|>system\n{system_message}<|im_end|>\n<|im_start|>user\n{prompt}<|im_end|>\n<|im_start|>assistant", + "llama_model_path": "llamacorn-1.1b-chat.Q8_0.gguf" + }, + "parameters": { + "temperature": 0.7, + "top_p": 0.95, + "stream": true, + "max_tokens": 2048, + "stop": [], + "frequency_penalty": 0, + "presence_penalty": 0 + }, + "metadata": { + "author": "Jan", + "tags": [ + "Tiny", + "Finetuned" + ], + "size": 1170000000 + }, + "engine": "nitro" + } \ No newline at end of file diff --git a/models/mistral-ins-7b-q4/cover.png b/models/mistral-ins-7b-q4/cover.png index 000445ecb..73b82e599 100644 Binary files a/models/mistral-ins-7b-q4/cover.png and b/models/mistral-ins-7b-q4/cover.png differ diff --git a/models/mistral-ins-7b-q4/model.json b/models/mistral-ins-7b-q4/model.json index bfdaffa90..75e0cbf9f 100644 --- a/models/mistral-ins-7b-q4/model.json +++ b/models/mistral-ins-7b-q4/model.json @@ -29,7 +29,7 @@ "author": "MistralAI, The 
Bloke", "tags": ["Featured", "7B", "Foundational Model"], "size": 4370000000, - "cover": "https://raw.githubusercontent.com/janhq/jan/main/models/mistral-ins-7b-q4/cover.png" + "cover": "https://raw.githubusercontent.com/janhq/jan/dev/models/mistral-ins-7b-q4/cover.png" }, "engine": "nitro" } diff --git a/models/openchat-3.5-7b/model.json b/models/openchat-3.5-7b/model.json index 294f7d269..18db33f8e 100644 --- a/models/openchat-3.5-7b/model.json +++ b/models/openchat-3.5-7b/model.json @@ -1,8 +1,8 @@ { "sources": [ { - "filename": "openchat-3.5-1210.Q4_K_M.gguf", - "url": "https://huggingface.co/TheBloke/openchat-3.5-1210-GGUF/resolve/main/openchat-3.5-1210.Q4_K_M.gguf" + "filename": "openchat-3.5-0106.Q4_K_M.gguf", + "url": "https://huggingface.co/TheBloke/openchat-3.5-0106-GGUF/resolve/main/openchat-3.5-0106.Q4_K_M.gguf" } ], "id": "openchat-3.5-7b", @@ -14,7 +14,7 @@ "settings": { "ctx_len": 4096, "prompt_template": "GPT4 Correct User: {prompt}<|end_of_turn|>GPT4 Correct Assistant:", - "llama_model_path": "openchat-3.5-1210.Q4_K_M.gguf" + "llama_model_path": "openchat-3.5-0106.Q4_K_M.gguf" }, "parameters": { "temperature": 0.7, diff --git a/models/openhermes-neural-7b/cover.png b/models/openhermes-neural-7b/cover.png index 5b9da0aef..8976d8449 100644 Binary files a/models/openhermes-neural-7b/cover.png and b/models/openhermes-neural-7b/cover.png differ diff --git a/models/openhermes-neural-7b/model.json b/models/openhermes-neural-7b/model.json index 87e1df143..a13a0f2b8 100644 --- a/models/openhermes-neural-7b/model.json +++ b/models/openhermes-neural-7b/model.json @@ -28,7 +28,7 @@ "author": "Intel, Jan", "tags": ["7B", "Merged", "Featured"], "size": 4370000000, - "cover": "https://raw.githubusercontent.com/janhq/jan/main/models/openhermes-neural-7b/cover.png" + "cover": "https://raw.githubusercontent.com/janhq/jan/dev/models/openhermes-neural-7b/cover.png" }, "engine": "nitro" } diff --git a/models/stable-zephyr-3b/model.json 
b/models/stable-zephyr-3b/model.json new file mode 100644 index 000000000..724299ea5 --- /dev/null +++ b/models/stable-zephyr-3b/model.json @@ -0,0 +1,34 @@ +{ + "sources": [ + { + "url": "https://huggingface.co/TheBloke/stablelm-zephyr-3b-GGUF/resolve/main/stablelm-zephyr-3b.Q8_0.gguf", + "filename": "stablelm-zephyr-3b.Q8_0.gguf" + } + ], + "id": "stable-zephyr-3b", + "object": "model", + "name": "Stable Zephyr 3B Q8", + "version": "1.0", + "description": "StableLM Zephyr 3B is trained for safe and reliable chatting.", + "format": "gguf", + "settings": { + "ctx_len": 4096, + "prompt_template": "<|user|>\n{prompt}<|endoftext|>\n<|assistant|>", + "llama_model_path": "stablelm-zephyr-3b.Q8_0.gguf" + }, + "parameters": { + "temperature": 0.7, + "top_p": 0.95, + "stream": true, + "max_tokens": 4096, + "stop": ["<|endoftext|>"], + "frequency_penalty": 0, + "presence_penalty": 0 + }, + "metadata": { + "author": "StabilityAI", + "tags": ["3B", "Finetuned"], + "size": 2970000000 + }, + "engine": "nitro" + } \ No newline at end of file diff --git a/models/trinity-v1.2-7b/cover.png b/models/trinity-v1.2-7b/cover.png index a548e3c17..fbef0bb56 100644 Binary files a/models/trinity-v1.2-7b/cover.png and b/models/trinity-v1.2-7b/cover.png differ diff --git a/models/trinity-v1.2-7b/model.json b/models/trinity-v1.2-7b/model.json index 2dda120e6..947629642 100644 --- a/models/trinity-v1.2-7b/model.json +++ b/models/trinity-v1.2-7b/model.json @@ -28,7 +28,7 @@ "author": "Jan", "tags": ["7B", "Merged", "Featured"], "size": 4370000000, - "cover": "https://raw.githubusercontent.com/janhq/jan/main/models/trinity-v1.2-7b/cover.png" + "cover": "https://raw.githubusercontent.com/janhq/jan/dev/models/trinity-v1.2-7b/cover.png" }, "engine": "nitro" } diff --git a/models/yarn-mistral-7b/model.json b/models/yarn-mistral-7b/model.json deleted file mode 100644 index ee6de1319..000000000 --- a/models/yarn-mistral-7b/model.json +++ /dev/null @@ -1,31 +0,0 @@ -{ - "sources": [ - { - "url": 
"https://huggingface.co/TheBloke/Yarn-Mistral-7B-128k-GGUF/resolve/main/yarn-mistral-7b-128k.Q4_K_M.gguf" - } - ], - "id": "yarn-mistral-7b", - "object": "model", - "name": "Yarn Mistral 7B Q4", - "version": "1.0", - "description": "Yarn Mistral 7B is a language model for long context and supports a 128k token context window.", - "format": "gguf", - "settings": { - "ctx_len": 4096, - "prompt_template": "{prompt}" - }, - "parameters": { - "temperature": 0.7, - "top_p": 0.95, - "stream": true, - "max_tokens": 4096, - "frequency_penalty": 0, - "presence_penalty": 0 - }, - "metadata": { - "author": "NousResearch, The Bloke", - "tags": ["7B", "Finetuned"], - "size": 4370000000 - }, - "engine": "nitro" -} diff --git a/package.json b/package.json index 4b8bc4af0..957934fda 100644 --- a/package.json +++ b/package.json @@ -21,22 +21,23 @@ "lint": "yarn workspace jan lint && yarn workspace jan-web lint", "test:unit": "yarn workspace @janhq/core test", "test": "yarn workspace jan test:e2e", - "copy:assets": "cpx \"models/**\" \"electron/models/\" && cpx \"docs/openapi/**\" \"electron/docs/openapi\"", + "copy:assets": "cpx \"models/**\" \"electron/models/\" && cpx \"pre-install/*.tgz\" \"electron/pre-install/\" && cpx \"docs/openapi/**\" \"electron/docs/openapi\"", "dev:electron": "yarn copy:assets && yarn workspace jan dev", "dev:web": "yarn workspace jan-web dev", - "dev:server": "yarn workspace @janhq/server dev", + "dev:server": "yarn copy:assets && yarn workspace @janhq/server dev", "dev": "concurrently --kill-others \"yarn dev:web\" \"wait-on http://localhost:3000 && yarn dev:electron\"", "test-local": "yarn lint && yarn build:test && yarn test", "dev:uikit": "yarn workspace @janhq/uikit install && yarn workspace @janhq/uikit dev", "build:uikit": "yarn workspace @janhq/uikit install && yarn workspace @janhq/uikit build", - "build:server": "cd server && yarn install && yarn run build", + "build:server": "yarn copy:assets && cd server && yarn install && yarn run build", 
"build:core": "cd core && yarn install && yarn run build", "build:web": "yarn workspace jan-web build && cpx \"web/out/**\" \"electron/renderer/\"", "build:electron": "yarn copy:assets && yarn workspace jan build", "build:electron:test": "yarn workspace jan build:test", - "build:extensions:windows": "rimraf ./electron/pre-install/*.tgz && powershell -command \"$jobs = Get-ChildItem -Path './extensions' -Directory | ForEach-Object { Start-Job -Name ($_.Name) -ScriptBlock { param($_dir); try { Set-Location $_dir; npm install; npm run build:publish; Write-Output 'Build successful in ' + $_dir } catch { Write-Error 'Error in ' + $_dir; throw } } -ArgumentList $_.FullName }; $jobs | Wait-Job; $jobs | ForEach-Object { Receive-Job -Job $_ -Keep } | ForEach-Object { Write-Host $_ }; $failed = $jobs | Where-Object { $_.State -ne 'Completed' -or $_.ChildJobs[0].JobStateInfo.State -ne 'Completed' }; if ($failed) { Exit 1 }\"", - "build:extensions:linux": "rimraf ./electron/pre-install/*.tgz && find ./extensions -mindepth 1 -maxdepth 1 -type d -print0 | xargs -0 -n 1 -P 4 -I {} sh -c 'cd {} && npm install && npm run build:publish'", - "build:extensions:darwin": "rimraf ./electron/pre-install/*.tgz && find ./extensions -mindepth 1 -maxdepth 1 -type d -print0 | xargs -0 -n 1 -P 4 -I {} sh -c 'cd {} && npm install && npm run build:publish'", + "build:extensions:windows": "rimraf ./pre-install/*.tgz && powershell -command \"$jobs = Get-ChildItem -Path './extensions' -Directory | ForEach-Object { Start-Job -Name ($_.Name) -ScriptBlock { param($_dir); try { Set-Location $_dir; npm install; npm run build:publish; Write-Output 'Build successful in ' + $_dir } catch { Write-Error 'Error in ' + $_dir; throw } } -ArgumentList $_.FullName }; $jobs | Wait-Job; $jobs | ForEach-Object { Receive-Job -Job $_ -Keep } | ForEach-Object { Write-Host $_ }; $failed = $jobs | Where-Object { $_.State -ne 'Completed' -or $_.ChildJobs[0].JobStateInfo.State -ne 'Completed' }; if ($failed) { Exit 1 }\"", 
+ "build:extensions:linux": "rimraf ./pre-install/*.tgz && find ./extensions -mindepth 1 -maxdepth 1 -type d -print0 | xargs -0 -n 1 -P 4 -I {} sh -c 'cd {} && npm install && npm run build:publish'", + "build:extensions:darwin": "rimraf ./pre-install/*.tgz && find ./extensions -mindepth 1 -maxdepth 1 -type d -print0 | xargs -0 -n 1 -P 4 -I {} sh -c 'cd {} && npm install && npm run build:publish'", + "build:extensions:server": "yarn workspace build:extensions ", "build:extensions": "run-script-os", "build:test": "yarn copy:assets && yarn build:web && yarn workspace jan build:test", "build": "yarn build:web && yarn build:electron", diff --git a/pre-install/.gitkeep b/pre-install/.gitkeep new file mode 100644 index 000000000..e69de29bb diff --git a/server/helpers/setup.ts b/server/helpers/setup.ts new file mode 100644 index 000000000..7d8f8914a --- /dev/null +++ b/server/helpers/setup.ts @@ -0,0 +1,73 @@ +import { join, extname } from 'path' +import { existsSync, readdirSync, writeFileSync, mkdirSync } from 'fs' +import { init, installExtensions } from '@janhq/core/node' + +export async function setup() { + /** + * Setup Jan Data Directory + */ + const appDir = process.env.JAN_DATA_DIRECTORY ?? join(__dirname, '..', 'jan') + + console.debug(`Create app data directory at ${appDir}...`) + if (!existsSync(appDir)) mkdirSync(appDir) + //@ts-ignore + global.core = { + // Define appPath function for app to retrieve app path globaly + appPath: () => appDir, + } + init({ + extensionsPath: join(appDir, 'extensions'), + }) + + /** + * Write app configurations. 
See #1619 + */ + console.debug('Writing config file...') + writeFileSync( + join(appDir, 'settings.json'), + JSON.stringify({ + data_folder: appDir, + }), + 'utf-8' + ) + + if (!existsSync(join(appDir, 'settings'))) { + console.debug('Writing nvidia config file...') + mkdirSync(join(appDir, 'settings')) + writeFileSync( + join(appDir, 'settings', 'settings.json'), + JSON.stringify( + { + notify: true, + run_mode: 'cpu', + nvidia_driver: { + exist: false, + version: '', + }, + cuda: { + exist: false, + version: '', + }, + gpus: [], + gpu_highest_vram: '', + gpus_in_use: [], + is_initial: true, + }), + 'utf-8' + ) + } + + /** + * Install extensions + */ + + console.debug('Installing extensions...') + + const baseExtensionPath = join(__dirname, '../../..', 'pre-install') + const extensions = readdirSync(baseExtensionPath) + .filter((file) => extname(file) === '.tgz') + .map((file) => join(baseExtensionPath, file)) + + await installExtensions(extensions) + console.debug('Extensions installed') +} diff --git a/server/index.ts b/server/index.ts index 05bfdca96..98cc8385d 100644 --- a/server/index.ts +++ b/server/index.ts @@ -1,26 +1,27 @@ -import fastify from "fastify"; -import dotenv from "dotenv"; +import fastify from 'fastify' +import dotenv from 'dotenv' import { getServerLogPath, v1Router, logServer, getJanExtensionsPath, -} from "@janhq/core/node"; -import { join } from "path"; +} from '@janhq/core/node' +import { join } from 'path' +import tcpPortUsed from 'tcp-port-used' // Load environment variables -dotenv.config(); +dotenv.config() // Define default settings -const JAN_API_HOST = process.env.JAN_API_HOST || "127.0.0.1"; -const JAN_API_PORT = Number.parseInt(process.env.JAN_API_PORT || "1337"); +const JAN_API_HOST = process.env.JAN_API_HOST || '127.0.0.1' +const JAN_API_PORT = Number.parseInt(process.env.JAN_API_PORT || '1337') // Initialize server settings -let server: any | undefined = undefined; -let hostSetting: string = JAN_API_HOST; -let portSetting: 
number = JAN_API_PORT; -let corsEnabled: boolean = true; -let isVerbose: boolean = true; +let server: any | undefined = undefined +let hostSetting: string = JAN_API_HOST +let portSetting: number = JAN_API_PORT +let corsEnabled: boolean = true +let isVerbose: boolean = true /** * Server configurations @@ -32,80 +33,93 @@ let isVerbose: boolean = true; * @param baseDir - Base directory for the OpenAPI schema file */ export interface ServerConfig { - host?: string; - port?: number; - isCorsEnabled?: boolean; - isVerboseEnabled?: boolean; - schemaPath?: string; - baseDir?: string; + host?: string + port?: number + isCorsEnabled?: boolean + isVerboseEnabled?: boolean + schemaPath?: string + baseDir?: string + storageAdataper?: any } /** * Function to start the server * @param configs - Server configurations */ -export const startServer = async (configs?: ServerConfig) => { +export const startServer = async (configs?: ServerConfig): Promise => { + if (configs?.port && configs?.host) { + const inUse = await tcpPortUsed.check(Number(configs.port), configs.host) + if (inUse) { + const errorMessage = `Port ${configs.port} is already in use.` + logServer(errorMessage) + throw new Error(errorMessage) + } + } + // Update server settings - isVerbose = configs?.isVerboseEnabled ?? true; - hostSetting = configs?.host ?? JAN_API_HOST; - portSetting = configs?.port ?? JAN_API_PORT; - corsEnabled = configs?.isCorsEnabled ?? true; - const serverLogPath = getServerLogPath(); + isVerbose = configs?.isVerboseEnabled ?? true + hostSetting = configs?.host ?? JAN_API_HOST + portSetting = configs?.port ?? JAN_API_PORT + corsEnabled = configs?.isCorsEnabled ?? 
true + const serverLogPath = getServerLogPath() // Start the server try { // Log server start - if (isVerbose) logServer(`Debug: Starting JAN API server...`); + if (isVerbose) logServer(`Debug: Starting JAN API server...`) // Initialize Fastify server with logging server = fastify({ logger: { - level: "info", + level: 'info', file: serverLogPath, }, - }); + }) // Register CORS if enabled - if (corsEnabled) await server.register(require("@fastify/cors"), {}); + if (corsEnabled) await server.register(require('@fastify/cors'), {}) // Register Swagger for API documentation - await server.register(require("@fastify/swagger"), { - mode: "static", + await server.register(require('@fastify/swagger'), { + mode: 'static', specification: { - path: configs?.schemaPath ?? "./../docs/openapi/jan.yaml", - baseDir: configs?.baseDir ?? "./../docs/openapi", + path: configs?.schemaPath ?? './../docs/openapi/jan.yaml', + baseDir: configs?.baseDir ?? './../docs/openapi', }, - }); + }) // Register Swagger UI - await server.register(require("@fastify/swagger-ui"), { - routePrefix: "/", - baseDir: configs?.baseDir ?? join(__dirname, "../..", "./docs/openapi"), + await server.register(require('@fastify/swagger-ui'), { + routePrefix: '/', + baseDir: configs?.baseDir ?? 
join(__dirname, '../..', './docs/openapi'), uiConfig: { - docExpansion: "full", + docExpansion: 'full', deepLinking: false, }, staticCSP: false, transformSpecificationClone: true, - }); + }) // Register static file serving for extensions // TODO: Watch extension files changes and reload await server.register( (childContext: any, _: any, done: any) => { - childContext.register(require("@fastify/static"), { + childContext.register(require('@fastify/static'), { root: getJanExtensionsPath(), wildcard: false, - }); + }) - done(); + done() }, - { prefix: "extensions" } - ); + { prefix: 'extensions' } + ) + + // Register proxy middleware + if (configs?.storageAdataper) + server.addHook('preHandler', configs.storageAdataper) // Register API routes - await server.register(v1Router, { prefix: "/v1" }); - + await server.register(v1Router, { prefix: '/v1' }) // Start listening for requests await server .listen({ @@ -117,13 +131,15 @@ export const startServer = async (configs?: ServerConfig) => { if (isVerbose) logServer( `Debug: JAN API listening at: http://${hostSetting}:${portSetting}` - ); - }); + ) + }) + return true } catch (e) { // Log any errors - if (isVerbose) logServer(`Error: ${e}`); + if (isVerbose) logServer(`Error: ${e}`) } -}; + return false +} /** * Function to stop the server @@ -131,11 +147,11 @@ export const startServer = async (configs?: ServerConfig) => { export const stopServer = async () => { try { // Log server stop - if (isVerbose) logServer(`Debug: Server stopped`); + if (isVerbose) logServer(`Debug: Server stopped`) // Stop the server - await server.close(); + await server.close() } catch (e) { // Log any errors - if (isVerbose) logServer(`Error: ${e}`); + if (isVerbose) logServer(`Error: ${e}`) } -}; +} diff --git a/server/main.ts b/server/main.ts index c3eb69135..71fb11106 100644 --- a/server/main.ts +++ b/server/main.ts @@ -1,3 +1,7 @@ -import { startServer } from "./index"; - -startServer(); +import { s3 } from './middleware/s3' +import { setup } 
from './helpers/setup' +import { startServer as start } from './index' +/** + * Setup extensions and start the server + */ +setup().then(() => start({ storageAdataper: s3 })) diff --git a/server/middleware/s3.ts b/server/middleware/s3.ts new file mode 100644 index 000000000..28971a42b --- /dev/null +++ b/server/middleware/s3.ts @@ -0,0 +1,70 @@ +import { join } from 'path' + +// Middleware to intercept requests and proxy if certain conditions are met +const config = { + endpoint: process.env.AWS_ENDPOINT, + region: process.env.AWS_REGION, + credentials: { + accessKeyId: process.env.AWS_ACCESS_KEY_ID, + secretAccessKey: process.env.AWS_SECRET_ACCESS_KEY, + }, +} + +const S3_BUCKET_NAME = process.env.S3_BUCKET_NAME + +const fs = require('@cyclic.sh/s3fs')(S3_BUCKET_NAME, config) +const PROXY_PREFIX = '/v1/fs' +const PROXY_ROUTES = ['/threads', '/messages'] + +export const s3 = (req: any, reply: any, done: any) => { + // Proxy FS requests to S3 using S3FS + if (req.url.startsWith(PROXY_PREFIX)) { + const route = req.url.split('/').pop() + const args = parseRequestArgs(req) + + // Proxy matched requests to the s3fs module + if (args.length && PROXY_ROUTES.some((route) => args[0].includes(route))) { + try { + // Handle customized route + // S3FS does not handle appendFileSync + if (route === 'appendFileSync') { + let result = handAppendFileSync(args) + + reply.status(200).send(result) + return + } + // Reroute the other requests to the s3fs module + const result = fs[route](...args) + reply.status(200).send(result) + return + } catch (ex) { + console.log(ex) + } + } + } + // Let other requests go through + done() +} + +const parseRequestArgs = (req: Request) => { + const { + getJanDataFolderPath, + normalizeFilePath, + } = require('@janhq/core/node') + + return JSON.parse(req.body as any).map((arg: any) => + typeof arg === 'string' && + (arg.startsWith(`file:/`) || arg.startsWith(`file:\\`)) + ? 
join(getJanDataFolderPath(), normalizeFilePath(arg)) + : arg + ) +} + +const handAppendFileSync = (args: any[]) => { + if (fs.existsSync(args[0])) { + const data = fs.readFileSync(args[0], 'utf-8') + return fs.writeFileSync(args[0], data + args[1]) + } else { + return fs.writeFileSync(args[0], args[1]) + } +} diff --git a/server/nodemon.json b/server/nodemon.json deleted file mode 100644 index 0ea41ca96..000000000 --- a/server/nodemon.json +++ /dev/null @@ -1,5 +0,0 @@ -{ - "watch": ["main.ts", "v1"], - "ext": "ts, json", - "exec": "tsc && node ./build/main.js" -} \ No newline at end of file diff --git a/server/package.json b/server/package.json index f61730da4..d9a2bbc9a 100644 --- a/server/package.json +++ b/server/package.json @@ -18,26 +18,29 @@ }, "dependencies": { "@alumna/reflect": "^1.1.3", + "@cyclic.sh/s3fs": "^1.2.9", "@fastify/cors": "^8.4.2", "@fastify/static": "^6.12.0", "@fastify/swagger": "^8.13.0", "@fastify/swagger-ui": "2.0.1", "@janhq/core": "link:./core", + "@npmcli/arborist": "^7.3.1", "dotenv": "^16.3.1", "fastify": "^4.24.3", - "request": "^2.88.2", "fetch-retry": "^5.0.6", - "tcp-port-used": "^1.0.2", - "request-progress": "^3.0.0" + "node-fetch": "2", + "request": "^2.88.2", + "request-progress": "^3.0.0", + "tcp-port-used": "^1.0.2" }, "devDependencies": { "@types/body-parser": "^1.19.5", "@types/npmcli__arborist": "^5.6.4", + "@types/tcp-port-used": "^1.0.4", "@typescript-eslint/eslint-plugin": "^6.7.3", "@typescript-eslint/parser": "^6.7.3", "eslint-plugin-react": "^7.33.2", "run-script-os": "^1.1.6", - "@types/tcp-port-used": "^1.0.4", "typescript": "^5.2.2" } } diff --git a/server/tsconfig.json b/server/tsconfig.json index 2c4fc4a64..dd27b8932 100644 --- a/server/tsconfig.json +++ b/server/tsconfig.json @@ -20,5 +20,5 @@ // "sourceMap": true, "include": ["./**/*.ts"], - "exclude": ["core", "build", "dist", "tests", "node_modules"] + "exclude": ["core", "build", "dist", "tests", "node_modules", "extensions"] } diff --git 
a/uikit/src/input/styles.scss b/uikit/src/input/styles.scss index 9990da8b4..e649f494d 100644 --- a/uikit/src/input/styles.scss +++ b/uikit/src/input/styles.scss @@ -1,6 +1,6 @@ .input { @apply border-border placeholder:text-muted-foreground flex h-9 w-full rounded-lg border bg-transparent px-3 py-1 transition-colors; - @apply disabled:cursor-not-allowed disabled:bg-zinc-100 disabled:dark:bg-zinc-800 disabled:dark:text-zinc-600; + @apply disabled:text-muted-foreground disabled:cursor-not-allowed disabled:bg-zinc-100 disabled:dark:bg-zinc-800 disabled:dark:text-zinc-600; @apply focus-within:outline-none focus-visible:outline-0 focus-visible:ring-2 focus-visible:ring-blue-500 focus-visible:ring-offset-1; @apply file:border-0 file:bg-transparent file:font-medium; } diff --git a/uikit/src/select/styles.scss b/uikit/src/select/styles.scss index bc5b6c0cc..90485723a 100644 --- a/uikit/src/select/styles.scss +++ b/uikit/src/select/styles.scss @@ -1,6 +1,6 @@ .select { @apply placeholder:text-muted-foreground border-border flex h-9 w-full items-center justify-between whitespace-nowrap rounded-md border bg-transparent px-3 py-2 text-sm shadow-sm disabled:cursor-not-allowed [&>span]:line-clamp-1; - @apply disabled:cursor-not-allowed disabled:bg-zinc-100 disabled:dark:bg-zinc-800 disabled:dark:text-zinc-600; + @apply disabled:text-muted-foreground disabled:cursor-not-allowed disabled:bg-zinc-100 disabled:dark:bg-zinc-800 disabled:dark:text-zinc-600; @apply focus-within:outline-none focus-visible:outline-0 focus-visible:ring-2 focus-visible:ring-blue-500 focus-visible:ring-offset-1; &-caret { @@ -21,6 +21,7 @@ &-item { @apply hover:bg-secondary relative my-1 block w-full cursor-pointer select-none items-center rounded-sm px-4 py-2 text-sm data-[disabled]:pointer-events-none data-[disabled]:opacity-50; + @apply focus:outline-none focus-visible:outline-0; } &-trigger-viewport { diff --git a/uikit/types/declaration.d.ts b/uikit/types/declaration.d.ts index 85b1a7136..f8e975fa5 
100644 --- a/uikit/types/declaration.d.ts +++ b/uikit/types/declaration.d.ts @@ -1,4 +1,4 @@ declare module '*.scss' { - const content: Record; - export default content; -} \ No newline at end of file + const content: Record + export default content +} diff --git a/web/.prettierignore b/web/.prettierignore deleted file mode 100644 index 02d9145c1..000000000 --- a/web/.prettierignore +++ /dev/null @@ -1,5 +0,0 @@ -.next/ -node_modules/ -dist/ -*.hbs -*.mdx \ No newline at end of file diff --git a/web/.prettierrc b/web/.prettierrc deleted file mode 100644 index 46f1abcb0..000000000 --- a/web/.prettierrc +++ /dev/null @@ -1,8 +0,0 @@ -{ - "semi": false, - "singleQuote": true, - "quoteProps": "consistent", - "trailingComma": "es5", - "endOfLine": "auto", - "plugins": ["prettier-plugin-tailwindcss"] -} diff --git a/web/app/error.tsx b/web/app/error.tsx new file mode 100644 index 000000000..25b24b9ef --- /dev/null +++ b/web/app/error.tsx @@ -0,0 +1,89 @@ +'use client' // Error components must be Client Components + +import { useEffect, useState } from 'react' + +export default function Error({ + error, +}: { + error: Error & { digest?: string } + reset: () => void +}) { + const [showFull, setShowFull] = useState(false) + useEffect(() => { + // Log the error to an error reporting service + console.error(error) + }, [error]) + + return ( + <> +
+
+
+
+ + + + +
+
+

+ Oops! Unexpected error occurred. +

+

+ Something went wrong. Try to{' '} + {' '} + or
feel free to{' '} + + contact us + {' '} + if the problem persists. +

+
+ Error: + {error.message} +
+
+                {showFull ? error.stack : error.stack?.slice(0, 200)}
+              
+ +
+
+
+
+ + ) +} diff --git a/web/app/page.tsx b/web/app/page.tsx index 20b15a235..92d654528 100644 --- a/web/app/page.tsx +++ b/web/app/page.tsx @@ -11,7 +11,6 @@ import ExploreModelsScreen from '@/screens/ExploreModels' import LocalServerScreen from '@/screens/LocalServer' import SettingsScreen from '@/screens/Settings' -import SystemMonitorScreen from '@/screens/SystemMonitor' export default function Page() { const { mainViewState } = useMainViewState() @@ -26,10 +25,6 @@ export default function Page() { children = break - case MainViewState.SystemMonitor: - children = - break - case MainViewState.LocalServer: children = break diff --git a/web/constants/screens.ts b/web/constants/screens.ts index 6a8adc185..74b441b17 100644 --- a/web/constants/screens.ts +++ b/web/constants/screens.ts @@ -3,6 +3,5 @@ export enum MainViewState { MyModels, Settings, Thread, - SystemMonitor, LocalServer, } diff --git a/web/containers/CardSidebar/index.tsx b/web/containers/CardSidebar/index.tsx index 38a8678d9..89ff60e66 100644 --- a/web/containers/CardSidebar/index.tsx +++ b/web/containers/CardSidebar/index.tsx @@ -22,6 +22,7 @@ interface Props { rightAction?: ReactNode title: string asChild?: boolean + isShow?: boolean hideMoreVerticalAction?: boolean } export default function CardSidebar({ @@ -30,8 +31,9 @@ export default function CardSidebar({ asChild, rightAction, hideMoreVerticalAction, + isShow, }: Props) { - const [show, setShow] = useState(true) + const [show, setShow] = useState(isShow ?? false) const [more, setMore] = useState(false) const [menu, setMenu] = useState(null) const [toggle, setToggle] = useState(null) @@ -67,8 +69,8 @@ export default function CardSidebar({ show && 'rotate-180' )} /> + {title} - {title}
{rightAction && rightAction} @@ -156,7 +158,10 @@ export default function CardSidebar({ ) : ( <> - Opens {title}.json. + Opens{' '} + + {title === 'Tools' ? 'assistant' : title}.json. +  Changes affect all new threads. )} diff --git a/web/containers/DropdownListSidebar/index.tsx b/web/containers/DropdownListSidebar/index.tsx index 140a1aba1..191c7bcbe 100644 --- a/web/containers/DropdownListSidebar/index.tsx +++ b/web/containers/DropdownListSidebar/index.tsx @@ -14,7 +14,14 @@ import { import { atom, useAtom, useAtomValue, useSetAtom } from 'jotai' -import { MonitorIcon } from 'lucide-react' +import { + MonitorIcon, + LayoutGridIcon, + FoldersIcon, + GlobeIcon, + CheckIcon, + CopyIcon, +} from 'lucide-react' import { twMerge } from 'tailwind-merge' @@ -22,6 +29,7 @@ import { MainViewState } from '@/constants/screens' import { useActiveModel } from '@/hooks/useActiveModel' +import { useClipboard } from '@/hooks/useClipboard' import { useMainViewState } from '@/hooks/useMainViewState' import useRecommendedModel from '@/hooks/useRecommendedModel' @@ -42,6 +50,8 @@ import { export const selectedModelAtom = atom(undefined) +const engineOptions = ['Local', 'Remote'] + // TODO: Move all of the unscoped logics outside of the component const DropdownListSidebar = ({ strictedThread = true, @@ -51,13 +61,24 @@ const DropdownListSidebar = ({ const activeThread = useAtomValue(activeThreadAtom) const [selectedModel, setSelectedModel] = useAtom(selectedModelAtom) const setThreadModelParams = useSetAtom(setThreadModelParamsAtom) - + const [isTabActive, setIsTabActive] = useState(0) const { stateModel } = useActiveModel() const [serverEnabled, setServerEnabled] = useAtom(serverEnabledAtom) const { setMainViewState } = useMainViewState() const [loader, setLoader] = useState(0) const { recommendedModel, downloadedModels } = useRecommendedModel() const { updateModelParameter } = useUpdateModelParameters() + const clipboard = useClipboard({ timeout: 1000 }) + const [copyId, setCopyId] 
= useState('') + + const localModel = downloadedModels.filter( + (model) => model.engine === InferenceEngine.nitro + ) + const remoteModel = downloadedModels.filter( + (model) => model.engine === InferenceEngine.openai + ) + + const modelOptions = isTabActive === 0 ? localModel : remoteModel useEffect(() => { if (!activeThread) return @@ -73,7 +94,7 @@ const DropdownListSidebar = ({ // This is fake loader please fix this when we have realtime percentage when load model useEffect(() => { - if (stateModel.loading) { + if (stateModel.model === selectedModel?.id && stateModel.loading) { if (loader === 24) { setTimeout(() => { setLoader(loader + 1) @@ -94,7 +115,7 @@ const DropdownListSidebar = ({ } else { setLoader(0) } - }, [stateModel.loading, loader]) + }, [stateModel.loading, loader, selectedModel, stateModel.model]) const onValueSelected = useCallback( async (modelId: string) => { @@ -138,12 +159,16 @@ const DropdownListSidebar = ({ return null } + const selectedModelLoading = + stateModel.model === selectedModel?.id && stateModel.loading + return ( <>