diff --git a/.devcontainer/devcontainer.json b/.devcontainer/devcontainer.json index f980b9df73..db1eed38df 100644 --- a/.devcontainer/devcontainer.json +++ b/.devcontainer/devcontainer.json @@ -1,4 +1,4 @@ { - "name": "jan", - "image": "node:20" -} \ No newline at end of file + "name": "jan", + "image": "node:20" +} diff --git a/.github/workflows/clean-cloudflare-page-preview-url-and-r2.yml b/.github/workflows/clean-cloudflare-page-preview-url-and-r2.yml index 620f747144..de761ca69b 100644 --- a/.github/workflows/clean-cloudflare-page-preview-url-and-r2.yml +++ b/.github/workflows/clean-cloudflare-page-preview-url-and-r2.yml @@ -55,10 +55,10 @@ jobs: steps: - name: install-aws-cli-action uses: unfor19/install-aws-cli-action@v1 - - name: Delete object older than 7 days + - name: Delete object older than 10 days run: | # Get the list of objects in the 'latest' folder - OBJECTS=$(aws s3api list-objects --bucket ${{ secrets.CLOUDFLARE_R2_BUCKET_NAME }} --query 'Contents[?LastModified<`'$(date -d "$current_date -30 days" -u +"%Y-%m-%dT%H:%M:%SZ")'`].{Key: Key}' --endpoint-url https://${{ secrets.CLOUDFLARE_ACCOUNT_ID }}.r2.cloudflarestorage.com | jq -c .) + OBJECTS=$(aws s3api list-objects --bucket ${{ secrets.CLOUDFLARE_R2_BUCKET_NAME }} --query 'Contents[?LastModified<`'$(date -d "$current_date -10 days" -u +"%Y-%m-%dT%H:%M:%SZ")'`].{Key: Key}' --endpoint-url https://${{ secrets.CLOUDFLARE_ACCOUNT_ID }}.r2.cloudflarestorage.com | jq -c .) 
# Create a JSON file for the delete operation echo "{\"Objects\": $OBJECTS, \"Quiet\": false}" > delete.json diff --git a/.github/workflows/jan-electron-linter-and-test.yml b/.github/workflows/jan-electron-linter-and-test.yml index 6d5aaf150c..40085391f1 100644 --- a/.github/workflows/jan-electron-linter-and-test.yml +++ b/.github/workflows/jan-electron-linter-and-test.yml @@ -1,5 +1,6 @@ name: Jan Electron Linter & Test on: + workflow_dispatch: push: branches: - main diff --git a/.github/workflows/jan-server-build-nightly.yml b/.github/workflows/jan-server-build-nightly.yml new file mode 100644 index 0000000000..0d1bc3ca89 --- /dev/null +++ b/.github/workflows/jan-server-build-nightly.yml @@ -0,0 +1,40 @@ +name: Jan Build Docker Nightly or Manual + +on: + push: + branches: + - main + - feature/helmchart-and-ci-jan-server + paths-ignore: + - 'README.md' + - 'docs/**' + schedule: + - cron: '0 20 * * 1,2,3' # At 8 PM UTC on Monday, Tuesday, and Wednesday which is 3 AM UTC+7 Tuesday, Wednesday, and Thursday + workflow_dispatch: + +jobs: + # Job create Update app version based on latest release tag with build number and save to output + get-update-version: + uses: ./.github/workflows/template-get-update-version.yml + + build-cpu: + uses: ./.github/workflows/template-build-jan-server.yml + permissions: + packages: write + secrets: inherit + needs: [get-update-version] + with: + dockerfile_path: ./Dockerfile + docker_image_tag: "ghcr.io/janhq/jan-server:dev-cpu-latest,ghcr.io/janhq/jan-server:dev-cpu-${{ needs.get-update-version.outputs.new_version }}" + + build-gpu: + uses: ./.github/workflows/template-build-jan-server.yml + permissions: + packages: write + secrets: inherit + needs: [get-update-version] + with: + dockerfile_path: ./Dockerfile.gpu + docker_image_tag: "ghcr.io/janhq/jan-server:dev-cuda-12.2-latest,ghcr.io/janhq/jan-server:dev-cuda-12.2-${{ needs.get-update-version.outputs.new_version }}" + + diff --git a/.github/workflows/jan-server-build.yml 
b/.github/workflows/jan-server-build.yml new file mode 100644 index 0000000000..0665838d67 --- /dev/null +++ b/.github/workflows/jan-server-build.yml @@ -0,0 +1,30 @@ +name: Jan Build Docker + +on: + push: + tags: ["v[0-9]+.[0-9]+.[0-9]+"] + +jobs: + # Job create Update app version based on latest release tag with build number and save to output + get-update-version: + uses: ./.github/workflows/template-get-update-version.yml + + build-cpu: + permissions: + packages: write + uses: ./.github/workflows/template-build-jan-server.yml + secrets: inherit + needs: [get-update-version] + with: + dockerfile_path: ./Dockerfile + docker_image_tag: "ghcr.io/janhq/jan-server:cpu-latest,ghcr.io/janhq/jan-server:cpu-${{ needs.get-update-version.outputs.new_version }}" + + build-gpu: + permissions: + packages: write + uses: ./.github/workflows/template-build-jan-server.yml + secrets: inherit + needs: [get-update-version] + with: + dockerfile_path: ./Dockerfile.gpu + docker_image_tag: "ghcr.io/janhq/jan-server:cuda-12.2-latest,ghcr.io/janhq/jan-server:cuda-12.2-${{ needs.get-update-version.outputs.new_version }}" diff --git a/.github/workflows/template-build-jan-server.yml b/.github/workflows/template-build-jan-server.yml new file mode 100644 index 0000000000..9bb772605e --- /dev/null +++ b/.github/workflows/template-build-jan-server.yml @@ -0,0 +1,39 @@ +name: build-jan-server +on: + workflow_call: + inputs: + dockerfile_path: + required: false + type: string + default: './Dockerfile' + docker_image_tag: + required: true + type: string + default: 'ghcr.io/janhq/jan-server:dev-latest' + +jobs: + build: + runs-on: ubuntu-latest + env: + REGISTRY: ghcr.io + IMAGE_NAME: janhq/jan-server + permissions: + packages: write + steps: + - name: Checkout + uses: actions/checkout@v4 + + - name: Log in to the Container registry + uses: docker/login-action@v3 + with: + registry: ${{ env.REGISTRY }} + username: ${{ github.actor }} + password: ${{ secrets.GITHUB_TOKEN }} + + - name: Build and push 
Docker image + uses: docker/build-push-action@v3 + with: + context: . + file: ${{ inputs.dockerfile_path }} + push: true + tags: ${{ inputs.docker_image_tag }} \ No newline at end of file diff --git a/.gitignore b/.gitignore index 4540e5c7ab..62878011e5 100644 --- a/.gitignore +++ b/.gitignore @@ -5,6 +5,7 @@ error.log node_modules *.tgz +!charts/server/charts/*.tgz yarn.lock dist build @@ -28,4 +29,5 @@ extensions/inference-nitro-extension/bin/*/*.exp extensions/inference-nitro-extension/bin/*/*.lib extensions/inference-nitro-extension/bin/saved-* extensions/inference-nitro-extension/bin/*.tar.gz - +extensions/inference-nitro-extension/bin/vulkaninfoSDK.exe +extensions/inference-nitro-extension/bin/vulkaninfo diff --git a/core/.prettierignore b/.prettierignore similarity index 100% rename from core/.prettierignore rename to .prettierignore diff --git a/core/.prettierrc b/.prettierrc similarity index 100% rename from core/.prettierrc rename to .prettierrc diff --git a/Dockerfile b/Dockerfile index 949a92673f..48b2d254fb 100644 --- a/Dockerfile +++ b/Dockerfile @@ -1,39 +1,61 @@ -FROM node:20-bullseye AS base +FROM node:20-bookworm AS base # 1. Install dependencies only when needed -FROM base AS deps +FROM base AS builder + +# Install g++ 11 +RUN apt update && apt install -y gcc-11 g++-11 cpp-11 jq xsel && rm -rf /var/lib/apt/lists/* + WORKDIR /app # Install dependencies based on the preferred package manager -COPY package.json yarn.lock* package-lock.json* pnpm-lock.yaml* ./ -RUN yarn install +COPY . ./ -# # 2. Rebuild the source code only when needed -FROM base AS builder -WORKDIR /app -COPY --from=deps /app/node_modules ./node_modules -COPY . . -# This will do the trick, use the corresponding env file for each environment. 
-RUN yarn workspace server install -RUN yarn server:prod +RUN export NITRO_VERSION=$(cat extensions/inference-nitro-extension/bin/version.txt) && \ + jq --arg nitroVersion $NITRO_VERSION '(.scripts."downloadnitro:linux" | gsub("\\${NITRO_VERSION}"; $nitroVersion)) | gsub("\r"; "")' extensions/inference-nitro-extension/package.json > /tmp/newcommand.txt && export NEW_COMMAND=$(sed 's/^"//;s/"$//' /tmp/newcommand.txt) && jq --arg newCommand "$NEW_COMMAND" '.scripts."downloadnitro:linux" = $newCommand' extensions/inference-nitro-extension/package.json > /tmp/package.json && mv /tmp/package.json extensions/inference-nitro-extension/package.json +RUN make install-and-build -# 3. Production image, copy all the files and run next +# # 2. Rebuild the source code only when needed FROM base AS runner + +# Install g++ 11 +RUN apt update && apt install -y gcc-11 g++-11 cpp-11 jq xsel && rm -rf /var/lib/apt/lists/* + WORKDIR /app -ENV NODE_ENV=production +# Copy the package.json and yarn.lock of root yarn space to leverage Docker cache +COPY --from=builder /app/package.json ./package.json +COPY --from=builder /app/node_modules ./node_modules/ +COPY --from=builder /app/yarn.lock ./yarn.lock + +# Copy the package.json, yarn.lock, and build output of server yarn space to leverage Docker cache +COPY --from=builder /app/core ./core/ +COPY --from=builder /app/server ./server/ +RUN cd core && yarn install && yarn run build +RUN yarn workspace @janhq/server install && yarn workspace @janhq/server build +COPY --from=builder /app/docs/openapi ./docs/openapi/ + +# Copy pre-install dependencies +COPY --from=builder /app/pre-install ./pre-install/ + +# Copy the package.json, yarn.lock, and output of web yarn space to leverage Docker cache +COPY --from=builder /app/uikit ./uikit/ +COPY --from=builder /app/web ./web/ +COPY --from=builder /app/models ./models/ + +RUN yarn workspace @janhq/uikit install && yarn workspace @janhq/uikit build +RUN yarn workspace jan-web install + +RUN npm install 
-g serve@latest -# RUN addgroup -g 1001 -S nodejs; -COPY --from=builder /app/server/build ./ +EXPOSE 1337 3000 3928 -# Automatically leverage output traces to reduce image size -# https://nextjs.org/docs/advanced-features/output-file-tracing -COPY --from=builder /app/server/node_modules ./node_modules -COPY --from=builder /app/server/package.json ./package.json +ENV JAN_API_HOST 0.0.0.0 +ENV JAN_API_PORT 1337 -EXPOSE 4000 3928 +ENV API_BASE_URL http://localhost:1337 -ENV PORT 4000 -ENV APPDATA /app/data +CMD ["sh", "-c", "export NODE_ENV=production && yarn workspace jan-web build && cd web && npx serve out & cd server && node build/main.js"] -CMD ["node", "main.js"] \ No newline at end of file +# docker build -t jan . +# docker run -p 1337:1337 -p 3000:3000 -p 3928:3928 jan diff --git a/Dockerfile.gpu b/Dockerfile.gpu new file mode 100644 index 0000000000..832e2c18c5 --- /dev/null +++ b/Dockerfile.gpu @@ -0,0 +1,88 @@ +# Please change the base image to the appropriate CUDA version base on NVIDIA Driver Compatibility +# Run nvidia-smi to check the CUDA version and the corresponding driver version +# Then update the base image to the appropriate CUDA version refer https://catalog.ngc.nvidia.com/orgs/nvidia/containers/cuda/tags + +FROM nvidia/cuda:12.2.0-runtime-ubuntu22.04 AS base + +# 1. 
Install dependencies only when needed +FROM base AS builder + +# Install g++ 11 +RUN apt update && apt install -y gcc-11 g++-11 cpp-11 jq xsel curl gnupg make python3-dev && curl -sL https://deb.nodesource.com/setup_20.x | bash - && apt install nodejs -y && rm -rf /var/lib/apt/lists/* + +# Update alternatives for GCC and related tools +RUN update-alternatives --install /usr/bin/gcc gcc /usr/bin/gcc-11 110 \ + --slave /usr/bin/g++ g++ /usr/bin/g++-11 \ + --slave /usr/bin/gcov gcov /usr/bin/gcov-11 \ + --slave /usr/bin/gcc-ar gcc-ar /usr/bin/gcc-ar-11 \ + --slave /usr/bin/gcc-ranlib gcc-ranlib /usr/bin/gcc-ranlib-11 && \ + update-alternatives --install /usr/bin/cpp cpp /usr/bin/cpp-11 110 + +RUN npm install -g yarn + +WORKDIR /app + +# Install dependencies based on the preferred package manager +COPY . ./ + +RUN export NITRO_VERSION=$(cat extensions/inference-nitro-extension/bin/version.txt) && \ + jq --arg nitroVersion $NITRO_VERSION '(.scripts."downloadnitro:linux" | gsub("\\${NITRO_VERSION}"; $nitroVersion)) | gsub("\r"; "")' extensions/inference-nitro-extension/package.json > /tmp/newcommand.txt && export NEW_COMMAND=$(sed 's/^"//;s/"$//' /tmp/newcommand.txt) && jq --arg newCommand "$NEW_COMMAND" '.scripts."downloadnitro:linux" = $newCommand' extensions/inference-nitro-extension/package.json > /tmp/package.json && mv /tmp/package.json extensions/inference-nitro-extension/package.json +RUN make install-and-build + +# # 2. 
Rebuild the source code only when needed +FROM base AS runner + +# Install g++ 11 +RUN apt update && apt install -y gcc-11 g++-11 cpp-11 jq xsel curl gnupg make python3-dev && curl -sL https://deb.nodesource.com/setup_20.x | bash - && apt-get install nodejs -y && rm -rf /var/lib/apt/lists/* + +# Update alternatives for GCC and related tools +RUN update-alternatives --install /usr/bin/gcc gcc /usr/bin/gcc-11 110 \ + --slave /usr/bin/g++ g++ /usr/bin/g++-11 \ + --slave /usr/bin/gcov gcov /usr/bin/gcov-11 \ + --slave /usr/bin/gcc-ar gcc-ar /usr/bin/gcc-ar-11 \ + --slave /usr/bin/gcc-ranlib gcc-ranlib /usr/bin/gcc-ranlib-11 && \ + update-alternatives --install /usr/bin/cpp cpp /usr/bin/cpp-11 110 + +RUN npm install -g yarn + +WORKDIR /app + +# Copy the package.json and yarn.lock of root yarn space to leverage Docker cache +COPY --from=builder /app/package.json ./package.json +COPY --from=builder /app/node_modules ./node_modules/ +COPY --from=builder /app/yarn.lock ./yarn.lock + +# Copy the package.json, yarn.lock, and build output of server yarn space to leverage Docker cache +COPY --from=builder /app/core ./core/ +COPY --from=builder /app/server ./server/ +RUN cd core && yarn install && yarn run build +RUN yarn workspace @janhq/server install && yarn workspace @janhq/server build +COPY --from=builder /app/docs/openapi ./docs/openapi/ + +# Copy pre-install dependencies +COPY --from=builder /app/pre-install ./pre-install/ + +# Copy the package.json, yarn.lock, and output of web yarn space to leverage Docker cache +COPY --from=builder /app/uikit ./uikit/ +COPY --from=builder /app/web ./web/ +COPY --from=builder /app/models ./models/ + +RUN yarn workspace @janhq/uikit install && yarn workspace @janhq/uikit build +RUN yarn workspace jan-web install + +RUN npm install -g serve@latest + +EXPOSE 1337 3000 3928 + +ENV LD_LIBRARY_PATH=/usr/local/cuda/targets/x86_64-linux/lib:/usr/local/cuda-12.0/compat${LD_LIBRARY_PATH:+:${LD_LIBRARY_PATH}} + +ENV JAN_API_HOST 0.0.0.0 +ENV 
JAN_API_PORT 1337 + +ENV API_BASE_URL http://localhost:1337 + +CMD ["sh", "-c", "export NODE_ENV=production && yarn workspace jan-web build && cd web && npx serve out & cd server && node build/main.js"] + +# pre-requisites: nvidia-docker +# docker build -t jan-gpu . -f Dockerfile.gpu +# docker run -p 1337:1337 -p 3000:3000 -p 3928:3928 --gpus all jan-gpu diff --git a/Makefile b/Makefile index 905a68321d..a45477b294 100644 --- a/Makefile +++ b/Makefile @@ -24,9 +24,9 @@ endif check-file-counts: install-and-build ifeq ($(OS),Windows_NT) - powershell -Command "if ((Get-ChildItem -Path electron/pre-install -Filter *.tgz | Measure-Object | Select-Object -ExpandProperty Count) -ne (Get-ChildItem -Path extensions -Directory | Measure-Object | Select-Object -ExpandProperty Count)) { Write-Host 'Number of .tgz files in electron/pre-install does not match the number of subdirectories in extension'; exit 1 } else { Write-Host 'Extension build successful' }" + powershell -Command "if ((Get-ChildItem -Path pre-install -Filter *.tgz | Measure-Object | Select-Object -ExpandProperty Count) -ne (Get-ChildItem -Path extensions -Directory | Measure-Object | Select-Object -ExpandProperty Count)) { Write-Host 'Number of .tgz files in pre-install does not match the number of subdirectories in extension'; exit 1 } else { Write-Host 'Extension build successful' }" else - @tgz_count=$$(find electron/pre-install -type f -name "*.tgz" | wc -l); dir_count=$$(find extensions -mindepth 1 -maxdepth 1 -type d | wc -l); if [ $$tgz_count -ne $$dir_count ]; then echo "Number of .tgz files in electron/pre-install ($$tgz_count) does not match the number of subdirectories in extension ($$dir_count)"; exit 1; else echo "Extension build successful"; fi + @tgz_count=$$(find pre-install -type f -name "*.tgz" | wc -l); dir_count=$$(find extensions -mindepth 1 -maxdepth 1 -type d | wc -l); if [ $$tgz_count -ne $$dir_count ]; then echo "Number of .tgz files in pre-install ($$tgz_count) does not match the 
number of subdirectories in extension ($$dir_count)"; exit 1; else echo "Extension build successful"; fi endif dev: check-file-counts @@ -52,18 +52,28 @@ build: check-file-counts clean: ifeq ($(OS),Windows_NT) - powershell -Command "Get-ChildItem -Path . -Include node_modules, .next, dist -Recurse -Directory | Remove-Item -Recurse -Force" + powershell -Command "Get-ChildItem -Path . -Include node_modules, .next, dist, build, out -Recurse -Directory | Remove-Item -Recurse -Force" + powershell -Command "Remove-Item -Recurse -Force ./pre-install/*.tgz" + powershell -Command "Remove-Item -Recurse -Force ./electron/pre-install/*.tgz" rmdir /s /q "%USERPROFILE%\jan\extensions" else ifeq ($(shell uname -s),Linux) find . -name "node_modules" -type d -prune -exec rm -rf '{}' + find . -name ".next" -type d -exec rm -rf '{}' + find . -name "dist" -type d -exec rm -rf '{}' + + find . -name "build" -type d -exec rm -rf '{}' + + find . -name "out" -type d -exec rm -rf '{}' + + rm -rf ./pre-install/*.tgz + rm -rf ./electron/pre-install/*.tgz rm -rf "~/jan/extensions" rm -rf "~/.cache/jan*" else find . -name "node_modules" -type d -prune -exec rm -rf '{}' + find . -name ".next" -type d -exec rm -rf '{}' + find . -name "dist" -type d -exec rm -rf '{}' + + find . -name "build" -type d -exec rm -rf '{}' + + find . 
-name "out" -type d -exec rm -rf '{}' + + rm -rf ./pre-install/*.tgz + rm -rf ./electron/pre-install/*.tgz rm -rf ~/jan/extensions rm -rf ~/Library/Caches/jan* endif diff --git a/README.md b/README.md index 34eecc9f35..715625080b 100644 --- a/README.md +++ b/README.md @@ -43,31 +43,31 @@ Jan is an open-source ChatGPT alternative that runs 100% offline on your compute Stable (Recommended) - + jan.exe - + Intel - + M1/M2 - + jan.deb - + jan.AppImage @@ -76,31 +76,31 @@ Jan is an open-source ChatGPT alternative that runs 100% offline on your compute Experimental (Nightly Build) - + jan.exe - + Intel - + M1/M2 - + jan.deb - + jan.AppImage @@ -167,6 +167,7 @@ To reset your installation: - Clear Application cache in `~/Library/Caches/jan` ## Requirements for running Jan + - MacOS: 13 or higher - Windows: - Windows 10 or higher @@ -194,17 +195,17 @@ Contributions are welcome! Please read the [CONTRIBUTING.md](CONTRIBUTING.md) fi 1. **Clone the repository and prepare:** - ```bash - git clone https://github.com/janhq/jan - cd jan - git checkout -b DESIRED_BRANCH - ``` + ```bash + git clone https://github.com/janhq/jan + cd jan + git checkout -b DESIRED_BRANCH + ``` 2. **Run development and use Jan Desktop** - ```bash - make dev - ``` + ```bash + make dev + ``` This will start the development server and open the desktop app. @@ -218,6 +219,101 @@ make build This will build the app MacOS m1/m2 for production (with code signing already done) and put the result in `dist` folder. +### Docker mode + +- Supported OS: Linux, WSL2 Docker +- Pre-requisites: + + - Docker Engine and Docker Compose are required to run Jan in Docker mode. Follow the [instructions](https://docs.docker.com/engine/install/ubuntu/) below to get started with Docker Engine on Ubuntu. + + ```bash + curl -fsSL https://get.docker.com -o get-docker.sh + sudo sh ./get-docker.sh --dry-run + ``` + + - If you intend to run Jan in GPU mode, you need to install `nvidia-driver` and `nvidia-docker2`. 
Follow the instruction [here](https://docs.nvidia.com/datacenter/cloud-native/container-toolkit/latest/install-guide.html) for installation. + +- Run Jan in Docker mode + +| Docker compose Profile | Description | +| ---------------------- | -------------------------------------------- | +| `cpu-fs` | Run Jan in CPU mode with default file system | +| `cpu-s3fs` | Run Jan in CPU mode with S3 file system | +| `gpu-fs` | Run Jan in GPU mode with default file system | +| `gpu-s3fs` | Run Jan in GPU mode with S3 file system | + +| Environment Variable | Description | +| ----------------------- | ------------------------------------------------------------------------------------------------------- | +| `S3_BUCKET_NAME` | S3 bucket name - leave blank for default file system | +| `AWS_ACCESS_KEY_ID` | AWS access key ID - leave blank for default file system | +| `AWS_SECRET_ACCESS_KEY` | AWS secret access key - leave blank for default file system | +| `AWS_ENDPOINT` | AWS endpoint URL - leave blank for default file system | +| `AWS_REGION` | AWS region - leave blank for default file system | +| `API_BASE_URL` | Jan Server URL, please modify it as your public ip address or domain name default http://localhost:1377 | + +- **Option 1**: Run Jan in CPU mode + + ```bash + # cpu mode with default file system + docker compose --profile cpu-fs up -d + + # cpu mode with S3 file system + docker compose --profile cpu-s3fs up -d + ``` + +- **Option 2**: Run Jan in GPU mode + + - **Step 1**: Check CUDA compatibility with your NVIDIA driver by running `nvidia-smi` and check the CUDA version in the output + + ```bash + nvidia-smi + + # Output + +---------------------------------------------------------------------------------------+ + | NVIDIA-SMI 531.18 Driver Version: 531.18 CUDA Version: 12.1 | + |-----------------------------------------+----------------------+----------------------+ + | GPU Name TCC/WDDM | Bus-Id Disp.A | Volatile Uncorr. 
ECC | + | Fan Temp Perf Pwr:Usage/Cap| Memory-Usage | GPU-Util Compute M. | + | | | MIG M. | + |=========================================+======================+======================| + | 0 NVIDIA GeForce RTX 4070 Ti WDDM | 00000000:01:00.0 On | N/A | + | 0% 44C P8 16W / 285W| 1481MiB / 12282MiB | 2% Default | + | | | N/A | + +-----------------------------------------+----------------------+----------------------+ + | 1 NVIDIA GeForce GTX 1660 Ti WDDM | 00000000:02:00.0 Off | N/A | + | 0% 49C P8 14W / 120W| 0MiB / 6144MiB | 0% Default | + | | | N/A | + +-----------------------------------------+----------------------+----------------------+ + | 2 NVIDIA GeForce GTX 1660 Ti WDDM | 00000000:05:00.0 Off | N/A | + | 29% 38C P8 11W / 120W| 0MiB / 6144MiB | 0% Default | + | | | N/A | + +-----------------------------------------+----------------------+----------------------+ + + +---------------------------------------------------------------------------------------+ + | Processes: | + | GPU GI CI PID Type Process name GPU Memory | + | ID ID Usage | + |=======================================================================================| + ``` + + - **Step 2**: Visit [NVIDIA NGC Catalog ](https://catalog.ngc.nvidia.com/orgs/nvidia/containers/cuda/tags) and find the smallest minor version of image tag that matches your CUDA version (e.g., 12.1 -> 12.1.0) + + - **Step 3**: Update the `Dockerfile.gpu` line number 5 with the latest minor version of the image tag from step 2 (e.g. change `FROM nvidia/cuda:12.2.0-runtime-ubuntu22.04 AS base` to `FROM nvidia/cuda:12.1.0-runtime-ubuntu22.04 AS base`) + + - **Step 4**: Run command to start Jan in GPU mode + + ```bash + # GPU mode with default file system + docker compose --profile gpu up -d + + # GPU mode with S3 file system + docker compose --profile gpu-s3fs up -d + ``` + +This will start the web server and you can access Jan at `http://localhost:3000`. + +> Note: RAG feature is not supported in Docker mode with s3fs yet. 
+ ## Acknowledgements Jan builds on top of other open-source projects: diff --git a/charts/server/Chart.lock b/charts/server/Chart.lock new file mode 100644 index 0000000000..915788d617 --- /dev/null +++ b/charts/server/Chart.lock @@ -0,0 +1,6 @@ +dependencies: +- name: common + repository: oci://ghcr.io/janhq/charts + version: 0.1.2 +digest: sha256:35e98bde174130787755b0f8ea2359b7b6790d965a7157c2f7cabf1bc8c04471 +generated: "2024-02-20T16:20:37.6530108+07:00" diff --git a/charts/server/Chart.yaml b/charts/server/Chart.yaml new file mode 100644 index 0000000000..fb2e1c91bd --- /dev/null +++ b/charts/server/Chart.yaml @@ -0,0 +1,10 @@ +apiVersion: v2 +name: jan-server +description: A Helm chart for Kubernetes +type: application +version: 0.1.0 +appVersion: '1.0.0' +dependencies: + - name: common + version: 0.1.2 # common-chart-version + repository: oci://ghcr.io/janhq/charts diff --git a/charts/server/charts/common-0.1.2.tgz b/charts/server/charts/common-0.1.2.tgz new file mode 100644 index 0000000000..946617eabb Binary files /dev/null and b/charts/server/charts/common-0.1.2.tgz differ diff --git a/charts/server/config.json b/charts/server/config.json new file mode 100644 index 0000000000..62e9682fa6 --- /dev/null +++ b/charts/server/config.json @@ -0,0 +1,4 @@ +{ + "image-list": "server=ghcr.io/janhq/jan-server", + "platforms": "linux/amd64" +} \ No newline at end of file diff --git a/charts/server/values.yaml b/charts/server/values.yaml new file mode 100644 index 0000000000..70f4631746 --- /dev/null +++ b/charts/server/values.yaml @@ -0,0 +1,256 @@ +common: + imageTag: v0.4.6-cpu + # DO NOT CHANGE THE LINE ABOVE. 
MAKE ALL CHANGES BELOW + + # Global pvc for all workload + pvc: + enabled: false + name: 'janroot' + accessModes: 'ReadWriteOnce' + storageClassName: '' + capacity: '50Gi' + + # Global image pull secret + imagePullSecrets: [] + + externalSecret: + create: false + name: '' + annotations: {} + + nameOverride: 'jan-server' + fullnameOverride: 'jan-server' + + serviceAccount: + create: true + annotations: {} + name: 'jan-server-service-account' + + podDisruptionBudget: + create: false + minAvailable: 1 + + workloads: + - name: server + image: + repository: ghcr.io/janhq/jan-server + pullPolicy: Always + + command: ['/bin/sh', '-c'] + args: ['cd server && node build/main.js'] + + replicaCount: 1 + ports: + containerPort: 1337 + + strategy: + canary: + steps: + - setWeight: 50 + - pause: { duration: 1m } + + ingress: + enabled: true + className: 'nginx' + annotations: + nginx.ingress.kubernetes.io/proxy-body-size: '100m' + nginx.ingress.kubernetes.io/proxy-read-timeout: '1800' + nginx.ingress.kubernetes.io/proxy-send-timeout: '1800' + # cert-manager.io/cluster-issuer: 'jan-ai-dns01-cluster-issuer' + # nginx.ingress.kubernetes.io/force-ssl-redirect: 'true' + nginx.ingress.kubernetes.io/backend-protocol: HTTP + hosts: + - host: server.local + paths: + - path: / + pathType: Prefix + tls: + [] + # - hosts: + # - server-dev.jan.ai + # secretName: jan-server-prod-tls-v2 + + instrumentation: + enabled: false + podAnnotations: {} + + podSecurityContext: {} + + securityContext: {} + + service: + extenalLabel: {} + type: ClusterIP + port: 1337 + targetPort: 1337 + + # If you want to use GPU, please uncomment the following lines and change imageTag to the one with GPU support + resources: + # limits: + # nvidia.com/gpu: 1 + requests: + cpu: 2000m + memory: 8192M + + # If you want to use pv, please uncomment the following lines and enable pvc.enabled + volumes: + [] + # - name: janroot + # persistentVolumeClaim: + # claimName: janroot + + volumeMounts: + [] + # - name: janroot + # 
mountPath: /app/server/build/jan + + # AWS_ACCESS_KEY_ID, AWS_SECRET_ACCESS_KEY, S3_BUCKET_NAME, AWS_ENDPOINT, AWS_REGION should mount as a secret env instead of plain text here + # Change API_BASE_URL to your server's public domain + env: + - name: API_BASE_URL + value: 'http://server.local' + + lifecycle: {} + autoscaling: + enabled: false + minReplicas: 2 + maxReplicas: 3 + targetCPUUtilizationPercentage: 95 + targetMemoryUtilizationPercentage: 95 + + kedaScaling: + enabled: false # ignore if autoscaling.enable = true + cooldownPeriod: 30 + pollingInterval: 2 + minReplicas: 1 + maxReplicas: 5 + metricName: celery_queue_length + query: celery_queue_length{queue_name="myqueue"} # change queue_name here + serverAddress: http://prometheus-prod-kube-prome-prometheus.monitoring.svc:9090 + threshold: '3' + + nodeSelector: {} + + tolerations: [] + + podSecurityGroup: + enabled: false + securitygroupid: [] + + # Reloader Option + reloader: 'false' + vpa: + enabled: false + + - name: web + image: + repository: ghcr.io/janhq/jan-server + pullPolicy: Always + + command: ['/bin/sh', '-c'] + args: + [ + 'export NODE_ENV=production && yarn workspace jan-web build && cd web && npx serve out', + ] + + replicaCount: 1 + ports: + containerPort: 3000 + + strategy: + canary: + steps: + - setWeight: 50 + - pause: { duration: 1m } + + ingress: + enabled: true + className: 'nginx' + annotations: + nginx.ingress.kubernetes.io/proxy-body-size: '100m' + nginx.ingress.kubernetes.io/proxy-read-timeout: '1800' + nginx.ingress.kubernetes.io/proxy-send-timeout: '1800' + # cert-manager.io/cluster-issuer: 'jan-ai-dns01-cluster-issuer' + # nginx.ingress.kubernetes.io/force-ssl-redirect: 'true' + nginx.ingress.kubernetes.io/backend-protocol: HTTP + hosts: + - host: web.local + paths: + - path: / + pathType: Prefix + tls: + [] + # - hosts: + # - server-dev.jan.ai + # secretName: jan-server-prod-tls-v2 + + instrumentation: + enabled: false + podAnnotations: {} + + podSecurityContext: {} + + 
securityContext: {} + + service: + extenalLabel: {} + type: ClusterIP + port: 3000 + targetPort: 3000 + + resources: + limits: + cpu: 1000m + memory: 2048M + requests: + cpu: 50m + memory: 500M + + volumes: + [] + # - name: janroot + # persistentVolumeClaim: + # claimName: janroot + + volumeMounts: + [] + # - name: janroot + # mountPath: /app/server/build/jan + + # AWS_ACCESS_KEY_ID, AWS_SECRET_ACCESS_KEY, S3_BUCKET_NAME, AWS_ENDPOINT, AWS_REGION should mount as a secret env instead of plain text here + # Change API_BASE_URL to your server's public domain + env: + - name: API_BASE_URL + value: 'http://server.local' + + lifecycle: {} + autoscaling: + enabled: true + minReplicas: 1 + maxReplicas: 3 + targetCPUUtilizationPercentage: 95 + targetMemoryUtilizationPercentage: 95 + + kedaScaling: + enabled: false # ignore if autoscaling.enable = true + cooldownPeriod: 30 + pollingInterval: 2 + minReplicas: 1 + maxReplicas: 5 + metricName: celery_queue_length + query: celery_queue_length{queue_name="myqueue"} # change queue_name here + serverAddress: http://prometheus-prod-kube-prome-prometheus.monitoring.svc:9090 + threshold: '3' + + nodeSelector: {} + + tolerations: [] + + podSecurityGroup: + enabled: false + securitygroupid: [] + + # Reloader Option + reloader: 'false' + vpa: + enabled: false diff --git a/core/jest.config.js b/core/jest.config.js index fb03768fec..c18f550916 100644 --- a/core/jest.config.js +++ b/core/jest.config.js @@ -4,4 +4,4 @@ module.exports = { moduleNameMapper: { '@/(.*)': '/src/$1', }, -} \ No newline at end of file +} diff --git a/core/package.json b/core/package.json index 437e6d0a61..c3abe2d568 100644 --- a/core/package.json +++ b/core/package.json @@ -57,6 +57,7 @@ "rollup-plugin-typescript2": "^0.36.0", "ts-jest": "^26.1.1", "tslib": "^2.6.2", - "typescript": "^5.2.2" + "typescript": "^5.2.2", + "rimraf": "^3.0.2" } } diff --git a/core/rollup.config.ts b/core/rollup.config.ts index d78130a4de..ebea8e2377 100644 --- a/core/rollup.config.ts 
+++ b/core/rollup.config.ts @@ -54,7 +54,8 @@ export default [ 'url', 'http', 'os', - 'util' + 'util', + 'child_process', ], watch: { include: 'src/node/**', diff --git a/core/src/api/index.ts b/core/src/api/index.ts index 0d7cc51f75..6760207580 100644 --- a/core/src/api/index.ts +++ b/core/src/api/index.ts @@ -1,15 +1,22 @@ /** - * App Route APIs + * Native Route APIs * @description Enum of all the routes exposed by the app */ -export enum AppRoute { +export enum NativeRoute { openExternalUrl = 'openExternalUrl', openAppDirectory = 'openAppDirectory', openFileExplore = 'openFileExplorer', selectDirectory = 'selectDirectory', + relaunch = 'relaunch', +} + +/** + * App Route APIs + * @description Enum of all the routes exposed by the app + */ +export enum AppRoute { getAppConfigurations = 'getAppConfigurations', updateAppConfiguration = 'updateAppConfiguration', - relaunch = 'relaunch', joinPath = 'joinPath', isSubdirectory = 'isSubdirectory', baseName = 'baseName', @@ -30,6 +37,7 @@ export enum DownloadRoute { downloadFile = 'downloadFile', pauseDownload = 'pauseDownload', resumeDownload = 'resumeDownload', + getDownloadProgress = 'getDownloadProgress', } export enum DownloadEvent { @@ -68,6 +76,10 @@ export enum FileManagerRoute { export type ApiFunction = (...args: any[]) => any +export type NativeRouteFunctions = { + [K in NativeRoute]: ApiFunction +} + export type AppRouteFunctions = { [K in AppRoute]: ApiFunction } @@ -96,7 +108,8 @@ export type FileManagerRouteFunctions = { [K in FileManagerRoute]: ApiFunction } -export type APIFunctions = AppRouteFunctions & +export type APIFunctions = NativeRouteFunctions & + AppRouteFunctions & AppEventFunctions & DownloadRouteFunctions & DownloadEventFunctions & @@ -104,11 +117,13 @@ export type APIFunctions = AppRouteFunctions & FileSystemRouteFunctions & FileManagerRoute -export const APIRoutes = [ +export const CoreRoutes = [ ...Object.values(AppRoute), ...Object.values(DownloadRoute), ...Object.values(ExtensionRoute), 
...Object.values(FileSystemRoute), ...Object.values(FileManagerRoute), ] + +export const APIRoutes = [...CoreRoutes, ...Object.values(NativeRoute)] export const APIEvents = [...Object.values(AppEvent), ...Object.values(DownloadEvent)] diff --git a/core/src/extension.ts b/core/src/extension.ts index 0b7f9b7fc1..3528f581cc 100644 --- a/core/src/extension.ts +++ b/core/src/extension.ts @@ -1,13 +1,13 @@ export enum ExtensionTypeEnum { - Assistant = "assistant", - Conversational = "conversational", - Inference = "inference", - Model = "model", - SystemMonitoring = "systemMonitoring", + Assistant = 'assistant', + Conversational = 'conversational', + Inference = 'inference', + Model = 'model', + SystemMonitoring = 'systemMonitoring', } export interface ExtensionType { - type(): ExtensionTypeEnum | undefined; + type(): ExtensionTypeEnum | undefined } /** * Represents a base extension. @@ -20,16 +20,16 @@ export abstract class BaseExtension implements ExtensionType { * Undefined means its not extending any known extension by the application. */ type(): ExtensionTypeEnum | undefined { - return undefined; + return undefined } /** * Called when the extension is loaded. * Any initialization logic for the extension should be put here. */ - abstract onLoad(): void; + abstract onLoad(): void /** * Called when the extension is unloaded. * Any cleanup logic for the extension should be put here. */ - abstract onUnload(): void; + abstract onUnload(): void } diff --git a/core/src/extensions/assistant.ts b/core/src/extensions/assistant.ts index ba345711ae..5c3114f41b 100644 --- a/core/src/extensions/assistant.ts +++ b/core/src/extensions/assistant.ts @@ -1,5 +1,5 @@ -import { Assistant, AssistantInterface } from "../index"; -import { BaseExtension, ExtensionTypeEnum } from "../extension"; +import { Assistant, AssistantInterface } from '../index' +import { BaseExtension, ExtensionTypeEnum } from '../extension' /** * Assistant extension for managing assistants. 
@@ -10,10 +10,10 @@ export abstract class AssistantExtension extends BaseExtension implements Assist * Assistant extension type. */ type(): ExtensionTypeEnum | undefined { - return ExtensionTypeEnum.Assistant; + return ExtensionTypeEnum.Assistant } - abstract createAssistant(assistant: Assistant): Promise; - abstract deleteAssistant(assistant: Assistant): Promise; - abstract getAssistants(): Promise; + abstract createAssistant(assistant: Assistant): Promise + abstract deleteAssistant(assistant: Assistant): Promise + abstract getAssistants(): Promise } diff --git a/core/src/extensions/conversational.ts b/core/src/extensions/conversational.ts index 4319784c35..a49a4e6895 100644 --- a/core/src/extensions/conversational.ts +++ b/core/src/extensions/conversational.ts @@ -14,7 +14,7 @@ export abstract class ConversationalExtension * Conversation extension type. */ type(): ExtensionTypeEnum | undefined { - return ExtensionTypeEnum.Conversational; + return ExtensionTypeEnum.Conversational } abstract getThreads(): Promise diff --git a/core/src/extensions/index.ts b/core/src/extensions/index.ts index 1796c16187..5223345489 100644 --- a/core/src/extensions/index.ts +++ b/core/src/extensions/index.ts @@ -2,24 +2,24 @@ * Conversational extension. Persists and retrieves conversations. * @module */ -export { ConversationalExtension } from "./conversational"; +export { ConversationalExtension } from './conversational' /** * Inference extension. Start, stop and inference models. */ -export { InferenceExtension } from "./inference"; +export { InferenceExtension } from './inference' /** * Monitoring extension for system monitoring. */ -export { MonitoringExtension } from "./monitoring"; +export { MonitoringExtension } from './monitoring' /** * Assistant extension for managing assistants. */ -export { AssistantExtension } from "./assistant"; +export { AssistantExtension } from './assistant' /** * Model extension for managing models. 
*/ -export { ModelExtension } from "./model"; +export { ModelExtension } from './model' diff --git a/core/src/extensions/inference.ts b/core/src/extensions/inference.ts index c551d108f5..e8e51f9eb9 100644 --- a/core/src/extensions/inference.ts +++ b/core/src/extensions/inference.ts @@ -1,5 +1,5 @@ -import { InferenceInterface, MessageRequest, ThreadMessage } from "../index"; -import { BaseExtension, ExtensionTypeEnum } from "../extension"; +import { InferenceInterface, MessageRequest, ThreadMessage } from '../index' +import { BaseExtension, ExtensionTypeEnum } from '../extension' /** * Inference extension. Start, stop and inference models. @@ -9,8 +9,8 @@ export abstract class InferenceExtension extends BaseExtension implements Infere * Inference extension type. */ type(): ExtensionTypeEnum | undefined { - return ExtensionTypeEnum.Inference; + return ExtensionTypeEnum.Inference } - abstract inference(data: MessageRequest): Promise; + abstract inference(data: MessageRequest): Promise } diff --git a/core/src/extensions/model.ts b/core/src/extensions/model.ts index 30aa5b6ba2..df7d14f421 100644 --- a/core/src/extensions/model.ts +++ b/core/src/extensions/model.ts @@ -1,5 +1,5 @@ -import { BaseExtension, ExtensionTypeEnum } from "../extension"; -import { Model, ModelInterface } from "../index"; +import { BaseExtension, ExtensionTypeEnum } from '../extension' +import { Model, ModelInterface } from '../index' /** * Model extension for managing models. @@ -9,16 +9,16 @@ export abstract class ModelExtension extends BaseExtension implements ModelInter * Model extension type. 
*/ type(): ExtensionTypeEnum | undefined { - return ExtensionTypeEnum.Model; + return ExtensionTypeEnum.Model } abstract downloadModel( model: Model, - network?: { proxy: string; ignoreSSL?: boolean }, - ): Promise; - abstract cancelModelDownload(modelId: string): Promise; - abstract deleteModel(modelId: string): Promise; - abstract saveModel(model: Model): Promise; - abstract getDownloadedModels(): Promise; - abstract getConfiguredModels(): Promise; + network?: { proxy: string; ignoreSSL?: boolean } + ): Promise + abstract cancelModelDownload(modelId: string): Promise + abstract deleteModel(modelId: string): Promise + abstract saveModel(model: Model): Promise + abstract getDownloadedModels(): Promise + abstract getConfiguredModels(): Promise } diff --git a/core/src/extensions/monitoring.ts b/core/src/extensions/monitoring.ts index 2de9b9ae56..ba193f0f4d 100644 --- a/core/src/extensions/monitoring.ts +++ b/core/src/extensions/monitoring.ts @@ -1,5 +1,5 @@ -import { BaseExtension, ExtensionTypeEnum } from "../extension"; -import { MonitoringInterface } from "../index"; +import { BaseExtension, ExtensionTypeEnum } from '../extension' +import { MonitoringInterface } from '../index' /** * Monitoring extension for system monitoring. @@ -10,9 +10,9 @@ export abstract class MonitoringExtension extends BaseExtension implements Monit * Monitoring extension type. 
*/ type(): ExtensionTypeEnum | undefined { - return ExtensionTypeEnum.SystemMonitoring; + return ExtensionTypeEnum.SystemMonitoring } - abstract getResourcesInfo(): Promise; - abstract getCurrentLoad(): Promise; + abstract getResourcesInfo(): Promise + abstract getCurrentLoad(): Promise } diff --git a/core/src/index.ts b/core/src/index.ts index a56b6f0e13..3505797b19 100644 --- a/core/src/index.ts +++ b/core/src/index.ts @@ -38,3 +38,10 @@ export * from './extension' * @module */ export * from './extensions/index' + +/** + * Declare global object + */ +declare global { + var core: any | undefined +} diff --git a/core/src/node/api/common/adapter.ts b/core/src/node/api/common/adapter.ts new file mode 100644 index 0000000000..56f4cedb35 --- /dev/null +++ b/core/src/node/api/common/adapter.ts @@ -0,0 +1,43 @@ +import { + AppRoute, + DownloadRoute, + ExtensionRoute, + FileManagerRoute, + FileSystemRoute, +} from '../../../api' +import { Downloader } from '../processors/download' +import { FileSystem } from '../processors/fs' +import { Extension } from '../processors/extension' +import { FSExt } from '../processors/fsExt' +import { App } from '../processors/app' + +export class RequestAdapter { + downloader: Downloader + fileSystem: FileSystem + extension: Extension + fsExt: FSExt + app: App + + constructor(observer?: Function) { + this.downloader = new Downloader(observer) + this.fileSystem = new FileSystem() + this.extension = new Extension() + this.fsExt = new FSExt() + this.app = new App() + } + + // TODO: Clearer Factory pattern here + process(route: string, ...args: any) { + if (route in DownloadRoute) { + return this.downloader.process(route, ...args) + } else if (route in FileSystemRoute) { + return this.fileSystem.process(route, ...args) + } else if (route in ExtensionRoute) { + return this.extension.process(route, ...args) + } else if (route in FileManagerRoute) { + return this.fsExt.process(route, ...args) + } else if (route in AppRoute) { + return 
this.app.process(route, ...args) + } + } +} diff --git a/core/src/node/api/common/handler.ts b/core/src/node/api/common/handler.ts new file mode 100644 index 0000000000..4a39ae52a6 --- /dev/null +++ b/core/src/node/api/common/handler.ts @@ -0,0 +1,23 @@ +import { CoreRoutes } from '../../../api' +import { RequestAdapter } from './adapter' + +export type Handler = (route: string, args: any) => any + +export class RequestHandler { + handler: Handler + adataper: RequestAdapter + + constructor(handler: Handler, observer?: Function) { + this.handler = handler + this.adataper = new RequestAdapter(observer) + } + + handle() { + CoreRoutes.map((route) => { + this.handler(route, async (...args: any[]) => { + const values = await this.adataper.process(route, ...args) + return values + }) + }) + } +} diff --git a/core/src/node/api/index.ts b/core/src/node/api/index.ts index 4c3041ba3f..ab0c516569 100644 --- a/core/src/node/api/index.ts +++ b/core/src/node/api/index.ts @@ -1,2 +1,3 @@ export * from './HttpServer' -export * from './routes' +export * from './restful/v1' +export * from './common/handler' diff --git a/core/src/node/api/processors/Processor.ts b/core/src/node/api/processors/Processor.ts new file mode 100644 index 0000000000..8ef0c6e191 --- /dev/null +++ b/core/src/node/api/processors/Processor.ts @@ -0,0 +1,3 @@ +export abstract class Processor { + abstract process(key: string, ...args: any[]): any +} diff --git a/core/src/node/api/processors/app.ts b/core/src/node/api/processors/app.ts new file mode 100644 index 0000000000..c62b5011d8 --- /dev/null +++ b/core/src/node/api/processors/app.ts @@ -0,0 +1,96 @@ +import { basename, isAbsolute, join, relative } from 'path' + +import { Processor } from './Processor' +import { getAppConfigurations as appConfiguration, updateAppConfiguration } from '../../helper' +import { log as writeLog, logServer as writeServerLog } from '../../helper/log' +import { appResourcePath } from '../../helper/path' + +export class App 
implements Processor { + observer?: Function + + constructor(observer?: Function) { + this.observer = observer + } + + process(key: string, ...args: any[]): any { + const instance = this as any + const func = instance[key] + return func(...args) + } + + /** + * Joins multiple paths together, respect to the current OS. + */ + joinPath(args: any[]) { + return join(...args) + } + + /** + * Checks if the given path is a subdirectory of the given directory. + * + * @param _event - The IPC event object. + * @param from - The path to check. + * @param to - The directory to check against. + * + * @returns {Promise} - A promise that resolves with the result. + */ + isSubdirectory(from: any, to: any) { + const rel = relative(from, to) + const isSubdir = rel && !rel.startsWith('..') && !isAbsolute(rel) + + if (isSubdir === '') return false + else return isSubdir + } + + /** + * Retrieve basename from given path, respect to the current OS. + */ + baseName(args: any) { + return basename(args) + } + + /** + * Log message to log file. + */ + log(args: any) { + writeLog(args) + } + + /** + * Log message to log file. + */ + logServer(args: any) { + writeServerLog(args) + } + + getAppConfigurations() { + return appConfiguration() + } + + async updateAppConfiguration(args: any) { + await updateAppConfiguration(args) + } + + /** + * Start Jan API Server. + */ + async startServer(args?: any) { + const { startServer } = require('@janhq/server') + return startServer({ + host: args?.host, + port: args?.port, + isCorsEnabled: args?.isCorsEnabled, + isVerboseEnabled: args?.isVerboseEnabled, + schemaPath: join(await appResourcePath(), 'docs', 'openapi', 'jan.yaml'), + baseDir: join(await appResourcePath(), 'docs', 'openapi'), + }) + } + + /** + * Stop Jan API Server. 
+ */ + stopServer() { + const { stopServer } = require('@janhq/server') + return stopServer() + } +} diff --git a/core/src/node/api/processors/download.ts b/core/src/node/api/processors/download.ts new file mode 100644 index 0000000000..686ba58a1e --- /dev/null +++ b/core/src/node/api/processors/download.ts @@ -0,0 +1,106 @@ +import { resolve, sep } from 'path' +import { DownloadEvent } from '../../../api' +import { normalizeFilePath } from '../../helper/path' +import { getJanDataFolderPath } from '../../helper' +import { DownloadManager } from '../../helper/download' +import { createWriteStream, renameSync } from 'fs' +import { Processor } from './Processor' +import { DownloadState } from '../../../types' + +export class Downloader implements Processor { + observer?: Function + + constructor(observer?: Function) { + this.observer = observer + } + + process(key: string, ...args: any[]): any { + const instance = this as any + const func = instance[key] + return func(this.observer, ...args) + } + + downloadFile(observer: any, url: string, localPath: string, network: any) { + const request = require('request') + const progress = require('request-progress') + + const strictSSL = !network?.ignoreSSL + const proxy = network?.proxy?.startsWith('http') ? network.proxy : undefined + if (typeof localPath === 'string') { + localPath = normalizeFilePath(localPath) + } + const array = localPath.split(sep) + const fileName = array.pop() ?? '' + const modelId = array.pop() ?? 
'' + + const destination = resolve(getJanDataFolderPath(), localPath) + const rq = request({ url, strictSSL, proxy }) + + // Put request to download manager instance + DownloadManager.instance.setRequest(localPath, rq) + + // Downloading file to a temp file first + const downloadingTempFile = `${destination}.download` + + progress(rq, {}) + .on('progress', (state: any) => { + const downloadState: DownloadState = { + ...state, + modelId, + fileName, + downloadState: 'downloading', + } + console.log('progress: ', downloadState) + observer?.(DownloadEvent.onFileDownloadUpdate, downloadState) + DownloadManager.instance.downloadProgressMap[modelId] = downloadState + }) + .on('error', (error: Error) => { + const currentDownloadState = DownloadManager.instance.downloadProgressMap[modelId] + const downloadState: DownloadState = { + ...currentDownloadState, + error: error.message, + downloadState: 'error', + } + if (currentDownloadState) { + DownloadManager.instance.downloadProgressMap[modelId] = downloadState + } + + observer?.(DownloadEvent.onFileDownloadError, downloadState) + }) + .on('end', () => { + const currentDownloadState = DownloadManager.instance.downloadProgressMap[modelId] + if (currentDownloadState && DownloadManager.instance.networkRequests[localPath]) { + // Finished downloading, rename temp file to actual file + renameSync(downloadingTempFile, destination) + const downloadState: DownloadState = { + ...currentDownloadState, + downloadState: 'end', + } + observer?.(DownloadEvent.onFileDownloadSuccess, downloadState) + DownloadManager.instance.downloadProgressMap[modelId] = downloadState + } + }) + .pipe(createWriteStream(downloadingTempFile)) + } + + abortDownload(observer: any, fileName: string) { + const rq = DownloadManager.instance.networkRequests[fileName] + if (rq) { + DownloadManager.instance.networkRequests[fileName] = undefined + rq?.abort() + } else { + observer?.(DownloadEvent.onFileDownloadError, { + fileName, + error: 'aborted', + }) + } + } + + 
resumeDownload(observer: any, fileName: any) { + DownloadManager.instance.networkRequests[fileName]?.resume() + } + + pauseDownload(observer: any, fileName: any) { + DownloadManager.instance.networkRequests[fileName]?.pause() + } +} diff --git a/core/src/node/api/processors/extension.ts b/core/src/node/api/processors/extension.ts new file mode 100644 index 0000000000..df5d2d945c --- /dev/null +++ b/core/src/node/api/processors/extension.ts @@ -0,0 +1,88 @@ +import { readdirSync } from 'fs' +import { join, extname } from 'path' + +import { Processor } from './Processor' +import { ModuleManager } from '../../helper/module' +import { getJanExtensionsPath as getPath } from '../../helper' +import { + getActiveExtensions as getExtensions, + getExtension, + removeExtension, + installExtensions, +} from '../../extension/store' +import { appResourcePath } from '../../helper/path' + +export class Extension implements Processor { + observer?: Function + + constructor(observer?: Function) { + this.observer = observer + } + + process(key: string, ...args: any[]): any { + const instance = this as any + const func = instance[key] + return func(...args) + } + + invokeExtensionFunc(modulePath: string, method: string, ...params: any[]) { + const module = require(join(getPath(), modulePath)) + ModuleManager.instance.setModule(modulePath, module) + + if (typeof module[method] === 'function') { + return module[method](...params) + } else { + console.debug(module[method]) + console.error(`Function "${method}" does not exist in the module.`) + } + } + + /** + * Returns the paths of the base extensions. + * @returns An array of paths to the base extensions. 
+ */ + async baseExtensions() { + const baseExtensionPath = join(await appResourcePath(), 'pre-install') + return readdirSync(baseExtensionPath) + .filter((file) => extname(file) === '.tgz') + .map((file) => join(baseExtensionPath, file)) + } + + /**MARK: Extension Manager handlers */ + async installExtension(extensions: any) { + // Install and activate all provided extensions + const installed = await installExtensions(extensions) + return JSON.parse(JSON.stringify(installed)) + } + + // Register IPC route to uninstall a extension + async uninstallExtension(extensions: any) { + // Uninstall all provided extensions + for (const ext of extensions) { + const extension = getExtension(ext) + await extension.uninstall() + if (extension.name) removeExtension(extension.name) + } + + // Reload all renderer pages if needed + return true + } + + // Register IPC route to update a extension + async updateExtension(extensions: any) { + // Update all provided extensions + const updated: any[] = [] + for (const ext of extensions) { + const extension = getExtension(ext) + const res = await extension.update() + if (res) updated.push(extension) + } + + // Reload all renderer pages if needed + return JSON.parse(JSON.stringify(updated)) + } + + getActiveExtensions() { + return JSON.parse(JSON.stringify(getExtensions())) + } +} diff --git a/core/src/node/api/processors/fs.ts b/core/src/node/api/processors/fs.ts new file mode 100644 index 0000000000..93a5f19057 --- /dev/null +++ b/core/src/node/api/processors/fs.ts @@ -0,0 +1,25 @@ +import { join } from 'path' +import { normalizeFilePath } from '../../helper/path' +import { getJanDataFolderPath } from '../../helper' +import { Processor } from './Processor' + +export class FileSystem implements Processor { + observer?: Function + private static moduleName = 'fs' + + constructor(observer?: Function) { + this.observer = observer + } + + process(route: string, ...args: any[]): any { + return import(FileSystem.moduleName).then((mdl) => + 
mdl[route]( + ...args.map((arg: any) => + typeof arg === 'string' && (arg.startsWith(`file:/`) || arg.startsWith(`file:\\`)) + ? join(getJanDataFolderPath(), normalizeFilePath(arg)) + : arg + ) + ) + ) + } +} diff --git a/core/src/node/api/processors/fsExt.ts b/core/src/node/api/processors/fsExt.ts new file mode 100644 index 0000000000..71e07ae57b --- /dev/null +++ b/core/src/node/api/processors/fsExt.ts @@ -0,0 +1,78 @@ +import { join } from 'path' +import fs from 'fs' +import { FileManagerRoute } from '../../../api' +import { appResourcePath, normalizeFilePath } from '../../helper/path' +import { getJanDataFolderPath, getJanDataFolderPath as getPath } from '../../helper' +import { Processor } from './Processor' +import { FileStat } from '../../../types' + +export class FSExt implements Processor { + observer?: Function + + constructor(observer?: Function) { + this.observer = observer + } + + process(key: string, ...args: any): any { + const instance = this as any + const func = instance[key] + return func(...args) + } + + // Handles the 'syncFile' IPC event. This event is triggered to synchronize a file from a source path to a destination path. + syncFile(src: string, dest: string) { + const reflect = require('@alumna/reflect') + return reflect({ + src, + dest, + recursive: true, + delete: false, + overwrite: true, + errorOnExist: false, + }) + } + + // Handles the 'getJanDataFolderPath' IPC event. This event is triggered to get the user space path. + getJanDataFolderPath() { + return Promise.resolve(getPath()) + } + + // Handles the 'getResourcePath' IPC event. This event is triggered to get the resource path. + getResourcePath() { + return appResourcePath() + } + + // Handles the 'getUserHomePath' IPC event. This event is triggered to get the user home path. + getUserHomePath() { + return process.env[process.platform == 'win32' ? 
'USERPROFILE' : 'HOME'] + } + + // handle fs is directory here + fileStat(path: string) { + const normalizedPath = normalizeFilePath(path) + + const fullPath = join(getJanDataFolderPath(), normalizedPath) + const isExist = fs.existsSync(fullPath) + if (!isExist) return undefined + + const isDirectory = fs.lstatSync(fullPath).isDirectory() + const size = fs.statSync(fullPath).size + + const fileStat: FileStat = { + isDirectory, + size, + } + + return fileStat + } + + writeBlob(path: string, data: any) { + try { + const normalizedPath = normalizeFilePath(path) + const dataBuffer = Buffer.from(data, 'base64') + fs.writeFileSync(join(getJanDataFolderPath(), normalizedPath), dataBuffer) + } catch (err) { + console.error(`writeFile ${path} result: ${err}`) + } + } +} diff --git a/core/src/node/api/restful/app/download.ts b/core/src/node/api/restful/app/download.ts new file mode 100644 index 0000000000..b5919659b1 --- /dev/null +++ b/core/src/node/api/restful/app/download.ts @@ -0,0 +1,23 @@ +import { DownloadRoute } from '../../../../api' +import { DownloadManager } from '../../../helper/download' +import { HttpServer } from '../../HttpServer' + +export const downloadRouter = async (app: HttpServer) => { + app.get(`/download/${DownloadRoute.getDownloadProgress}/:modelId`, async (req, res) => { + const modelId = req.params.modelId + + console.debug(`Getting download progress for model ${modelId}`) + console.debug( + `All Download progress: ${JSON.stringify(DownloadManager.instance.downloadProgressMap)}` + ) + + // check if null DownloadManager.instance.downloadProgressMap + if (!DownloadManager.instance.downloadProgressMap[modelId]) { + return res.status(404).send({ + message: 'Download progress not found', + }) + } else { + return res.status(200).send(DownloadManager.instance.downloadProgressMap[modelId]) + } + }) +} diff --git a/core/src/node/api/restful/app/handlers.ts b/core/src/node/api/restful/app/handlers.ts new file mode 100644 index 0000000000..43c3f7add9 --- 
/dev/null +++ b/core/src/node/api/restful/app/handlers.ts @@ -0,0 +1,13 @@ +import { HttpServer } from '../../HttpServer' +import { Handler, RequestHandler } from '../../common/handler' + +export function handleRequests(app: HttpServer) { + const restWrapper: Handler = (route: string, listener: (...args: any[]) => any) => { + app.post(`/app/${route}`, async (request: any, reply: any) => { + const args = JSON.parse(request.body) as any[] + reply.send(JSON.stringify(await listener(...args))) + }) + } + const handler = new RequestHandler(restWrapper) + handler.handle() +} diff --git a/core/src/node/api/routes/common.ts b/core/src/node/api/restful/common.ts similarity index 53% rename from core/src/node/api/routes/common.ts rename to core/src/node/api/restful/common.ts index 27385e5619..4336329890 100644 --- a/core/src/node/api/routes/common.ts +++ b/core/src/node/api/restful/common.ts @@ -1,22 +1,34 @@ -import { AppRoute } from '../../../api' import { HttpServer } from '../HttpServer' -import { basename, join } from 'path' import { chatCompletions, deleteBuilder, downloadModel, getBuilder, retrieveBuilder, -} from '../common/builder' + createMessage, + createThread, + getMessages, + retrieveMessage, + updateThread, +} from './helper/builder' -import { JanApiRouteConfiguration } from '../common/configuration' -import { startModel, stopModel } from '../common/startStopModel' +import { JanApiRouteConfiguration } from './helper/configuration' +import { startModel, stopModel } from './helper/startStopModel' import { ModelSettingParams } from '../../../types' export const commonRouter = async (app: HttpServer) => { + const normalizeData = (data: any) => { + return { + object: 'list', + data, + } + } // Common Routes + // Read & Delete :: Threads | Models | Assistants Object.keys(JanApiRouteConfiguration).forEach((key) => { - app.get(`/${key}`, async (_request) => getBuilder(JanApiRouteConfiguration[key])) + app.get(`/${key}`, async (_request) => + 
getBuilder(JanApiRouteConfiguration[key]).then(normalizeData) + ) app.get(`/${key}/:id`, async (request: any) => retrieveBuilder(JanApiRouteConfiguration[key], request.params.id) @@ -27,7 +39,26 @@ export const commonRouter = async (app: HttpServer) => { ) }) - // Download Model Routes + // Threads + app.post(`/threads/`, async (req, res) => createThread(req.body)) + + app.get(`/threads/:threadId/messages`, async (req, res) => + getMessages(req.params.threadId).then(normalizeData) + ) + + app.get(`/threads/:threadId/messages/:messageId`, async (req, res) => + retrieveMessage(req.params.threadId, req.params.messageId) + ) + + app.post(`/threads/:threadId/messages`, async (req, res) => + createMessage(req.params.threadId as any, req.body as any) + ) + + app.patch(`/threads/:threadId`, async (request: any) => + updateThread(request.params.threadId, request.body) + ) + + // Models app.get(`/models/download/:modelId`, async (request: any) => downloadModel(request.params.modelId, { ignoreSSL: request.query.ignoreSSL === 'true', @@ -46,17 +77,6 @@ export const commonRouter = async (app: HttpServer) => { app.put(`/models/:modelId/stop`, async (request: any) => stopModel(request.params.modelId)) - // Chat Completion Routes + // Chat Completion app.post(`/chat/completions`, async (request: any, reply: any) => chatCompletions(request, reply)) - - // App Routes - app.post(`/app/${AppRoute.joinPath}`, async (request: any, reply: any) => { - const args = JSON.parse(request.body) as any[] - reply.send(JSON.stringify(join(...args[0]))) - }) - - app.post(`/app/${AppRoute.baseName}`, async (request: any, reply: any) => { - const args = JSON.parse(request.body) as any[] - reply.send(JSON.stringify(basename(args[0]))) - }) } diff --git a/core/src/node/api/common/builder.ts b/core/src/node/api/restful/helper/builder.ts similarity index 96% rename from core/src/node/api/common/builder.ts rename to core/src/node/api/restful/helper/builder.ts index 5c99cf4d8e..7001c0c769 100644 --- 
a/core/src/node/api/common/builder.ts +++ b/core/src/node/api/restful/helper/builder.ts @@ -1,10 +1,11 @@ import fs from 'fs' import { JanApiRouteConfiguration, RouteConfiguration } from './configuration' import { join } from 'path' -import { ContentType, MessageStatus, Model, ThreadMessage } from './../../../index' -import { getEngineConfiguration, getJanDataFolderPath } from '../../utils' +import { ContentType, MessageStatus, Model, ThreadMessage } from '../../../../index' +import { getEngineConfiguration, getJanDataFolderPath } from '../../../helper' import { DEFAULT_CHAT_COMPLETION_URL } from './consts' +// TODO: Refactor these export const getBuilder = async (configuration: RouteConfiguration) => { const directoryPath = join(getJanDataFolderPath(), configuration.dirName) try { @@ -124,7 +125,7 @@ export const getMessages = async (threadId: string): Promise => } } -export const retrieveMesasge = async (threadId: string, messageId: string) => { +export const retrieveMessage = async (threadId: string, messageId: string) => { const messages = await getMessages(threadId) const filteredMessages = messages.filter((m) => m.id === messageId) if (!filteredMessages || filteredMessages.length === 0) { @@ -317,13 +318,6 @@ export const chatCompletions = async (request: any, reply: any) => { apiUrl = engineConfiguration.full_url } - reply.raw.writeHead(200, { - 'Content-Type': 'text/event-stream', - 'Cache-Control': 'no-cache', - 'Connection': 'keep-alive', - 'Access-Control-Allow-Origin': '*', - }) - const headers: Record = { 'Content-Type': 'application/json', } @@ -342,8 +336,14 @@ export const chatCompletions = async (request: any, reply: any) => { }) if (response.status !== 200) { console.error(response) - return + reply.code(400).send(response) } else { + reply.raw.writeHead(200, { + 'Content-Type': 'text/event-stream', + 'Cache-Control': 'no-cache', + 'Connection': 'keep-alive', + 'Access-Control-Allow-Origin': '*', + }) response.body.pipe(reply.raw) } } diff --git 
a/core/src/node/api/common/configuration.ts b/core/src/node/api/restful/helper/configuration.ts similarity index 100% rename from core/src/node/api/common/configuration.ts rename to core/src/node/api/restful/helper/configuration.ts diff --git a/core/src/node/api/common/consts.ts b/core/src/node/api/restful/helper/consts.ts similarity index 100% rename from core/src/node/api/common/consts.ts rename to core/src/node/api/restful/helper/consts.ts diff --git a/core/src/node/api/common/startStopModel.ts b/core/src/node/api/restful/helper/startStopModel.ts similarity index 99% rename from core/src/node/api/common/startStopModel.ts rename to core/src/node/api/restful/helper/startStopModel.ts index 0d4934e1c0..0e6972b0bf 100644 --- a/core/src/node/api/common/startStopModel.ts +++ b/core/src/node/api/restful/helper/startStopModel.ts @@ -1,9 +1,9 @@ import fs from 'fs' import { join } from 'path' -import { getJanDataFolderPath, getJanExtensionsPath, getSystemResourceInfo } from '../../utils' -import { logServer } from '../../log' +import { getJanDataFolderPath, getJanExtensionsPath, getSystemResourceInfo } from '../../../helper' +import { logServer } from '../../../helper/log' import { ChildProcessWithoutNullStreams, spawn } from 'child_process' -import { Model, ModelSettingParams, PromptTemplate } from '../../../types' +import { Model, ModelSettingParams, PromptTemplate } from '../../../../types' import { LOCAL_HOST, NITRO_DEFAULT_PORT, diff --git a/core/src/node/api/restful/v1.ts b/core/src/node/api/restful/v1.ts new file mode 100644 index 0000000000..5eb8f50679 --- /dev/null +++ b/core/src/node/api/restful/v1.ts @@ -0,0 +1,16 @@ +import { HttpServer } from '../HttpServer' +import { commonRouter } from './common' +import { downloadRouter } from './app/download' +import { handleRequests } from './app/handlers' + +export const v1Router = async (app: HttpServer) => { + // MARK: Public API Routes + app.register(commonRouter) + + // MARK: Internal Application Routes + 
handleRequests(app) + + // Expanded route for tracking download progress + // TODO: Replace by Observer Wrapper (ZeroMQ / Vanilla Websocket) + app.register(downloadRouter) +} diff --git a/core/src/node/api/routes/download.ts b/core/src/node/api/routes/download.ts deleted file mode 100644 index b4e11f9578..0000000000 --- a/core/src/node/api/routes/download.ts +++ /dev/null @@ -1,58 +0,0 @@ -import { DownloadRoute } from '../../../api' -import { join } from 'path' -import { DownloadManager } from '../../download' -import { HttpServer } from '../HttpServer' -import { createWriteStream } from 'fs' -import { getJanDataFolderPath } from '../../utils' -import { normalizeFilePath } from "../../path"; - -export const downloadRouter = async (app: HttpServer) => { - app.post(`/${DownloadRoute.downloadFile}`, async (req, res) => { - const strictSSL = !(req.query.ignoreSSL === "true"); - const proxy = req.query.proxy?.startsWith("http") ? req.query.proxy : undefined; - const body = JSON.parse(req.body as any); - const normalizedArgs = body.map((arg: any) => { - if (typeof arg === "string") { - return join(getJanDataFolderPath(), normalizeFilePath(arg)); - } - return arg; - }); - - const localPath = normalizedArgs[1]; - const fileName = localPath.split("/").pop() ?? 
""; - - const request = require("request"); - const progress = require("request-progress"); - - const rq = request({ url: normalizedArgs[0], strictSSL, proxy }); - progress(rq, {}) - .on("progress", function (state: any) { - console.log("download onProgress", state); - }) - .on("error", function (err: Error) { - console.log("download onError", err); - }) - .on("end", function () { - console.log("download onEnd"); - }) - .pipe(createWriteStream(normalizedArgs[1])); - - DownloadManager.instance.setRequest(fileName, rq); - }); - - app.post(`/${DownloadRoute.abortDownload}`, async (req, res) => { - const body = JSON.parse(req.body as any); - const normalizedArgs = body.map((arg: any) => { - if (typeof arg === "string") { - return join(getJanDataFolderPath(), normalizeFilePath(arg)); - } - return arg; - }); - - const localPath = normalizedArgs[0]; - const fileName = localPath.split("/").pop() ?? ""; - const rq = DownloadManager.instance.networkRequests[fileName]; - DownloadManager.instance.networkRequests[fileName] = undefined; - rq?.abort(); - }); -}; diff --git a/core/src/node/api/routes/extension.ts b/core/src/node/api/routes/extension.ts deleted file mode 100644 index 02bc54eb37..0000000000 --- a/core/src/node/api/routes/extension.ts +++ /dev/null @@ -1,49 +0,0 @@ -import { join, extname } from 'path' -import { ExtensionRoute } from '../../../api/index' -import { ModuleManager } from '../../module' -import { getActiveExtensions, installExtensions } from '../../extension/store' -import { HttpServer } from '../HttpServer' - -import { readdirSync } from 'fs' -import { getJanExtensionsPath } from '../../utils' - -export const extensionRouter = async (app: HttpServer) => { - // TODO: Share code between node projects - app.post(`/${ExtensionRoute.getActiveExtensions}`, async (_req, res) => { - const activeExtensions = await getActiveExtensions() - res.status(200).send(activeExtensions) - }) - - app.post(`/${ExtensionRoute.baseExtensions}`, async (_req, res) => { - const 
baseExtensionPath = join(__dirname, '..', '..', '..', 'pre-install') - const extensions = readdirSync(baseExtensionPath) - .filter((file) => extname(file) === '.tgz') - .map((file) => join(baseExtensionPath, file)) - - res.status(200).send(extensions) - }) - - app.post(`/${ExtensionRoute.installExtension}`, async (req) => { - const extensions = req.body as any - const installed = await installExtensions(JSON.parse(extensions)[0]) - return JSON.parse(JSON.stringify(installed)) - }) - - app.post(`/${ExtensionRoute.invokeExtensionFunc}`, async (req, res) => { - const args = JSON.parse(req.body as any) - console.debug(args) - const module = await import(join(getJanExtensionsPath(), args[0])) - - ModuleManager.instance.setModule(args[0], module) - const method = args[1] - if (typeof module[method] === 'function') { - // remove first item from args - const newArgs = args.slice(2) - console.log(newArgs) - return module[method](...args.slice(2)) - } else { - console.debug(module[method]) - console.error(`Function "${method}" does not exist in the module.`) - } - }) -} diff --git a/core/src/node/api/routes/fileManager.ts b/core/src/node/api/routes/fileManager.ts deleted file mode 100644 index 66056444e0..0000000000 --- a/core/src/node/api/routes/fileManager.ts +++ /dev/null @@ -1,14 +0,0 @@ -import { FileManagerRoute } from '../../../api' -import { HttpServer } from '../../index' - -export const fsRouter = async (app: HttpServer) => { - app.post(`/app/${FileManagerRoute.syncFile}`, async (request: any, reply: any) => {}) - - app.post(`/app/${FileManagerRoute.getJanDataFolderPath}`, async (request: any, reply: any) => {}) - - app.post(`/app/${FileManagerRoute.getResourcePath}`, async (request: any, reply: any) => {}) - - app.post(`/app/${FileManagerRoute.getUserHomePath}`, async (request: any, reply: any) => {}) - - app.post(`/app/${FileManagerRoute.fileStat}`, async (request: any, reply: any) => {}) -} diff --git a/core/src/node/api/routes/fs.ts 
b/core/src/node/api/routes/fs.ts deleted file mode 100644 index c5404ccce9..0000000000 --- a/core/src/node/api/routes/fs.ts +++ /dev/null @@ -1,29 +0,0 @@ -import { FileSystemRoute } from '../../../api' -import { join } from 'path' -import { HttpServer } from '../HttpServer' -import { getJanDataFolderPath } from '../../utils' -import { normalizeFilePath } from '../../path' - -export const fsRouter = async (app: HttpServer) => { - const moduleName = 'fs' - // Generate handlers for each fs route - Object.values(FileSystemRoute).forEach((route) => { - app.post(`/${route}`, async (req, res) => { - const body = JSON.parse(req.body as any) - try { - const result = await import(moduleName).then((mdl) => { - return mdl[route]( - ...body.map((arg: any) => - typeof arg === 'string' && (arg.startsWith(`file:/`) || arg.startsWith(`file:\\`)) - ? join(getJanDataFolderPath(), normalizeFilePath(arg)) - : arg - ) - ) - }) - res.status(200).send(result) - } catch (ex) { - console.log(ex) - } - }) - }) -} diff --git a/core/src/node/api/routes/index.ts b/core/src/node/api/routes/index.ts deleted file mode 100644 index e6edc62f7c..0000000000 --- a/core/src/node/api/routes/index.ts +++ /dev/null @@ -1,6 +0,0 @@ -export * from './download' -export * from './extension' -export * from './fs' -export * from './thread' -export * from './common' -export * from './v1' diff --git a/core/src/node/api/routes/thread.ts b/core/src/node/api/routes/thread.ts deleted file mode 100644 index 4066d27165..0000000000 --- a/core/src/node/api/routes/thread.ts +++ /dev/null @@ -1,30 +0,0 @@ -import { HttpServer } from '../HttpServer' -import { - createMessage, - createThread, - getMessages, - retrieveMesasge, - updateThread, -} from '../common/builder' - -export const threadRouter = async (app: HttpServer) => { - // create thread - app.post(`/`, async (req, res) => createThread(req.body)) - - app.get(`/:threadId/messages`, async (req, res) => getMessages(req.params.threadId)) - - // retrieve message - 
app.get(`/:threadId/messages/:messageId`, async (req, res) => - retrieveMesasge(req.params.threadId, req.params.messageId), - ) - - // create message - app.post(`/:threadId/messages`, async (req, res) => - createMessage(req.params.threadId as any, req.body as any), - ) - - // modify thread - app.patch(`/:threadId`, async (request: any) => - updateThread(request.params.threadId, request.body), - ) -} diff --git a/core/src/node/api/routes/v1.ts b/core/src/node/api/routes/v1.ts deleted file mode 100644 index a2a48cd8b6..0000000000 --- a/core/src/node/api/routes/v1.ts +++ /dev/null @@ -1,25 +0,0 @@ -import { HttpServer } from '../HttpServer' -import { commonRouter } from './common' -import { threadRouter } from './thread' -import { fsRouter } from './fs' -import { extensionRouter } from './extension' -import { downloadRouter } from './download' - -export const v1Router = async (app: HttpServer) => { - // MARK: External Routes - app.register(commonRouter) - app.register(threadRouter, { - prefix: '/threads', - }) - - // MARK: Internal Application Routes - app.register(fsRouter, { - prefix: '/fs', - }) - app.register(extensionRouter, { - prefix: '/extension', - }) - app.register(downloadRouter, { - prefix: '/download', - }) -} diff --git a/core/src/node/extension/extension.ts b/core/src/node/extension/extension.ts index aeb0277c0b..1f8dfa3ec2 100644 --- a/core/src/node/extension/extension.ts +++ b/core/src/node/extension/extension.ts @@ -104,7 +104,7 @@ export default class Extension { await pacote.extract( this.specifier, join(ExtensionManager.instance.getExtensionsPath() ?? '', this.name ?? 
''), - this.installOptions, + this.installOptions ) // Set the url using the custom extensions protocol diff --git a/core/src/node/extension/index.ts b/core/src/node/extension/index.ts index ed8544773a..994fc97f2f 100644 --- a/core/src/node/extension/index.ts +++ b/core/src/node/extension/index.ts @@ -41,8 +41,8 @@ async function registerExtensionProtocol() { console.error('Electron is not available') } const extensionPath = ExtensionManager.instance.getExtensionsPath() - if (electron) { - return electron.protocol.registerFileProtocol('extension', (request: any, callback: any) => { + if (electron && electron.protocol) { + return electron.protocol?.registerFileProtocol('extension', (request: any, callback: any) => { const entry = request.url.substr('extension://'.length - 1) const url = normalize(extensionPath + entry) @@ -69,7 +69,7 @@ export function useExtensions(extensionsPath: string) { // Read extension list from extensions folder const extensions = JSON.parse( - readFileSync(ExtensionManager.instance.getExtensionsFile(), 'utf-8'), + readFileSync(ExtensionManager.instance.getExtensionsFile(), 'utf-8') ) try { // Create and store a Extension instance for each extension in list @@ -82,7 +82,7 @@ export function useExtensions(extensionsPath: string) { throw new Error( 'Could not successfully rebuild list of installed extensions.\n' + error + - '\nPlease check the extensions.json file in the extensions folder.', + '\nPlease check the extensions.json file in the extensions folder.' ) } @@ -122,7 +122,7 @@ function loadExtension(ext: any) { export function getStore() { if (!ExtensionManager.instance.getExtensionsFile()) { throw new Error( - 'The extension path has not yet been set up. Please run useExtensions before accessing the store', + 'The extension path has not yet been set up. 
Please run useExtensions before accessing the store' ) } diff --git a/core/src/node/extension/store.ts b/core/src/node/extension/store.ts index 84b1f9caf3..93b1aeb2b6 100644 --- a/core/src/node/extension/store.ts +++ b/core/src/node/extension/store.ts @@ -1,6 +1,6 @@ -import { writeFileSync } from "fs"; -import Extension from "./extension"; -import { ExtensionManager } from "./manager"; +import { writeFileSync } from 'fs' +import Extension from './extension' +import { ExtensionManager } from './manager' /** * @module store @@ -11,7 +11,7 @@ import { ExtensionManager } from "./manager"; * Register of installed extensions * @type {Object.} extension - List of installed extensions */ -const extensions: Record = {}; +const extensions: Record = {} /** * Get a extension from the stored extensions. @@ -21,10 +21,10 @@ const extensions: Record = {}; */ export function getExtension(name: string) { if (!Object.prototype.hasOwnProperty.call(extensions, name)) { - throw new Error(`Extension ${name} does not exist`); + throw new Error(`Extension ${name} does not exist`) } - return extensions[name]; + return extensions[name] } /** @@ -33,7 +33,7 @@ export function getExtension(name: string) { * @alias extensionManager.getAllExtensions */ export function getAllExtensions() { - return Object.values(extensions); + return Object.values(extensions) } /** @@ -42,7 +42,7 @@ export function getAllExtensions() { * @alias extensionManager.getActiveExtensions */ export function getActiveExtensions() { - return Object.values(extensions).filter((extension) => extension.active); + return Object.values(extensions).filter((extension) => extension.active) } /** @@ -53,9 +53,9 @@ export function getActiveExtensions() { * @alias extensionManager.removeExtension */ export function removeExtension(name: string, persist = true) { - const del = delete extensions[name]; - if (persist) persistExtensions(); - return del; + const del = delete extensions[name] + if (persist) persistExtensions() + return 
del } /** @@ -65,10 +65,10 @@ export function removeExtension(name: string, persist = true) { * @returns {void} */ export function addExtension(extension: Extension, persist = true) { - if (extension.name) extensions[extension.name] = extension; + if (extension.name) extensions[extension.name] = extension if (persist) { - persistExtensions(); - extension.subscribe("pe-persist", persistExtensions); + persistExtensions() + extension.subscribe('pe-persist', persistExtensions) } } @@ -77,14 +77,11 @@ export function addExtension(extension: Extension, persist = true) { * @returns {void} */ export function persistExtensions() { - const persistData: Record = {}; + const persistData: Record = {} for (const name in extensions) { - persistData[name] = extensions[name]; + persistData[name] = extensions[name] } - writeFileSync( - ExtensionManager.instance.getExtensionsFile(), - JSON.stringify(persistData), - ); + writeFileSync(ExtensionManager.instance.getExtensionsFile(), JSON.stringify(persistData)) } /** @@ -94,26 +91,29 @@ export function persistExtensions() { * @returns {Promise.>} New extension * @alias extensionManager.installExtensions */ -export async function installExtensions(extensions: any, store = true) { - const installed: Extension[] = []; +export async function installExtensions(extensions: any) { + const installed: Extension[] = [] for (const ext of extensions) { // Set install options and activation based on input type - const isObject = typeof ext === "object"; - const spec = isObject ? [ext.specifier, ext] : [ext]; - const activate = isObject ? ext.activate !== false : true; + const isObject = typeof ext === 'object' + const spec = isObject ? [ext.specifier, ext] : [ext] + const activate = isObject ? 
ext.activate !== false : true // Install and possibly activate extension - const extension = new Extension(...spec); - await extension._install(); - if (activate) extension.setActive(true); + const extension = new Extension(...spec) + if (!extension.origin) { + continue + } + await extension._install() + if (activate) extension.setActive(true) // Add extension to store if needed - if (store) addExtension(extension); - installed.push(extension); + addExtension(extension) + installed.push(extension) } // Return list of all installed extensions - return installed; + return installed } /** diff --git a/core/src/node/utils/index.ts b/core/src/node/helper/config.ts similarity index 91% rename from core/src/node/utils/index.ts rename to core/src/node/helper/config.ts index 4bcbf13b17..71e7215780 100644 --- a/core/src/node/utils/index.ts +++ b/core/src/node/helper/config.ts @@ -1,8 +1,7 @@ -import { AppConfiguration, SystemResourceInfo } from '../../types' +import { AppConfiguration } from '../../types' import { join } from 'path' import fs from 'fs' import os from 'os' -import { log, logServer } from '../log' import childProcess from 'child_process' // TODO: move this to core @@ -56,34 +55,6 @@ export const updateAppConfiguration = (configuration: AppConfiguration): Promise return Promise.resolve() } -/** - * Utility function to get server log path - * - * @returns {string} The log path. - */ -export const getServerLogPath = (): string => { - const appConfigurations = getAppConfigurations() - const logFolderPath = join(appConfigurations.data_folder, 'logs') - if (!fs.existsSync(logFolderPath)) { - fs.mkdirSync(logFolderPath, { recursive: true }) - } - return join(logFolderPath, 'server.log') -} - -/** - * Utility function to get app log path - * - * @returns {string} The log path. 
- */ -export const getAppLogPath = (): string => { - const appConfigurations = getAppConfigurations() - const logFolderPath = join(appConfigurations.data_folder, 'logs') - if (!fs.existsSync(logFolderPath)) { - fs.mkdirSync(logFolderPath, { recursive: true }) - } - return join(logFolderPath, 'app.log') -} - /** * Utility function to get data folder path * @@ -146,18 +117,6 @@ const exec = async (command: string): Promise => { }) } -export const getSystemResourceInfo = async (): Promise => { - const cpu = await physicalCpuCount() - const message = `[NITRO]::CPU informations - ${cpu}` - log(message) - logServer(message) - - return { - numCpuPhysicalCore: cpu, - memAvailable: 0, // TODO: this should not be 0 - } -} - export const getEngineConfiguration = async (engineId: string) => { if (engineId !== 'openai') { return undefined @@ -167,3 +126,31 @@ export const getEngineConfiguration = async (engineId: string) => { const data = fs.readFileSync(filePath, 'utf-8') return JSON.parse(data) } + +/** + * Utility function to get server log path + * + * @returns {string} The log path. + */ +export const getServerLogPath = (): string => { + const appConfigurations = getAppConfigurations() + const logFolderPath = join(appConfigurations.data_folder, 'logs') + if (!fs.existsSync(logFolderPath)) { + fs.mkdirSync(logFolderPath, { recursive: true }) + } + return join(logFolderPath, 'server.log') +} + +/** + * Utility function to get app log path + * + * @returns {string} The log path. 
+ */ +export const getAppLogPath = (): string => { + const appConfigurations = getAppConfigurations() + const logFolderPath = join(appConfigurations.data_folder, 'logs') + if (!fs.existsSync(logFolderPath)) { + fs.mkdirSync(logFolderPath, { recursive: true }) + } + return join(logFolderPath, 'app.log') +} diff --git a/core/src/node/download.ts b/core/src/node/helper/download.ts similarity index 67% rename from core/src/node/download.ts rename to core/src/node/helper/download.ts index 6d15fc3445..b9fb88bb5c 100644 --- a/core/src/node/download.ts +++ b/core/src/node/helper/download.ts @@ -1,15 +1,18 @@ +import { DownloadState } from '../../types' /** * Manages file downloads and network requests. */ export class DownloadManager { - public networkRequests: Record = {}; + public networkRequests: Record = {} - public static instance: DownloadManager = new DownloadManager(); + public static instance: DownloadManager = new DownloadManager() + + public downloadProgressMap: Record = {} constructor() { if (DownloadManager.instance) { - return DownloadManager.instance; + return DownloadManager.instance } } /** @@ -18,6 +21,6 @@ export class DownloadManager { * @param {Request | undefined} request - The network request to set, or undefined to clear the request. 
*/ setRequest(fileName: string, request: any | undefined) { - this.networkRequests[fileName] = request; + this.networkRequests[fileName] = request } } diff --git a/core/src/node/helper/index.ts b/core/src/node/helper/index.ts new file mode 100644 index 0000000000..6fc54fc6b1 --- /dev/null +++ b/core/src/node/helper/index.ts @@ -0,0 +1,6 @@ +export * from './config' +export * from './download' +export * from './log' +export * from './module' +export * from './path' +export * from './resource' diff --git a/core/src/node/log.ts b/core/src/node/helper/log.ts similarity index 93% rename from core/src/node/log.ts rename to core/src/node/helper/log.ts index 6f2c2f80f3..8ff1969434 100644 --- a/core/src/node/log.ts +++ b/core/src/node/helper/log.ts @@ -1,6 +1,6 @@ import fs from 'fs' import util from 'util' -import { getAppLogPath, getServerLogPath } from './utils' +import { getAppLogPath, getServerLogPath } from './config' export const log = (message: string) => { const path = getAppLogPath() diff --git a/core/src/node/module.ts b/core/src/node/helper/module.ts similarity index 100% rename from core/src/node/module.ts rename to core/src/node/helper/module.ts diff --git a/core/src/node/helper/path.ts b/core/src/node/helper/path.ts new file mode 100644 index 0000000000..c20889f4c9 --- /dev/null +++ b/core/src/node/helper/path.ts @@ -0,0 +1,35 @@ +import { join } from 'path' + +/** + * Normalize file path + * Remove all file protocol prefix + * @param path + * @returns + */ +export function normalizeFilePath(path: string): string { + return path.replace(/^(file:[\\/]+)([^:\s]+)$/, '$2') +} + +export async function appResourcePath(): Promise { + let electron: any = undefined + + try { + const moduleName = 'electron' + electron = await import(moduleName) + } catch (err) { + console.error('Electron is not available') + } + + // electron + if (electron && electron.protocol) { + let appPath = join(electron.app.getAppPath(), '..', 'app.asar.unpacked') + + if 
(!electron.app.isPackaged) { + // for development mode + appPath = join(electron.app.getAppPath()) + } + return appPath + } + // server + return join(global.core.appPath(), '../../..') +} diff --git a/core/src/node/helper/resource.ts b/core/src/node/helper/resource.ts new file mode 100644 index 0000000000..c79a63688b --- /dev/null +++ b/core/src/node/helper/resource.ts @@ -0,0 +1,14 @@ +import { SystemResourceInfo } from '../../types' +import { physicalCpuCount } from './config' +import { log, logServer } from './log' + +export const getSystemResourceInfo = async (): Promise => { + const cpu = await physicalCpuCount() + const message = `[NITRO]::CPU informations - ${cpu}` + log(message) + + return { + numCpuPhysicalCore: cpu, + memAvailable: 0, // TODO: this should not be 0 + } +} diff --git a/core/src/node/index.ts b/core/src/node/index.ts index 10385ecfcc..31f2f076e9 100644 --- a/core/src/node/index.ts +++ b/core/src/node/index.ts @@ -2,9 +2,5 @@ export * from './extension/index' export * from './extension/extension' export * from './extension/manager' export * from './extension/store' -export * from './download' -export * from './module' export * from './api' -export * from './log' -export * from './utils' -export * from './path' +export * from './helper' diff --git a/core/src/node/path.ts b/core/src/node/path.ts deleted file mode 100644 index adbc38c6c1..0000000000 --- a/core/src/node/path.ts +++ /dev/null @@ -1,9 +0,0 @@ -/** - * Normalize file path - * Remove all file protocol prefix - * @param path - * @returns - */ -export function normalizeFilePath(path: string): string { - return path.replace(/^(file:[\\/]+)([^:\s]+)$/, "$2"); -} diff --git a/core/src/types/assistant/assistantEvent.ts b/core/src/types/assistant/assistantEvent.ts new file mode 100644 index 0000000000..8c32f5d37a --- /dev/null +++ b/core/src/types/assistant/assistantEvent.ts @@ -0,0 +1,7 @@ +/** + * The `EventName` enumeration contains the names of all the available events in the Jan 
platform. + */ +export enum AssistantEvent { + /** The `OnAssistantsUpdate` event is emitted when the assistant list is updated. */ + OnAssistantsUpdate = 'OnAssistantsUpdate', +} diff --git a/core/src/types/assistant/index.ts b/core/src/types/assistant/index.ts index 83ea73f856..e18589551a 100644 --- a/core/src/types/assistant/index.ts +++ b/core/src/types/assistant/index.ts @@ -1,2 +1,3 @@ export * from './assistantEntity' +export * from './assistantEvent' export * from './assistantInterface' diff --git a/core/src/types/file/index.ts b/core/src/types/file/index.ts index 6526cfc6d4..cc7274a28f 100644 --- a/core/src/types/file/index.ts +++ b/core/src/types/file/index.ts @@ -2,3 +2,26 @@ export type FileStat = { isDirectory: boolean size: number } + +export type DownloadState = { + modelId: string + fileName: string + time: DownloadTime + speed: number + percent: number + + size: DownloadSize + children?: DownloadState[] + error?: string + downloadState: 'downloading' | 'error' | 'end' +} + +type DownloadTime = { + elapsed: number + remaining: number +} + +type DownloadSize = { + total: number + transferred: number +} diff --git a/core/src/types/message/index.ts b/core/src/types/message/index.ts index e8d78deda4..ebb4c363d8 100644 --- a/core/src/types/message/index.ts +++ b/core/src/types/message/index.ts @@ -1,3 +1,4 @@ export * from './messageEntity' export * from './messageInterface' export * from './messageEvent' +export * from './messageRequestType' diff --git a/core/src/types/message/messageEntity.ts b/core/src/types/message/messageEntity.ts index 87e4b1997e..e9211d5508 100644 --- a/core/src/types/message/messageEntity.ts +++ b/core/src/types/message/messageEntity.ts @@ -27,6 +27,8 @@ export type ThreadMessage = { updated: number /** The additional metadata of this message. **/ metadata?: Record + + type?: string } /** @@ -56,6 +58,8 @@ export type MessageRequest = { /** The thread of this message is belong to. 
**/ // TODO: deprecate threadId field thread?: Thread + + type?: string } /** diff --git a/core/src/types/message/messageRequestType.ts b/core/src/types/message/messageRequestType.ts new file mode 100644 index 0000000000..cbb4cf4217 --- /dev/null +++ b/core/src/types/message/messageRequestType.ts @@ -0,0 +1,5 @@ +export enum MessageRequestType { + Thread = 'Thread', + Assistant = 'Assistant', + Summary = 'Summary', +} diff --git a/core/src/types/model/modelEvent.ts b/core/src/types/model/modelEvent.ts index 978a487249..443f3a34fb 100644 --- a/core/src/types/model/modelEvent.ts +++ b/core/src/types/model/modelEvent.ts @@ -12,4 +12,6 @@ export enum ModelEvent { OnModelStop = 'OnModelStop', /** The `OnModelStopped` event is emitted when a model stopped ok. */ OnModelStopped = 'OnModelStopped', + /** The `OnModelUpdate` event is emitted when the model list is updated. */ + OnModelsUpdate = 'OnModelsUpdate', } diff --git a/core/src/types/model/modelInterface.ts b/core/src/types/model/modelInterface.ts index 74a479f3cb..93d5867eeb 100644 --- a/core/src/types/model/modelInterface.ts +++ b/core/src/types/model/modelInterface.ts @@ -10,7 +10,7 @@ export interface ModelInterface { * @param network - Optional object to specify proxy/whether to ignore SSL certificates. * @returns A Promise that resolves when the model has been downloaded. */ - downloadModel(model: Model, network?: { ignoreSSL?: boolean, proxy?: string }): Promise + downloadModel(model: Model, network?: { ignoreSSL?: boolean; proxy?: string }): Promise /** * Cancels the download of a specific model. 
diff --git a/core/tests/node/path.test.ts b/core/tests/node/path.test.ts index 9f8a557bb0..5390df1193 100644 --- a/core/tests/node/path.test.ts +++ b/core/tests/node/path.test.ts @@ -1,4 +1,4 @@ -import { normalizeFilePath } from "../../src/node/path"; +import { normalizeFilePath } from "../../src/node/helper/path"; describe("Test file normalize", () => { test("returns no file protocol prefix on Unix", async () => { diff --git a/core/tslint.json b/core/tslint.json index 398a416704..6543a641a1 100644 --- a/core/tslint.json +++ b/core/tslint.json @@ -1,6 +1,3 @@ { - "extends": [ - "tslint-config-standard", - "tslint-config-prettier" - ] -} \ No newline at end of file + "extends": ["tslint-config-standard", "tslint-config-prettier"] +} diff --git a/docker-compose.yml b/docker-compose.yml new file mode 100644 index 0000000000..1691a841a0 --- /dev/null +++ b/docker-compose.yml @@ -0,0 +1,172 @@ +# Docker Compose file for setting up Minio, createbuckets, app_cpu, and app_gpu services + +version: '3.7' + +services: + # Minio service for object storage + minio: + image: minio/minio + volumes: + - minio_data:/data + ports: + - "9000:9000" + - "9001:9001" + environment: + # Set the root user and password for Minio + MINIO_ROOT_USER: minioadmin # This acts as AWS_ACCESS_KEY + MINIO_ROOT_PASSWORD: minioadmin # This acts as AWS_SECRET_ACCESS_KEY + command: server --console-address ":9001" /data + restart: always + healthcheck: + test: ["CMD", "curl", "-f", "http://localhost:9000/minio/health/live"] + interval: 30s + timeout: 20s + retries: 3 + networks: + vpcbr: + ipv4_address: 10.5.0.2 + + # createbuckets service to create a bucket and set its policy + createbuckets: + image: minio/mc + depends_on: + - minio + entrypoint: > + /bin/sh -c " + /usr/bin/mc alias set myminio http://minio:9000 minioadmin minioadmin; + /usr/bin/mc mb myminio/mybucket; + /usr/bin/mc policy set public myminio/mybucket; + exit 0; + " + networks: + vpcbr: + + # app_cpu service for running the CPU version 
of the application + app_cpu_s3fs: + image: jan:latest + volumes: + - app_data_cpu_s3fs:/app/server/build/jan + build: + context: . + dockerfile: Dockerfile + environment: + # Set the AWS access key, secret access key, bucket name, endpoint, and region for app_cpu + AWS_ACCESS_KEY_ID: minioadmin + AWS_SECRET_ACCESS_KEY: minioadmin + S3_BUCKET_NAME: mybucket + AWS_ENDPOINT: http://10.5.0.2:9000 + AWS_REGION: us-east-1 + API_BASE_URL: http://localhost:1337 + restart: always + profiles: + - cpu-s3fs + ports: + - "3000:3000" + - "1337:1337" + - "3928:3928" + networks: + vpcbr: + ipv4_address: 10.5.0.3 + + # app_gpu service for running the GPU version of the application + app_gpu_s3fs: + deploy: + resources: + reservations: + devices: + - driver: nvidia + count: all + capabilities: [gpu] + image: jan-gpu:latest + volumes: + - app_data_gpu_s3fs:/app/server/build/jan + build: + context: . + dockerfile: Dockerfile.gpu + restart: always + environment: + # Set the AWS access key, secret access key, bucket name, endpoint, and region for app_gpu + AWS_ACCESS_KEY_ID: minioadmin + AWS_SECRET_ACCESS_KEY: minioadmin + S3_BUCKET_NAME: mybucket + AWS_ENDPOINT: http://10.5.0.2:9000 + AWS_REGION: us-east-1 + API_BASE_URL: http://localhost:1337 + profiles: + - gpu-s3fs + ports: + - "3000:3000" + - "1337:1337" + - "3928:3928" + networks: + vpcbr: + ipv4_address: 10.5.0.4 + + app_cpu_fs: + image: jan:latest + volumes: + - app_data_cpu_fs:/app/server/build/jan + build: + context: . + dockerfile: Dockerfile + environment: + API_BASE_URL: http://localhost:1337 + restart: always + profiles: + - cpu-fs + ports: + - "3000:3000" + - "1337:1337" + - "3928:3928" + networks: + vpcbr: + ipv4_address: 10.5.0.5 + + # app_gpu service for running the GPU version of the application + app_gpu_fs: + deploy: + resources: + reservations: + devices: + - driver: nvidia + count: all + capabilities: [gpu] + image: jan-gpu:latest + volumes: + - app_data_gpu_fs:/app/server/build/jan + build: + context: . 
+ dockerfile: Dockerfile.gpu + restart: always + environment: + API_BASE_URL: http://localhost:1337 + profiles: + - gpu-fs + ports: + - "3000:3000" + - "1337:1337" + - "3928:3928" + networks: + vpcbr: + ipv4_address: 10.5.0.6 + +volumes: + minio_data: + app_data_cpu_s3fs: + app_data_gpu_s3fs: + app_data_cpu_fs: + app_data_gpu_fs: + +networks: + vpcbr: + driver: bridge + ipam: + config: + - subnet: 10.5.0.0/16 + gateway: 10.5.0.1 + +# Usage: +# - Run 'docker compose --profile cpu-s3fs up -d' to start the app_cpu service +# - Run 'docker compose --profile gpu-s3fs up -d' to start the app_gpu service +# - Run 'docker compose --profile cpu-fs up -d' to start the app_cpu service +# - Run 'docker compose --profile gpu-fs up -d' to start the app_gpu service diff --git a/docs/blog/authors.yml b/docs/blog/authors.yml index f30d4610dd..ec58002e48 100644 --- a/docs/blog/authors.yml +++ b/docs/blog/authors.yml @@ -1,6 +1,76 @@ dan-jan: name: Daniel Onggunhao title: Co-Founder - url: https://github.com/dan-jan + url: https://github.com/dan-jan image_url: https://avatars.githubusercontent.com/u/101145494?v=4 - email: daniel@jan.ai \ No newline at end of file + email: daniel@jan.ai + +namchuai: + name: Nam Nguyen + title: Developer + url: https://github.com/namchuai + image_url: https://avatars.githubusercontent.com/u/10397206?v=4 + email: james@jan.ai + +hiro-v: + name: Hiro Vuong + title: MLE + url: https://github.com/hiro-v + image_url: https://avatars.githubusercontent.com/u/22463238?v=4 + email: hiro@jan.ai + +ashley-jan: + name: Ashley Tran + title: Product Designer + url: https://github.com/imtuyethan + image_url: https://avatars.githubusercontent.com/u/89722390?v=4 + email: ashley@jan.ai + +hientominh: + name: Hien To + title: DevOps Engineer + url: https://github.com/hientominh + image_url: https://avatars.githubusercontent.com/u/37921427?v=4 + email: hien@jan.ai + +Van-QA: + name: Van Pham + title: QA & Release Manager + url: https://github.com/Van-QA + image_url: 
https://avatars.githubusercontent.com/u/64197333?v=4 + email: van@jan.ai + +louis-jan: + name: Louis Le + title: Software Engineer + url: https://github.com/louis-jan + image_url: https://avatars.githubusercontent.com/u/133622055?v=4 + email: louis@jan.ai + +hahuyhoang411: + name: Rex Ha + title: LLM Researcher & Content Writer + url: https://github.com/hahuyhoang411 + image_url: https://avatars.githubusercontent.com/u/64120343?v=4 + email: rex@jan.ai + +automaticcat: + name: Alan Dao + title: AI Engineer + url: https://github.com/tikikun + image_url: https://avatars.githubusercontent.com/u/22268502?v=4 + email: alan@jan.ai + +hieu-jan: + name: Henry Ho + title: Software Engineer + url: https://github.com/hieu-jan + image_url: https://avatars.githubusercontent.com/u/150573299?v=4 + email: hieu@jan.ai + +0xsage: + name: Nicole Zhu + title: Co-Founder + url: https://github.com/0xsage + image_url: https://avatars.githubusercontent.com/u/69952136?v=4 + email: nicole@jan.ai diff --git a/docs/docs/about/01-README.md b/docs/docs/about/01-README.md index 3b27595135..d5d3b8dc22 100644 --- a/docs/docs/about/01-README.md +++ b/docs/docs/about/01-README.md @@ -110,9 +110,10 @@ Adhering to Jan's privacy preserving philosophy, our analytics philosophy is to #### What is tracked -1. By default, Github tracks downloads and device metadata for all public Github repos. This helps us troubleshoot & ensure cross platform support. -1. We use Posthog to track a single `app.opened` event without additional user metadata, in order to understand retention. -1. Additionally, we plan to enable a `Settings` feature for users to turn off all tracking. +1. By default, Github tracks downloads and device metadata for all public GitHub repositories. This helps us troubleshoot & ensure cross-platform support. +2. We use [Umami](https://umami.is/) to collect, analyze, and understand application data while maintaining visitor privacy and data ownership. 
We are using the Umami Cloud in Europe to ensure GDPR compliance. Please see [Umami Privacy Policy](https://umami.is/privacy) for more details. +3. We use Umami to track a single `app.opened` event without additional user metadata, in order to understand retention. In addition, we track `app.event` to understand app version usage. +4. Additionally, we plan to enable a `Settings` feature for users to turn off all tracking. #### Request for help diff --git a/docs/docs/developer/01-overview/04-install-and-prerequisites.md b/docs/docs/developer/01-overview/04-install-and-prerequisites.md new file mode 100644 index 0000000000..110f62e361 --- /dev/null +++ b/docs/docs/developer/01-overview/04-install-and-prerequisites.md @@ -0,0 +1,79 @@ +--- +title: Installation and Prerequisites +slug: /developer/prereq +description: Guide to install and setup Jan for development. +keywords: + [ + Jan AI, + Jan, + ChatGPT alternative, + local AI, + private AI, + conversational AI, + no-subscription fee, + large language model, + installation, + prerequisites, + developer setup, + ] +--- + +## Requirements + +### Hardware Requirements + +Ensure your system meets the following specifications to guarantee a smooth development experience: + +- [Hardware Requirements](../../guides/02-installation/06-hardware.md) + +### System Requirements + +Make sure your operating system meets the specific requirements for Jan development: + +- [Windows](../../install/windows/#system-requirements) +- [MacOS](../../install/mac/#system-requirements) +- [Linux](../../install/linux/#system-requirements) + +## Prerequisites + +- [Node.js](https://nodejs.org/en/) (version 20.0.0 or higher) +- [yarn](https://yarnpkg.com/) (version 1.22.0 or higher) +- [make](https://www.gnu.org/software/make/) (version 3.81 or higher) + +## Instructions + +1. **Clone the Repository:** + +```bash +git clone https://github.com/janhq/jan +cd jan +git checkout -b DESIRED_BRANCH +``` + +2. 
**Install Dependencies** + +```bash +yarn install +``` + +3. **Run Development and Use Jan Desktop** + +```bash +make dev +``` + +This command starts the development server and opens the Jan Desktop app. + +## For Production Build + +```bash +# Do steps 1 and 2 in the previous section +# Build the app +make build +``` + +This will build the app MacOS (M1/M2/M3) for production (with code signing already done) and place the result in `/electron/dist` folder. + +## Troubleshooting + +If you run into any issues due to a broken build, please check the [Stuck on a Broken Build](../../troubleshooting/stuck-on-broken-build) guide. diff --git a/docs/docs/guides/02-installation/01-mac.md b/docs/docs/guides/02-installation/01-mac.md index 8e67b5bed2..7a39613843 100644 --- a/docs/docs/guides/02-installation/01-mac.md +++ b/docs/docs/guides/02-installation/01-mac.md @@ -12,11 +12,16 @@ keywords: conversational AI, no-subscription fee, large language model, + installation guide, ] --- # Installing Jan on MacOS +## System Requirements + +Ensure that your MacOS version is 13 or higher to run Jan. + ## Installation Jan is available for download via our homepage, [https://jan.ai/](https://jan.ai/). diff --git a/docs/docs/guides/02-installation/02-windows.md b/docs/docs/guides/02-installation/02-windows.md index b200554d22..d60ab86f7f 100644 --- a/docs/docs/guides/02-installation/02-windows.md +++ b/docs/docs/guides/02-installation/02-windows.md @@ -12,11 +12,23 @@ keywords: conversational AI, no-subscription fee, large language model, + installation guide, ] --- # Installing Jan on Windows +## System Requirements + +Ensure that your system meets the following requirements: + +- Windows 10 or higher is required to run Jan. + +To enable GPU support, you will need: + +- NVIDIA GPU with CUDA Toolkit 11.7 or higher +- NVIDIA driver 470.63.01 or higher + ## Installation Jan is available for download via our homepage, [https://jan.ai](https://jan.ai/). 
@@ -59,13 +71,3 @@ To remove all user data associated with Jan, you can delete the `/jan` directory cd C:\Users\%USERNAME%\AppData\Roaming rmdir /S jan ``` - -## Troubleshooting - -### Microsoft Defender - -**Error: "Microsoft Defender SmartScreen prevented an unrecognized app from starting"** - -Windows Defender may display the above warning when running the Jan Installer, as a standard security measure. - -To proceed, select the "More info" option and select the "Run Anyway" option to continue with the installation. diff --git a/docs/docs/guides/02-installation/03-linux.md b/docs/docs/guides/02-installation/03-linux.md index 21dfac1a96..0ec7fea605 100644 --- a/docs/docs/guides/02-installation/03-linux.md +++ b/docs/docs/guides/02-installation/03-linux.md @@ -12,11 +12,24 @@ keywords: conversational AI, no-subscription fee, large language model, + installation guide, ] --- # Installing Jan on Linux +## System Requirements + +Ensure that your system meets the following requirements: + +- glibc 2.27 or higher (check with `ldd --version`) +- gcc 11, g++ 11, cpp 11, or higher, refer to this [link](https://jan.ai/guides/troubleshooting/gpu-not-used/#specific-requirements-for-linux) for more information. + +To enable GPU support, you will need: + +- NVIDIA GPU with CUDA Toolkit 11.7 or higher +- NVIDIA driver 470.63.01 or higher + ## Installation Jan is available for download via our homepage, [https://jan.ai](https://jan.ai/). @@ -66,7 +79,6 @@ jan-linux-amd64-{version}.deb # AppImage jan-linux-x86_64-{version}.AppImage ``` -``` ## Uninstall Jan diff --git a/docs/docs/guides/02-installation/05-docker.md b/docs/docs/guides/02-installation/05-docker.md new file mode 100644 index 0000000000..6236ed92e4 --- /dev/null +++ b/docs/docs/guides/02-installation/05-docker.md @@ -0,0 +1,102 @@ +--- +title: Docker +slug: /install/docker +description: Jan is a ChatGPT-alternative that runs on your own computer, with a local API server. 
+keywords: + [ + Jan AI, + Jan, + ChatGPT alternative, + local AI, + private AI, + conversational AI, + no-subscription fee, + large language model, + docker installation, + ] +--- + +# Installing Jan using Docker + +## Installation + +### Pre-requisites + +:::note + +**Supported OS**: Linux, WSL2 Docker + +::: + +- Docker Engine and Docker Compose are required to run Jan in Docker mode. Follow the [instructions](https://docs.docker.com/engine/install/ubuntu/) below to get started with Docker Engine on Ubuntu. + +```bash +curl -fsSL https://get.docker.com -o get-docker.sh +sudo sh ./get-docker.sh --dry-run +``` + +- If you intend to run Jan in GPU mode, you need to install `nvidia-driver` and `nvidia-docker2`. Follow the instruction [here](https://docs.nvidia.com/datacenter/cloud-native/container-toolkit/latest/install-guide.html) for installation. + +### Instructions + +- Run Jan in Docker mode + + - **Option 1**: Run Jan in CPU mode + + ```bash + docker compose --profile cpu up -d + ``` + + - **Option 2**: Run Jan in GPU mode + + - **Step 1**: Check CUDA compatibility with your NVIDIA driver by running `nvidia-smi` and check the CUDA version in the output + + ```bash + nvidia-smi + + # Output + +---------------------------------------------------------------------------------------+ + | NVIDIA-SMI 531.18 Driver Version: 531.18 CUDA Version: 12.1 | + |-----------------------------------------+----------------------+----------------------+ + | GPU Name TCC/WDDM | Bus-Id Disp.A | Volatile Uncorr. ECC | + | Fan Temp Perf Pwr:Usage/Cap| Memory-Usage | GPU-Util Compute M. | + | | | MIG M. 
| + |=========================================+======================+======================| + | 0 NVIDIA GeForce RTX 4070 Ti WDDM | 00000000:01:00.0 On | N/A | + | 0% 44C P8 16W / 285W| 1481MiB / 12282MiB | 2% Default | + | | | N/A | + +-----------------------------------------+----------------------+----------------------+ + | 1 NVIDIA GeForce GTX 1660 Ti WDDM | 00000000:02:00.0 Off | N/A | + | 0% 49C P8 14W / 120W| 0MiB / 6144MiB | 0% Default | + | | | N/A | + +-----------------------------------------+----------------------+----------------------+ + | 2 NVIDIA GeForce GTX 1660 Ti WDDM | 00000000:05:00.0 Off | N/A | + | 29% 38C P8 11W / 120W| 0MiB / 6144MiB | 0% Default | + | | | N/A | + +-----------------------------------------+----------------------+----------------------+ + + +---------------------------------------------------------------------------------------+ + | Processes: | + | GPU GI CI PID Type Process name GPU Memory | + | ID ID Usage | + |=======================================================================================| + ``` + + - **Step 2**: Visit [NVIDIA NGC Catalog ](https://catalog.ngc.nvidia.com/orgs/nvidia/containers/cuda/tags) and find the smallest minor version of image tag that matches your CUDA version (e.g., 12.1 -> 12.1.0) + + - **Step 3**: Update the `Dockerfile.gpu` line number 5 with the latest minor version of the image tag from step 2 (e.g. change `FROM nvidia/cuda:12.2.0-runtime-ubuntu22.04 AS base` to `FROM nvidia/cuda:12.1.0-runtime-ubuntu22.04 AS base`) + + - **Step 4**: Run command to start Jan in GPU mode + + ```bash + # GPU mode + docker compose --profile gpu up -d + ``` + + This will start the web server and you can access Jan at `http://localhost:3000`. + +:::warning + +- Docker mode is currently only suitable for development and localhost. Production is not supported yet, and the RAG feature is not available in Docker mode. 
+ +::: diff --git a/docs/docs/guides/02-installation/05-nightly-build.md b/docs/docs/guides/02-installation/07-nightly-build.md similarity index 100% rename from docs/docs/guides/02-installation/05-nightly-build.md rename to docs/docs/guides/02-installation/07-nightly-build.md diff --git a/docs/docs/guides/02-installation/07-antivirus-compatibility-testing.md b/docs/docs/guides/02-installation/08-antivirus-compatibility-testing.md similarity index 100% rename from docs/docs/guides/02-installation/07-antivirus-compatibility-testing.md rename to docs/docs/guides/02-installation/08-antivirus-compatibility-testing.md diff --git a/docs/docs/guides/04-using-models/02-import-manually.mdx b/docs/docs/guides/04-using-models/02-import-manually.mdx index 68142a8af0..7c446ea1c9 100644 --- a/docs/docs/guides/04-using-models/02-import-manually.mdx +++ b/docs/docs/guides/04-using-models/02-import-manually.mdx @@ -29,6 +29,10 @@ In this section, we will show you how to import a GGUF model from [HuggingFace]( > We are fast shipping a UI to make this easier, but it's a bit manual for now. Apologies. +## Import Models Using Absolute Filepath (version 0.4.7) + +Starting from version 0.4.7, Jan has introduced the capability to import models using an absolute file path. It allows you to import models from any directory on your computer. Please check the [import models using absolute filepath](../import-models-using-absolute-filepath) guide for more information. + ## Manually Importing a Downloaded Model (nightly versions and v0.4.4+) ### 1. Create a Model Folder @@ -186,7 +190,6 @@ This means that you can easily reconfigure your models, export them, and share y Edit `model.json` and include the following configurations: -- Ensure the filename must be `model.json`. - Ensure the `id` property matches the folder name you created. - Ensure the GGUF filename should match the `id` property exactly. - Ensure the `source.url` property is the direct binary download link ending in `.gguf`. 
In HuggingFace, you can find the direct links in the `Files and versions` tab. diff --git a/docs/docs/guides/04-using-models/03-import-models-using-absolute-filepath.mdx b/docs/docs/guides/04-using-models/03-import-models-using-absolute-filepath.mdx new file mode 100644 index 0000000000..490f68cd67 --- /dev/null +++ b/docs/docs/guides/04-using-models/03-import-models-using-absolute-filepath.mdx @@ -0,0 +1,84 @@ +--- +title: Import Models Using Absolute Filepath +slug: /guides/using-models/import-models-using-absolute-filepath +description: Guide to import model using absolute filepath in Jan. +keywords: + [ + Jan AI, + Jan, + ChatGPT alternative, + local AI, + private AI, + conversational AI, + no-subscription fee, + large language model, + import-models-manually, + absolute-filepath, + ] +--- + +In this guide, we will walk you through the process of importing a model using an absolute filepath in Jan, using our latest model, [Trinity](https://huggingface.co/janhq/trinity-v1-GGUF), as an example. + +### 1. Get the Absolute Filepath of the Model + +After downloading .gguf model, you can get the absolute filepath of the model file. + +### 2. Configure the Model JSON + +1. Navigate to the `~/jan/models` folder. +2. Create a folder named ``, for example, `tinyllama`. +3. Create a `model.json` file inside the folder, including the following configurations: + +- Ensure the `id` property matches the folder name you created. +- Ensure the `url` property is the direct binary download link ending in `.gguf`. Now, you can use the absolute filepath of the model file. +- Ensure the `engine` property is set to `nitro`. + +```json +{ + "sources": [ + { + "filename": "tinyllama.gguf", + // highlight-next-line + "url": "" + } + ], + "id": "tinyllama-1.1b", + "object": "model", + "name": "(Absolute Path) TinyLlama Chat 1.1B Q4", + "version": "1.0", + "description": "TinyLlama is a tiny model with only 1.1B. 
It's a good model for less powerful computers.", + "format": "gguf", + "settings": { + "ctx_len": 4096, + "prompt_template": "<|system|>\n{system_message}<|user|>\n{prompt}<|assistant|>", + "llama_model_path": "tinyllama-1.1b-chat-v1.0.Q4_K_M.gguf" + }, + "parameters": { + "temperature": 0.7, + "top_p": 0.95, + "stream": true, + "max_tokens": 2048, + "stop": [], + "frequency_penalty": 0, + "presence_penalty": 0 + }, + "metadata": { + "author": "TinyLlama", + "tags": ["Tiny", "Foundation Model"], + "size": 669000000 + }, + "engine": "nitro" +} +``` + +:::warning + +- If you are using Windows, you need to use double backslashes in the url property, for example: `C:\\Users\\username\\filename.gguf`. + +::: + +### 3. Start the Model + +Restart Jan and navigate to the Hub. Locate your model and click the Use button. + +![Demo](assets/03-demo-absolute-filepath.gif) \ No newline at end of file diff --git a/docs/docs/guides/04-using-models/03-integrate-with-remote-server.mdx b/docs/docs/guides/04-using-models/04-integrate-with-remote-server.mdx similarity index 90% rename from docs/docs/guides/04-using-models/03-integrate-with-remote-server.mdx rename to docs/docs/guides/04-using-models/04-integrate-with-remote-server.mdx index 533797fcaa..3632a40b02 100644 --- a/docs/docs/guides/04-using-models/03-integrate-with-remote-server.mdx +++ b/docs/docs/guides/04-using-models/04-integrate-with-remote-server.mdx @@ -65,6 +65,13 @@ Navigate to the `~/jan/models` folder. Create a folder named `gpt-3.5-turbo-16k` } ``` +:::tip + +- You can find the list of available models in the [OpenAI Platform](https://platform.openai.com/docs/models/overview). +- Please note that the `id` property needs to match the model name in the list. For example, if you want to use the [GPT-4 Turbo](https://platform.openai.com/docs/models/gpt-4-and-gpt-4-turbo), you need to set the `id` property as `gpt-4-1106-preview`. + +::: + +### 2.
Configure OpenAI API Keys You can find your API keys in the [OpenAI Platform](https://platform.openai.com/api-keys) and set the OpenAI API keys in `~/jan/engines/openai.json` file. @@ -81,7 +88,7 @@ You can find your API keys in the [OpenAI Platform](https://platform.openai.com/ Restart Jan and navigate to the Hub. Then, select your configured model and start the model. -![image-01](assets/03-openai-platform-configuration.png) +![image-01](assets/04-openai-platform-configuration.png) ## Engines with OAI Compatible Configuration @@ -152,7 +159,7 @@ Navigate to the `~/jan/models` folder. Create a folder named `mistral-ins-7b-q4` Restart Jan and navigate to the Hub. Locate your model and click the Use button. -![image-02](assets/03-oai-compatible-configuration.png) +![image-02](assets/04-oai-compatible-configuration.png) ## Assistance and Support diff --git a/docs/docs/guides/04-using-models/04-customize-engine-settings.mdx b/docs/docs/guides/04-using-models/05-customize-engine-settings.mdx similarity index 100% rename from docs/docs/guides/04-using-models/04-customize-engine-settings.mdx rename to docs/docs/guides/04-using-models/05-customize-engine-settings.mdx diff --git a/docs/docs/guides/04-using-models/assets/03-demo-absolute-filepath.gif b/docs/docs/guides/04-using-models/assets/03-demo-absolute-filepath.gif new file mode 100644 index 0000000000..24dcc251a7 Binary files /dev/null and b/docs/docs/guides/04-using-models/assets/03-demo-absolute-filepath.gif differ diff --git a/docs/docs/guides/04-using-models/assets/03-oai-compatible-configuration.png b/docs/docs/guides/04-using-models/assets/04-oai-compatible-configuration.png similarity index 100% rename from docs/docs/guides/04-using-models/assets/03-oai-compatible-configuration.png rename to docs/docs/guides/04-using-models/assets/04-oai-compatible-configuration.png diff --git a/docs/docs/guides/04-using-models/assets/03-openai-platform-configuration.png 
b/docs/docs/guides/04-using-models/assets/04-openai-platform-configuration.png similarity index 100% rename from docs/docs/guides/04-using-models/assets/03-openai-platform-configuration.png rename to docs/docs/guides/04-using-models/assets/04-openai-platform-configuration.png diff --git a/docs/docs/guides/05-using-server/01-server.md b/docs/docs/guides/05-using-server/01-server.md deleted file mode 100644 index 952b7399fa..0000000000 --- a/docs/docs/guides/05-using-server/01-server.md +++ /dev/null @@ -1,33 +0,0 @@ ---- -title: Connect to Server -description: Connect to Jan's built-in API server. -keywords: - [ - Jan AI, - Jan, - ChatGPT alternative, - local AI, - private AI, - conversational AI, - no-subscription fee, - large language model, - ] ---- - -:::warning - -This page is under construction. - -::: - -Jan ships with a built-in API server, that can be used as a drop-in, local replacement for OpenAI's API. - -Jan runs on port `1337` by default, but this can (soon) be changed in Settings. - -1. Go to Settings > Advanced > Enable API Server - -2. Go to http://localhost:1337 for the API docs. - -3. In terminal, simply CURL... - -Note: Some UI states may be broken when in Server Mode. diff --git a/docs/docs/guides/05-using-server/01-start-server.md b/docs/docs/guides/05-using-server/01-start-server.md new file mode 100644 index 0000000000..2433fd80a1 --- /dev/null +++ b/docs/docs/guides/05-using-server/01-start-server.md @@ -0,0 +1,72 @@ +--- +title: Start Local Server +slug: /guides/using-server/start-server +description: How to run Jan's built-in API server. +keywords: + [ + Jan AI, + Jan, + ChatGPT alternative, + local AI, + private AI, + conversational AI, + no-subscription fee, + large language model, + local server, + api server, + ] +--- + +Jan ships with a built-in API server that can be used as a drop-in, local replacement for OpenAI's API. You can run your server by following these simple steps. 
+ +## Open Local API Server View + +Navigate to the Local API Server view by clicking the corresponding icon on the left side of the screen. + +

+ +![01-local-api-view](./assets/01-local-api-view.gif) + +## Choosing a Model + +On the top right of your screen under `Model Settings`, set the LLM that your local server will be running. You can choose from any of the models already installed, or pick a new model by clicking `Explore the Hub`. + +

+ +![01-choose-model](./assets/01-choose-model.png) + +## Server Options + +On the left side of your screen, you can set custom server options. + +

+ +![01-server-settings](./assets/01-server-options.png) + +### Local Server Address + +By default, Jan will be accessible only on localhost `127.0.0.1`. This means a local server can only be accessed on the same machine where the server is being run. + +You can make the local server more accessible by clicking on the address and choosing `0.0.0.0` instead, which allows the server to be accessed from other devices on the local network. This is less secure than choosing localhost, and should be done with caution. + +### Port + +Jan runs on port `1337` by default. You can change the port to any other port number if needed. + +### Cross-Origin Resource Sharing (CORS) + +Cross-Origin Resource Sharing (CORS) manages resource access on the local server from external domains. Enabled for security by default, it can be disabled if needed. + +### Verbose Server Logs + +The center of the screen displays the server logs as the local server runs. This option provides extensive details about server activities. + +## Start Server + +Click the `Start Server` button on the top left of your screen. You will see the server log display a message such as `Server listening at http://127.0.0.1:1337`, and the `Start Server` button will change to a red `Stop Server` button. + +

+ +![01-running-server](./assets/01-running-server.gif) + +Your server is now running and you can use the server address and port to make requests to the local server. diff --git a/docs/docs/guides/05-using-server/02-using-server.md b/docs/docs/guides/05-using-server/02-using-server.md new file mode 100644 index 0000000000..3d4b004a1f --- /dev/null +++ b/docs/docs/guides/05-using-server/02-using-server.md @@ -0,0 +1,102 @@ +--- +title: Using Jan's Built-in API Server +description: How to use Jan's built-in API server. +keywords: + [ + Jan AI, + Jan, + ChatGPT alternative, + local AI, + private AI, + conversational AI, + no-subscription fee, + large language model, + local server, + api server, + ] +--- + +Jan's built-in API server is compatible with [OpenAI's API](https://platform.openai.com/docs/api-reference) and can be used as a drop-in, local replacement. Follow these steps to use the API server. + +## Open the API Reference + +Jan contains a comprehensive API reference. This reference displays all the API endpoints available, gives you example requests and responses, and allows you to execute them in the browser. + +On the top left of your screen below the red `Stop Server` button is the blue `API Reference`. Clicking this will open the reference in your browser. + +

+ +![02-api-reference](./assets/02-api-reference.png) + +Scroll through the various available endpoints to learn what options are available and try them out by executing the example requests. In addition, you can also use the [Jan API Reference](https://jan.ai/api-reference/) on the Jan website. + +### Chat + +In the Chat section of the API reference, you will see an example JSON request body. + +

+ +![02-chat-example](./assets/02-chat-example.png) + +With your local server running, you can click the `Try it out` button on the top left, then the blue `Execute` button below the JSON. The browser will send the example request to your server, and display the response body below. + +Use the API endpoints, request and response body examples as models for your own application. + +### cURL Request Example + +Here is an example curl request with a local server running `tinyllama-1.1b`: + +

+ +```json +{ + "messages": [ + { + "content": "You are a helpful assistant.", + "role": "system" + }, + { + "content": "Hello!", + "role": "user" + } + ], + "model": "tinyllama-1.1b", + "stream": true, + "max_tokens": 2048, + "stop": [ + "hello" + ], + "frequency_penalty": 0, + "presence_penalty": 0, + "temperature": 0.7, + "top_p": 0.95 +} +' +``` + +### Response Body Example + +```json +{ + "choices": [ + { + "finish_reason": null, + "index": 0, + "message": { + "content": "Hello user. What can I help you with?", + "role": "assistant" + } + } + ], + "created": 1700193928, + "id": "ebwd2niJvJB1Q2Whyvkz", + "model": "_", + "object": "chat.completion", + "system_fingerprint": "_", + "usage": { + "completion_tokens": 500, + "prompt_tokens": 33, + "total_tokens": 533 + } +} +``` diff --git a/docs/docs/guides/05-using-server/assets/01-choose-model.png b/docs/docs/guides/05-using-server/assets/01-choose-model.png new file mode 100644 index 0000000000..9062a1e951 Binary files /dev/null and b/docs/docs/guides/05-using-server/assets/01-choose-model.png differ diff --git a/docs/docs/guides/05-using-server/assets/01-local-api-view.gif b/docs/docs/guides/05-using-server/assets/01-local-api-view.gif new file mode 100644 index 0000000000..cb221fce45 Binary files /dev/null and b/docs/docs/guides/05-using-server/assets/01-local-api-view.gif differ diff --git a/docs/docs/guides/05-using-server/assets/01-running-server.gif b/docs/docs/guides/05-using-server/assets/01-running-server.gif new file mode 100644 index 0000000000..a4225f3cb0 Binary files /dev/null and b/docs/docs/guides/05-using-server/assets/01-running-server.gif differ diff --git a/docs/docs/guides/05-using-server/assets/01-server-options.png b/docs/docs/guides/05-using-server/assets/01-server-options.png new file mode 100644 index 0000000000..c48844e405 Binary files /dev/null and b/docs/docs/guides/05-using-server/assets/01-server-options.png differ diff --git 
a/docs/docs/guides/05-using-server/assets/02-api-reference.png b/docs/docs/guides/05-using-server/assets/02-api-reference.png new file mode 100644 index 0000000000..154d9dfc90 Binary files /dev/null and b/docs/docs/guides/05-using-server/assets/02-api-reference.png differ diff --git a/docs/docs/guides/05-using-server/assets/02-chat-example.png b/docs/docs/guides/05-using-server/assets/02-chat-example.png new file mode 100644 index 0000000000..bd7e33a6ae Binary files /dev/null and b/docs/docs/guides/05-using-server/assets/02-chat-example.png differ diff --git a/docs/docs/guides/07-integrations/01-integrate-continue.mdx b/docs/docs/guides/07-integrations/01-integrate-continue.mdx index 3a0e9f282b..1fa0397e29 100644 --- a/docs/docs/guides/07-integrations/01-integrate-continue.mdx +++ b/docs/docs/guides/07-integrations/01-integrate-continue.mdx @@ -35,7 +35,7 @@ To get started with Continue in VS Code, please follow this [guide to install Co ### 2. Enable Jan API Server -To configure the Continue to use Jan's Local Server, you need to enable Jan API Server with your preferred model, please follow this [guide to enable Jan API Server](../05-using-server/01-server.md) +To configure the Continue to use Jan's Local Server, you need to enable Jan API Server with your preferred model, please follow this [guide to enable Jan API Server](/guides/using-server/start-server). ### 3. Configure Continue to Use Jan's Local Server @@ -77,7 +77,7 @@ Edit the `config.json` file and include the following configuration. // highlight-start "model": "mistral-ins-7b-q4", "apiKey": "EMPTY", - "apiBase": "http://localhost:1337" + "apiBase": "http://localhost:1337/v1" // highlight-end } ] @@ -86,7 +86,7 @@ Edit the `config.json` file and include the following configuration. - Ensure that the `provider` is `openai`. - Ensure that the `model` is the same as the one you enabled in the Jan API Server. -- Ensure that the `apiBase` is `http://localhost:1337`. 
+- Ensure that the `apiBase` is `http://localhost:1337/v1`. - Ensure that the `apiKey` is `EMPTY`. ### 4. Ensure the Using Model Is Activated in Jan diff --git a/docs/docs/guides/07-integrations/04-integrate-mistral-ai.mdx b/docs/docs/guides/07-integrations/04-integrate-mistral-ai.mdx new file mode 100644 index 0000000000..14ddeaa750 --- /dev/null +++ b/docs/docs/guides/07-integrations/04-integrate-mistral-ai.mdx @@ -0,0 +1,89 @@ +--- +title: Integrate Mistral AI with Jan +slug: /guides/integrations/mistral-ai +description: Guide to integrate Mistral AI with Jan +keywords: + [ + Jan AI, + Jan, + ChatGPT alternative, + local AI, + private AI, + conversational AI, + no-subscription fee, + large language model, + Mistral integration, + ] +--- + +## Quick Introduction + +[Mistral AI](https://docs.mistral.ai/) currently provides two ways of accessing their Large Language Models (LLM) - via their API or via open source models available on Hugging Face. In this guide, we will show you how to integrate Mistral AI with Jan using the API method. + +## Steps to Integrate Mistral AI with Jan + +### 1. Configure Mistral API key + +You can find your API keys in the [Mistral API Key](https://console.mistral.ai/user/api-keys/) and set the Mistral AI API key in `~/jan/engines/openai.json` file. + +```json title="~/jan/engines/openai.json" +{ + // highlight-start + "full_url": "https://api.mistral.ai/v1/chat/completions", + "api_key": "" + // highlight-end +} +``` + +### 2. Modify a Model JSON + +Navigate to the `~/jan/models` folder. Create a folder named ``, for example, `mistral-tiny` and create a `model.json` file inside the folder including the following configurations: + +- Ensure the filename must be `model.json`. +- Ensure the `id` property is set to the model id from Mistral AI. +- Ensure the `format` property is set to `api`. +- Ensure the `engine` property is set to `openai`. +- Ensure the `state` property is set to `ready`. 
+ +```json title="~/jan/models/mistral-tiny/model.json" +{ + "sources": [ + { + "filename": "mistral-tiny", + "url": "https://mistral.ai/" + } + ], + "id": "mistral-tiny", + "object": "model", + "name": "Mistral-7B-v0.2 (Tiny Endpoint)", + "version": "1.0", + "description": "Currently powered by Mistral-7B-v0.2, a better fine-tuning of the initial Mistral-7B released, inspired by the fantastic work of the community.", + // highlight-next-line + "format": "api", + "settings": {}, + "parameters": {}, + "metadata": { + "author": "Mistral AI", + "tags": ["General", "Big Context Length"] + }, + // highlight-start + "engine": "openai" + // highlight-end +} +``` + +:::tip + +Mistral AI provides different endpoints. Please check out their [endpoint documentation](https://docs.mistral.ai/platform/endpoints/) to find the one that suits your needs. In this example, we will use the `mistral-tiny` model. + +::: + +### 3. Start the Model + +Restart Jan and navigate to the Hub. Locate your model and click the Use button. + +![Mitral AI Tiny Model](assets/04-mistral-ai-tiny-hub.png) + +### 4. Try Out the Integration of Jan and Mistral AI + +![Mistral AI Integration Demo](assets/04-mistral-ai-integration-demo.gif) diff --git a/docs/docs/guides/07-integrations/05-integrate-lmstudio.mdx b/docs/docs/guides/07-integrations/05-integrate-lmstudio.mdx new file mode 100644 index 0000000000..58e2f0be97 --- /dev/null +++ b/docs/docs/guides/07-integrations/05-integrate-lmstudio.mdx @@ -0,0 +1,184 @@ +--- +title: Integrate LM Studio with Jan +slug: /guides/integrations/lmstudio +description: Guide to integrate LM Studio with Jan +keywords: + [ + Jan AI, + Jan, + ChatGPT alternative, + local AI, + private AI, + conversational AI, + no-subscription fee, + large language model, + LM Studio integration, + ] +--- + +## Quick Introduction + +With [LM Studio](https://lmstudio.ai/), you can discover, download, and run local Large Language Models (LLMs). 
In this guide, we will show you how to integrate and use your current models on LM Studio with Jan using 2 methods. The first method is integrating LM Studio server with Jan UI. The second method is migrating your downloaded model from LM Studio to Jan. We will use the [Phi 2 - GGUF](https://huggingface.co/TheBloke/phi-2-GGUF) model on Hugging Face as an example. + +## Steps to Integrate LM Studio Server with Jan UI + +### 1. Start the LM Studio Server + +1. Navigate to the `Local Inference Server` on the LM Studio application. +2. Select the model you want to use. +3. Start the server after configuring the server port and options. + +![LM Studio Server](assets/05-setting-lmstudio-server.gif) + +

+ +Modify the `openai.json` file in the `~/jan/engines` folder to include the full URL of the LM Studio server. + +```json title="~/jan/engines/openai.json" +{ + "full_url": "http://localhost:/v1/chat/completions" +} +``` + +:::tip + +- Replace `` with the port number you set in the LM Studio server. The default port is `1234`. + +::: + +### 2. Modify a Model JSON + +Navigate to the `~/jan/models` folder. Create a folder named ``, for example, `lmstudio-phi-2` and create a `model.json` file inside the folder including the following configurations: + +- Set the `format` property to `api`. +- Set the `engine` property to `openai`. +- Set the `state` property to `ready`. + +```json title="~/jan/models/lmstudio-phi-2/model.json" +{ + "sources": [ + { + "filename": "phi-2-GGUF", + "url": "https://huggingface.co/TheBloke/phi-2-GGUF" + } + ], + "id": "lmstudio-phi-2", + "object": "model", + "name": "LM Studio - Phi 2 - GGUF", + "version": "1.0", + "description": "TheBloke/phi-2-GGUF", + // highlight-next-line + "format": "api", + "settings": {}, + "parameters": {}, + "metadata": { + "author": "Microsoft", + "tags": ["General", "Big Context Length"] + }, + // highlight-start + "engine": "openai" + // highlight-end +} +``` + +### 3. Start the Model + +1. Restart Jan and navigate to the **Hub**. +2. Locate your model and click the **Use** button. + +![LM Studio Model](assets/05-lmstudio-run.png) + +### 4. Try Out the Integration of Jan and LM Studio + +![LM Studio Integration Demo](assets/05-lmstudio-integration-demo.gif) + +## Steps to Migrate Your Downloaded Model from LM Studio to Jan (version 0.4.6 and older) + +### 1. Migrate Your Downloaded Model + +1. Navigate to `My Models` in the LM Studio application and reveal the model folder. + +![Reveal-model-folder-lmstudio](assets/05-reveal-model-folder-lmstudio.gif) + +2. Copy the model folder that you want to migrate to `~/jan/models` folder. + +3. 
Ensure the folder name property is the same as the model name of the `.gguf` file by changing the folder name if necessary. For example, in this case, we changed the folder name from `TheBloke` to `phi-2.Q4_K_S`. + +### 2. Start the Model + +1. Restart Jan and navigate to the **Hub**. Jan will automatically detect the model and display it in the **Hub**. +2. Locate your model and click the **Use** button to try the migrated model. + +![Demo](assets/05-demo-migrating-model.gif) + +## Steps to Point to the Downloaded Model of LM Studio from Jan (version 0.4.7+) + +Starting from version 0.4.7, Jan supports importing models using an absolute filepath, so you can directly use the model from the LM Studio folder. + +### 1. Reveal the Model Absolute Path + +Navigate to `My Models` in the LM Studio application and reveal the model folder. Then, you can get the absolute path of your model. + +![Reveal-model-folder-lmstudio](assets/05-reveal-model-folder-lmstudio.gif) + +### 2. Modify a Model JSON + +Navigate to the `~/jan/models` folder. Create a folder named ``, for example, `phi-2.Q4_K_S` and create a `model.json` file inside the folder including the following configurations: + +- Ensure the `id` property matches the folder name you created. + +- Ensure the `url` property is the direct binary download link ending in `.gguf`. Now, you can use the absolute filepath of the model file. In this example, the absolute filepath is `/Users//.cache/lm-studio/models/TheBloke/phi-2-GGUF/phi-2.Q4_K_S.gguf`. +- Ensure the `engine` property is set to `nitro`.
+ +```json +{ + "object": "model", + "version": 1, + "format": "gguf", + "sources": [ + { + "filename": "phi-2.Q4_K_S.gguf", + "url": "" + } + ], + "id": "phi-2.Q4_K_S", + "name": "phi-2.Q4_K_S", + "created": 1708308111506, + "description": "phi-2.Q4_K_S - user self import model", + "settings": { + "ctx_len": 4096, + "embedding": false, + "prompt_template": "{system_message}\n### Instruction: {prompt}\n### Response:", + "llama_model_path": "phi-2.Q4_K_S.gguf" + }, + "parameters": { + "temperature": 0.7, + "top_p": 0.95, + "stream": true, + "max_tokens": 2048, + "stop": [""], + "frequency_penalty": 0, + "presence_penalty": 0 + }, + "metadata": { + "size": 1615568736, + "author": "User", + "tags": [] + }, + "engine": "nitro" +} +``` + +:::warning + +- If you are using Windows, you need to use double backslashes in the url property, for example: `C:\\Users\\username\\filename.gguf`. + +::: + + +### 3. Start the Model + +1. Restart Jan and navigate to the **Hub**. +2. Jan will automatically detect the model and display it in the **Hub**. +3. Locate your model and click the **Use** button to try the migrating model. + +![Demo](assets/05-demo-pointing-model.gif) diff --git a/docs/docs/guides/07-integrations/06-integrate-ollama.mdx b/docs/docs/guides/07-integrations/06-integrate-ollama.mdx new file mode 100644 index 0000000000..e55c3e49f7 --- /dev/null +++ b/docs/docs/guides/07-integrations/06-integrate-ollama.mdx @@ -0,0 +1,90 @@ +--- +title: Integrate Ollama with Jan +slug: /guides/integrations/ollama +description: Guide to integrate Ollama with Jan +keywords: + [ + Jan AI, + Jan, + ChatGPT alternative, + local AI, + private AI, + conversational AI, + no-subscription fee, + large language model, + Ollama integration, + ] +--- + +## Quick Introduction + +With [Ollama](https://ollama.com/), you can run large language models locally. In this guide, we will show you how to integrate and use your current models on Ollama with Jan using 2 methods. 
The first method is integrating the Ollama server with the Jan UI. The second method is migrating your downloaded model from Ollama to Jan. We will use the [llama2](https://ollama.com/library/llama2) model as an example. + +## Steps to Integrate Ollama Server with Jan UI + +### 1. Start the Ollama Server + +1. Select the model you want to use from the [Ollama library](https://ollama.com/library). +2. Run your model by using the following command: + +```bash +ollama run +``` + +3. According to the [Ollama documentation on OpenAI compatibility](https://github.com/ollama/ollama/blob/main/docs/openai.md), you can use the `http://localhost:11434/v1/chat/completions` endpoint to interact with the Ollama server. Thus, modify the `openai.json` file in the `~/jan/engines` folder to include the full URL of the Ollama server. + +```json title="~/jan/engines/openai.json" +{ + "full_url": "http://localhost:11434/v1/chat/completions" +} +``` + +### 2. Modify a Model JSON + +1. Navigate to the `~/jan/models` folder. +2. Create a folder named ``, for example, `llama2`. +3. Create a `model.json` file inside the folder including the following configurations: + +- Set the `id` property to the Ollama model name. +- Set the `format` property to `api`. +- Set the `engine` property to `openai`. +- Set the `state` property to `ready`. + +```json title="~/jan/models/llama2/model.json" +{ + "sources": [ + { + "filename": "llama2", + "url": "https://ollama.com/library/llama2" + } + ], + // highlight-next-line + "id": "llama2", + "object": "model", + "name": "Ollama - Llama2", + "version": "1.0", + "description": "Llama 2 is a collection of foundation language models ranging from 7B to 70B parameters.", + // highlight-next-line + "format": "api", + "settings": {}, + "parameters": {}, + "metadata": { + "author": "Meta", + "tags": ["General", "Big Context Length"] + }, + // highlight-next-line + "engine": "openai" +} +``` + +### 3. Start the Model + +1.
Restart Jan and navigate to the **Hub**. +2. Locate your model and click the **Use** button. + +![Ollama Model](assets/06-ollama-run.png) + +### 4. Try Out the Integration of Jan and Ollama + +![Ollama Integration Demo](assets/06-ollama-integration-demo.gif) + diff --git a/docs/docs/guides/07-integrations/assets/04-mistral-ai-integration-demo.gif b/docs/docs/guides/07-integrations/assets/04-mistral-ai-integration-demo.gif new file mode 100644 index 0000000000..015167e2ab Binary files /dev/null and b/docs/docs/guides/07-integrations/assets/04-mistral-ai-integration-demo.gif differ diff --git a/docs/docs/guides/07-integrations/assets/04-mistral-ai-tiny-hub.png b/docs/docs/guides/07-integrations/assets/04-mistral-ai-tiny-hub.png new file mode 100644 index 0000000000..1ae377d709 Binary files /dev/null and b/docs/docs/guides/07-integrations/assets/04-mistral-ai-tiny-hub.png differ diff --git a/docs/docs/guides/07-integrations/assets/05-demo-migrating-model.gif b/docs/docs/guides/07-integrations/assets/05-demo-migrating-model.gif new file mode 100644 index 0000000000..985755e47c Binary files /dev/null and b/docs/docs/guides/07-integrations/assets/05-demo-migrating-model.gif differ diff --git a/docs/docs/guides/07-integrations/assets/05-demo-pointing-model.gif b/docs/docs/guides/07-integrations/assets/05-demo-pointing-model.gif new file mode 100644 index 0000000000..137fb955ac Binary files /dev/null and b/docs/docs/guides/07-integrations/assets/05-demo-pointing-model.gif differ diff --git a/docs/docs/guides/07-integrations/assets/05-lmstudio-integration-demo.gif b/docs/docs/guides/07-integrations/assets/05-lmstudio-integration-demo.gif new file mode 100644 index 0000000000..445ea3416a Binary files /dev/null and b/docs/docs/guides/07-integrations/assets/05-lmstudio-integration-demo.gif differ diff --git a/docs/docs/guides/07-integrations/assets/05-lmstudio-run.png b/docs/docs/guides/07-integrations/assets/05-lmstudio-run.png new file mode 100644 index 
0000000000..721581f72e Binary files /dev/null and b/docs/docs/guides/07-integrations/assets/05-lmstudio-run.png differ diff --git a/docs/docs/guides/07-integrations/assets/05-reveal-model-folder-lmstudio.gif b/docs/docs/guides/07-integrations/assets/05-reveal-model-folder-lmstudio.gif new file mode 100644 index 0000000000..4c1ee85fc3 Binary files /dev/null and b/docs/docs/guides/07-integrations/assets/05-reveal-model-folder-lmstudio.gif differ diff --git a/docs/docs/guides/07-integrations/assets/05-setting-lmstudio-server.gif b/docs/docs/guides/07-integrations/assets/05-setting-lmstudio-server.gif new file mode 100644 index 0000000000..63084be01d Binary files /dev/null and b/docs/docs/guides/07-integrations/assets/05-setting-lmstudio-server.gif differ diff --git a/docs/docs/guides/07-integrations/assets/06-ollama-integration-demo.gif b/docs/docs/guides/07-integrations/assets/06-ollama-integration-demo.gif new file mode 100644 index 0000000000..708f2058a7 Binary files /dev/null and b/docs/docs/guides/07-integrations/assets/06-ollama-integration-demo.gif differ diff --git a/docs/docs/guides/07-integrations/assets/06-ollama-run.png b/docs/docs/guides/07-integrations/assets/06-ollama-run.png new file mode 100644 index 0000000000..7f18e1b15b Binary files /dev/null and b/docs/docs/guides/07-integrations/assets/06-ollama-run.png differ diff --git a/docs/docs/guides/08-troubleshooting/02-somethings-amiss.mdx b/docs/docs/guides/08-troubleshooting/02-somethings-amiss.mdx index a5669e36dd..4e16e362a5 100644 --- a/docs/docs/guides/08-troubleshooting/02-somethings-amiss.mdx +++ b/docs/docs/guides/08-troubleshooting/02-somethings-amiss.mdx @@ -45,7 +45,9 @@ This may occur due to several reasons. Please follow these steps to resolve it: 5. If you are on Nvidia GPUs, please download [Cuda](https://developer.nvidia.com/cuda-downloads). -6. 
When [checking app logs](https://jan.ai/troubleshooting/how-to-get-error-logs/), if you encounter the error log `Bind address failed at 127.0.0.1:3928`, it indicates that the port used by Nitro might already be in use. Use the following commands to check the port status: +6. If you're using Linux, please ensure that your system meets the following requirements: gcc 11, g++ 11, cpp 11, or higher; refer to this [link](https://jan.ai/guides/troubleshooting/gpu-not-used/#specific-requirements-for-linux) for more information. + +7. When [checking app logs](https://jan.ai/troubleshooting/how-to-get-error-logs/), if you encounter the error log `Bind address failed at 127.0.0.1:3928`, it indicates that the port used by Nitro might already be in use. Use the following commands to check the port status: diff --git a/docs/docs/guides/08-troubleshooting/03-gpu-not-used.mdx b/docs/docs/guides/08-troubleshooting/03-gpu-not-used.mdx index d35993ab6a..53638027b0 100644 --- a/docs/docs/guides/08-troubleshooting/03-gpu-not-used.mdx +++ b/docs/docs/guides/08-troubleshooting/03-gpu-not-used.mdx @@ -188,4 +188,6 @@ Troubleshooting tips: 2. If the issue persists, ensure your (V)RAM is accessible by the application. Some folks have virtual RAM and need additional configuration. -3. Get help in [Jan Discord](https://discord.gg/mY69SZaMaC). +3. If you are facing installation issues on RTX GPUs, please update to an NVIDIA driver that supports CUDA 11.7 or higher. Ensure that the CUDA path is added to the environment variable. + +4. Get help in [Jan Discord](https://discord.gg/mY69SZaMaC). diff --git a/docs/docs/guides/08-troubleshooting/06-unexpected-token.mdx b/docs/docs/guides/08-troubleshooting/06-unexpected-token.mdx index 973001f1b0..1de609ffa4 100644 --- a/docs/docs/guides/08-troubleshooting/06-unexpected-token.mdx +++ b/docs/docs/guides/08-troubleshooting/06-unexpected-token.mdx @@ -17,4 +17,8 @@ keywords: ] --- -1.
You may receive an error response `Error occurred: Unexpected token '<', "/nitro` and run the nitro manually and see if you get any error messages. +3. Resolve the error messages you get from the nitro and see if the issue persists. +4. Reopen the Jan app and see if the issue is resolved. +5. If the issue persists, please share with us the [app logs](https://jan.ai/troubleshooting/how-to-get-error-logs/) via [Jan Discord](https://discord.gg/mY69SZaMaC). diff --git a/docs/docs/guides/09-advanced-settings/01-https-proxy.mdx b/docs/docs/guides/09-advanced-settings/01-https-proxy.mdx new file mode 100644 index 0000000000..35f4c30f90 --- /dev/null +++ b/docs/docs/guides/09-advanced-settings/01-https-proxy.mdx @@ -0,0 +1,101 @@ +--- +title: HTTPS Proxy +slug: /guides/advanced-settings/https-proxy +description: Jan is a ChatGPT-alternative that runs on your own computer, with a local API server. +keywords: + [ + Jan AI, + Jan, + ChatGPT alternative, + local AI, + private AI, + conversational AI, + no-subscription fee, + large language model, + advanced-settings, + https-proxy, + ] +--- + +In this guide, we will show you how to set up your own HTTPS proxy server and configure Jan to use it. + +## Why HTTPS Proxy? +An HTTPS proxy helps you to maintain your privacy and security while still being able to browse the internet while circumventing geographical restrictions. + +## Setting Up Your Own HTTPS Proxy Server +In this section, we will show you a high-level overview of how to set up your own HTTPS proxy server. This guide focuses on using Squid as a popular and open-source proxy server software, but there are other software options you might consider based on your needs and preferences. + +### Step 1: Choosing a Server +Firstly, you need to choose a server to host your proxy server. We recommend using a cloud provider like Amazon AWS, Google Cloud, Microsoft Azure, Digital Ocean, etc. Ensure that your server has a public IP address and is accessible from the internet.
+ +### Step 2: Installing Squid +```bash +sudo apt-get update +sudo apt-get install squid +``` + +### Step 3: Configure Squid for HTTPS + +To enable HTTPS, you will need to configure Squid with SSL support. + +- Generate SSL certificate + +Squid requires an SSL certificate to be able to handle HTTPS traffic. You can generate a self-signed certificate or obtain one from a Certificate Authority (CA). For a self-signed certificate, you can use OpenSSL: + +```bash +openssl req -new -newkey rsa:2048 -days 365 -nodes -x509 -keyout squid-proxy.pem -out squid-proxy.pem +``` + +- Configure Squid to use the SSL certificate: Edit the Squid configuration file `/etc/squid/squid.conf` to include the path to your SSL certificate and enable the HTTPS port: + +```bash +http_port 3128 ssl-bump cert=/path/to/your/squid-proxy.pem +ssl_bump server-first all +ssl_bump bump all +``` + +- Enable SSL Bumping: To intercept HTTPS traffic, Squid uses a process called SSL Bumping. This process allows Squid to decrypt and re-encrypt HTTPS traffic. To enable SSL Bumping, ensure the `ssl_bump` directives are configured correctly in your `squid.conf` file. + +### Step 4 (Optional): Configure ACLs and Authentication + +- Access Control Lists (ACLs): You can define rules to control who can access your proxy. This is done by editing the squid.conf file and defining ACLs: + +```bash +acl allowed_ips src "/etc/squid/allowed_ips.txt" +http_access allow allowed_ips +``` + +- Authentication: If you want to add an authentication layer, Squid supports several authentication schemes. 
Basic authentication setup might look like this: + +```bash +auth_param basic program /usr/lib/squid/basic_ncsa_auth /etc/squid/passwords +acl authenticated proxy_auth REQUIRED +http_access allow authenticated +``` + +### Step 5: Restart and Test Your Proxy + +After configuring, restart Squid to apply the changes: + +```bash +sudo systemctl restart squid +``` + +To test, configure your browser or another client to use the proxy server with its IP address and port (default is 3128). Check if you can access the internet through your proxy. + +:::tip + +Tips for Securing Your Proxy: +- Firewall rules: Ensure that only intended users or IP addresses can connect to your proxy server. This can be achieved by setting up appropriate firewall rules. +- Regular updates: Keep your server and proxy software updated to ensure that you are protected against known vulnerabilities. +- Monitoring and logging: Monitor your proxy server for unusual activity and enable logging to keep track of the traffic passing through your proxy. + +::: + +## Setting Up Jan to Use Your HTTPS Proxy + +Once you have your HTTPS proxy server set up, you can configure Jan to use it. Navigate to `Settings` > `Advanced Settings` and specify the HTTPS proxy (proxy auto-configuration and SOCKS not supported). + +You can turn on the feature `Ignore SSL Certificates` if you are using a self-signed certificate. This feature allows self-signed or unverified certificates. + +![01-https-proxy-jan-configure](./assets/01-https-proxy-jan-configure.png) \ No newline at end of file diff --git a/docs/docs/guides/09-advanced-settings/README.mdx b/docs/docs/guides/09-advanced-settings/README.mdx new file mode 100644 index 0000000000..ba3da9bb18 --- /dev/null +++ b/docs/docs/guides/09-advanced-settings/README.mdx @@ -0,0 +1,65 @@ +--- +title: Advanced Settings +slug: /guides/advanced-settings/ +description: Jan is a ChatGPT-alternative that runs on your own computer, with a local API server.
+keywords: + [ + Jan AI, + Jan, + ChatGPT alternative, + local AI, + private AI, + conversational AI, + no-subscription fee, + large language model, + advanced-settings, + ] +--- + +This guide will show you how to use the advanced settings in Jan. + +## Keyboard Shortcuts + +Keyboard shortcuts are a great way to speed up your workflow. Here are some of the keyboard shortcuts that you can use in Jan. + +| Combination | Description | +| --------------- | -------------------------------------------------- | +| `⌘ E` | Show list your models | +| `⌘ K` | Show list navigation pages | +| `⌘ B` | Toggle collapsible left panel | +| `⌘ ,` | Navigate to setting page | +| `Enter` | Send a message | +| `Shift + Enter` | Insert new line in input box | +| `Arrow Up` | Navigate to previous option (within search dialog) | +| `Arrow Down` | Navigate to next option (within search dialog) | + +

+ +:::note +`⌘` is the command key on macOS, and `Ctrl` on Windows. +::: + +## Experimental Mode + +Experimental mode allows you to enable experimental features that may be unstable or not fully tested. + +## Jan Data Folder + +The Jan data folder is the location where messages, model configurations, and other user data are stored. You can move the data folder to a different location. + +![00-changing-folder](./assets/00-changing-folder.gif) + +## HTTPS Proxy & Ignore SSL Certificate + +HTTPS Proxy allows you to use a proxy server to connect to the internet. You can also ignore SSL certificates if you are using a self-signed certificate. +Please check out the guide on [how to set up your own HTTPS proxy server and configure Jan to use it](../advanced-settings/https-proxy) for more information. + +## Clear Logs + +Clear logs will remove all logs from the Jan application. + +## Reset To Factory Default + +Reset the application to its original state, deleting all your usage data, including model customizations and conversation history. This action is irreversible and recommended only if the application is in a corrupted state.
+ +![00-reset-factory-settings](./assets/00-reset-factory-settings.gif) diff --git a/docs/docs/guides/09-advanced-settings/assets/00-changing-folder.gif b/docs/docs/guides/09-advanced-settings/assets/00-changing-folder.gif new file mode 100644 index 0000000000..ac280a5c34 Binary files /dev/null and b/docs/docs/guides/09-advanced-settings/assets/00-changing-folder.gif differ diff --git a/docs/docs/guides/09-advanced-settings/assets/00-reset-factory-settings.gif b/docs/docs/guides/09-advanced-settings/assets/00-reset-factory-settings.gif new file mode 100644 index 0000000000..81760848d3 Binary files /dev/null and b/docs/docs/guides/09-advanced-settings/assets/00-reset-factory-settings.gif differ diff --git a/docs/docs/guides/09-advanced-settings/assets/01-https-proxy-jan-configure.png b/docs/docs/guides/09-advanced-settings/assets/01-https-proxy-jan-configure.png new file mode 100644 index 0000000000..25e0f76601 Binary files /dev/null and b/docs/docs/guides/09-advanced-settings/assets/01-https-proxy-jan-configure.png differ diff --git a/docs/docs/template/QA_script.md b/docs/docs/template/QA_script.md index 05dbed2b41..bba667bcdc 100644 --- a/docs/docs/template/QA_script.md +++ b/docs/docs/template/QA_script.md @@ -1,6 +1,6 @@ # [Release Version] QA Script -**Release Version:** +**Release Version:** v0.4.6 **Operating System:** @@ -25,10 +25,10 @@ ### 3. Users uninstall app -- [ ] :key: Check that the uninstallation process removes all components of the app from the system. +- [ ] :key::warning: Check that the uninstallation process removes the app successfully from the system. - [ ] Clean the Jan root directory and open the app to check if it creates all the necessary folders, especially models and extensions. - [ ] When updating the app, check if the `/models` directory has any JSON files that change according to the update. 
-- [ ] Verify if updating the app also updates extensions correctly (test functionality changes; support notifications for necessary tests with each version related to extensions update). +- [ ] Verify if updating the app also updates extensions correctly (test functionality changes, support notifications for necessary tests with each version related to extensions update). ### 4. Users close app @@ -60,49 +60,45 @@ - [ ] :key: Ensure that the conversation thread is maintained without any loss of data upon sending multiple messages. - [ ] Test for the ability to send different types of messages (e.g., text, emojis, code blocks). - [ ] :key: Validate the scroll functionality in the chat window for lengthy conversations. -- [ ] Check if the user can renew responses multiple times. - [ ] Check if the user can copy the response. - [ ] Check if the user can delete responses. -- [ ] :warning: Test if the user deletes the message midway, then the assistant stops that response. - [ ] :key: Check the `clear message` button works. - [ ] :key: Check the `delete entire chat` works. -- [ ] :warning: Check if deleting all the chat retains the system prompt. +- [ ] Check if deleting all the chat retains the system prompt. - [ ] Check the output format of the AI (code blocks, JSON, markdown, ...). - [ ] :key: Validate that there is appropriate error handling and messaging if the assistant fails to respond. - [ ] Test assistant's ability to maintain context over multiple exchanges. - [ ] :key: Check the `create new chat` button works correctly - [ ] Confirm that by changing `models` mid-thread the app can still handle it. -- [ ] Check that by changing `instructions` mid-thread the app can still handle it. -- [ ] Check the `regenerate` button renews the response. -- [ ] Check the `Instructions` update correctly after the user updates it midway. +- [ ] Check the `regenerate` button renews the response (single / multiple times). 
+- [ ] Check the `Instructions` update correctly after the user updates it midway (mid-thread). ### 2. Users can customize chat settings like model parameters via both the GUI & thread.json -- [ ] :key: Confirm that the chat settings options are accessible via the GUI. +- [ ] :key: Confirm that the Threads settings options are accessible. - [ ] Test the functionality to adjust model parameters (e.g., Temperature, Top K, Top P) from the GUI and verify they are reflected in the chat behavior. - [ ] :key: Ensure that changes can be saved and persisted between sessions. - [ ] Validate that users can access and modify the thread.json file. - [ ] :key: Check that changes made in thread.json are correctly applied to the chat session upon reload or restart. -- [ ] Verify if there is a revert option to go back to previous settings after changes are made. -- [ ] Test for user feedback or confirmation after saving changes to settings. - [ ] Check the maximum and minimum limits of the adjustable parameters and how they affect the assistant's responses. - [ ] :key: Validate user permissions for those who can change settings and persist them. - [ ] :key: Ensure that users switch between threads with different models, the app can handle it. -### 3. Users can click on a history thread +### 3. Model dropdown +- [ ] :key: Model list should highlight recommended based on user RAM +- [ ] Model size should display (for both installed and imported models) +### 4. Users can click on a history thread - [ ] Test the ability to click on any thread in the history panel. - [ ] :key: Verify that clicking a thread brings up the past conversation in the main chat window. - [ ] :key: Ensure that the selected thread is highlighted or otherwise indicated in the history panel. - [ ] Confirm that the chat window displays the entire conversation from the selected history thread without any missing messages. 
- [ ] :key: Check the performance and accuracy of the history feature when dealing with a large number of threads. - [ ] Validate that historical threads reflect the exact state of the chat at that time, including settings. -- [ ] :key: :warning: Test the search functionality within the history panel for quick navigation. - [ ] :key: Verify the ability to delete or clean old threads. - [ ] :key: Confirm that changing the title of the thread updates correctly. -### 4. Users can config instructions for the assistant. - +### 5. Users can config instructions for the assistant. - [ ] Ensure there is a clear interface to input or change instructions for the assistant. - [ ] Test if the instructions set by the user are being followed by the assistant in subsequent conversations. - [ ] :key: Validate that changes to instructions are updated in real time and do not require a restart of the application or session. @@ -112,6 +108,8 @@ - [ ] Validate that instructions can be saved with descriptive names for easy retrieval. - [ ] :key: Check if the assistant can handle conflicting instructions and how it resolves them. - [ ] Ensure that instruction configurations are documented for user reference. +- [ ] :key: RAG - Users can import documents and the system should process queries about the uploaded file, providing accurate and appropriate responses in the conversation thread. + ## D. Hub @@ -125,8 +123,7 @@ - [ ] Display the best model for their RAM at the top. - [ ] :key: Ensure that models are labeled with RAM requirements and compatibility. -- [ ] :key: Validate that the download function is disabled for models that exceed the user's system capabilities. -- [ ] Test that the platform provides alternative recommendations for models not suitable due to RAM limitations. +- [ ] :warning: Test that the platform provides alternative recommendations for models not suitable due to RAM limitations. 
- [ ] :key: Check the download model functionality and validate if the cancel download feature works correctly. ### 3. Users can download models via a HuggingFace URL (coming soon) @@ -139,7 +136,7 @@ - [ ] :key: Have clear instructions so users can do their own. - [ ] :key: Ensure the new model updates after restarting the app. -- [ ] Ensure it raises clear errors for users to fix the problem while adding a new model. +- [ ] :warning:Ensure it raises clear errors for users to fix the problem while adding a new model. ### 5. Users can use the model as they want @@ -149,9 +146,13 @@ - [ ] Check if starting another model stops the other model entirely. - [ ] Check the `Explore models` navigate correctly to the model panel. - [ ] :key: Check when deleting a model it will delete all the files on the user's computer. -- [ ] The recommended tags should present right for the user's hardware. +- [ ] :warning:The recommended tags should present right for the user's hardware. - [ ] Assess that the descriptions of models are accurate and informative. +### 6. Users can Integrate With a Remote Server +- [ ] :key: Import openAI GPT model https://jan.ai/guides/using-models/integrate-with-remote-server/ and the model displayed in Hub / Thread dropdown +- [ ] Users can use the remote model properly + ## E. System Monitor ### 1. Users can see disk and RAM utilization @@ -181,7 +182,7 @@ - [ ] Confirm that the application saves the theme preference and persists it across sessions. - [ ] Validate that all elements of the UI are compatible with the theme changes and maintain legibility and contrast. -### 2. Users change the extensions +### 2. Users change the extensions [TBU] - [ ] Confirm that the `Extensions` tab lists all available plugins. - [ ] :key: Test the toggle switch for each plugin to ensure it enables or disables the plugin correctly. @@ -208,3 +209,19 @@ - [ ] :key: Test that the application prevents the installation of incompatible or corrupt plugin files. 
- [ ] :key: Check that the user can uninstall or disable custom plugins as easily as pre-installed ones. - [ ] Verify that the application's performance remains stable after the installation of custom plugins. + +### 5. Advanced Settings +- [ ] Attemp to test downloading model from hub using **HTTP Proxy** [guideline](https://github.com/janhq/jan/pull/1562) +- [ ] Users can move **Jan data folder** +- [ ] Users can click on Reset button to **factory reset** app settings to its original state & delete all usage data. + +## G. Local API server + +### 1. Local Server Usage with Server Options +- [ ] :key: Explore API Reference: Swagger API for sending/receiving requests + - [ ] Use default server option + - [ ] Configure and use custom server options +- [ ] Test starting/stopping the local API server with different Model/Model settings +- [ ] Server logs captured with correct Server Options provided +- [ ] Verify functionality of Open logs/Clear feature +- [ ] Ensure that threads and other functions impacting the model are disabled while the local server is running diff --git a/docs/openapi/jan.yaml b/docs/openapi/jan.yaml index bfff0ad738..864c80fdf6 100644 --- a/docs/openapi/jan.yaml +++ b/docs/openapi/jan.yaml @@ -67,20 +67,31 @@ paths: x-codeSamples: - lang: cURL source: | - curl http://localhost:1337/v1/chat/completions \ - -H "Content-Type: application/json" \ + curl -X 'POST' \ + 'http://localhost:1337/v1/chat/completions' \ + -H 'accept: application/json' \ + -H 'Content-Type: application/json' \ -d '{ - "model": "tinyllama-1.1b", "messages": [ { - "role": "system", - "content": "You are a helpful assistant." + "content": "You are a helpful assistant.", + "role": "system" }, { - "role": "user", - "content": "Hello!" 
+ "content": "Hello!", + "role": "user" } - ] + ], + "model": "tinyllama-1.1b", + "stream": true, + "max_tokens": 2048, + "stop": [ + "hello" + ], + "frequency_penalty": 0, + "presence_penalty": 0, + "temperature": 0.7, + "top_p": 0.95 }' /models: get: @@ -103,7 +114,9 @@ paths: x-codeSamples: - lang: cURL source: | - curl http://localhost:1337/v1/models + curl -X 'GET' \ + 'http://localhost:1337/v1/models' \ + -H 'accept: application/json' "/models/download/{model_id}": get: operationId: downloadModel @@ -131,7 +144,9 @@ paths: x-codeSamples: - lang: cURL source: | - curl -X POST http://localhost:1337/v1/models/download/{model_id} + curl -X 'GET' \ + 'http://localhost:1337/v1/models/download/{model_id}' \ + -H 'accept: application/json' "/models/{model_id}": get: operationId: retrieveModel @@ -162,7 +177,9 @@ paths: x-codeSamples: - lang: cURL source: | - curl http://localhost:1337/v1/models/{model_id} + curl -X 'GET' \ + 'http://localhost:1337/v1/models/{model_id}' \ + -H 'accept: application/json' delete: operationId: deleteModel tags: @@ -191,7 +208,9 @@ paths: x-codeSamples: - lang: cURL source: | - curl -X DELETE http://localhost:1337/v1/models/{model_id} + curl -X 'DELETE' \ + 'http://localhost:1337/v1/models/{model_id}' \ + -H 'accept: application/json' /threads: post: operationId: createThread diff --git a/docs/openapi/specs/assistants.yaml b/docs/openapi/specs/assistants.yaml index d784c315a6..5db1f6a976 100644 --- a/docs/openapi/specs/assistants.yaml +++ b/docs/openapi/specs/assistants.yaml @@ -316,4 +316,4 @@ components: deleted: type: boolean description: Indicates whether the assistant was successfully deleted. 
- example: true \ No newline at end of file + example: true diff --git a/docs/openapi/specs/chat.yaml b/docs/openapi/specs/chat.yaml index b324501a86..cfa3915982 100644 --- a/docs/openapi/specs/chat.yaml +++ b/docs/openapi/specs/chat.yaml @@ -188,4 +188,4 @@ components: total_tokens: type: integer example: 533 - description: Total number of tokens used \ No newline at end of file + description: Total number of tokens used diff --git a/docs/openapi/specs/messages.yaml b/docs/openapi/specs/messages.yaml index d9d7d87a40..6f5fe1a58f 100644 --- a/docs/openapi/specs/messages.yaml +++ b/docs/openapi/specs/messages.yaml @@ -1,3 +1,4 @@ +--- components: schemas: MessageObject: @@ -75,7 +76,7 @@ components: example: msg_abc123 object: type: string - description: "Type of the object, indicating it's a thread message." + description: Type of the object, indicating it's a thread message. default: thread.message created_at: type: integer @@ -88,7 +89,7 @@ components: example: thread_abc123 role: type: string - description: "Role of the sender, either 'user' or 'assistant'." + description: Role of the sender, either 'user' or 'assistant'. example: user content: type: array @@ -97,7 +98,7 @@ components: properties: type: type: string - description: "Type of content, e.g., 'text'." + description: Type of content, e.g., 'text'. example: text text: type: object @@ -110,21 +111,21 @@ components: type: array items: type: string - description: "Annotations for the text content, if any." + description: Annotations for the text content, if any. example: [] file_ids: type: array items: type: string - description: "Array of file IDs associated with the message, if any." + description: Array of file IDs associated with the message, if any. example: [] assistant_id: type: string - description: "Identifier of the assistant involved in the message, if applicable." + description: Identifier of the assistant involved in the message, if applicable. 
example: null run_id: type: string - description: "Run ID associated with the message, if applicable." + description: Run ID associated with the message, if applicable. example: null metadata: type: object @@ -139,7 +140,7 @@ components: example: msg_abc123 object: type: string - description: "Type of the object, indicating it's a thread message." + description: Type of the object, indicating it's a thread message. example: thread.message created_at: type: integer @@ -152,7 +153,7 @@ components: example: thread_abc123 role: type: string - description: "Role of the sender, either 'user' or 'assistant'." + description: Role of the sender, either 'user' or 'assistant'. example: user content: type: array @@ -161,7 +162,7 @@ components: properties: type: type: string - description: "Type of content, e.g., 'text'." + description: Type of content, e.g., 'text'. example: text text: type: object @@ -174,21 +175,21 @@ components: type: array items: type: string - description: "Annotations for the text content, if any." + description: Annotations for the text content, if any. example: [] file_ids: type: array items: type: string - description: "Array of file IDs associated with the message, if any." + description: Array of file IDs associated with the message, if any. example: [] assistant_id: type: string - description: "Identifier of the assistant involved in the message, if applicable." + description: Identifier of the assistant involved in the message, if applicable. example: null run_id: type: string - description: "Run ID associated with the message, if applicable." + description: Run ID associated with the message, if applicable. example: null metadata: type: object @@ -199,7 +200,7 @@ components: properties: object: type: string - description: "Type of the object, indicating it's a list." + description: Type of the object, indicating it's a list. 
default: list data: type: array @@ -226,7 +227,7 @@ components: example: msg_abc123 object: type: string - description: "Type of the object, indicating it's a thread message." + description: Type of the object, indicating it's a thread message. example: thread.message created_at: type: integer @@ -239,7 +240,7 @@ components: example: thread_abc123 role: type: string - description: "Role of the sender, either 'user' or 'assistant'." + description: Role of the sender, either 'user' or 'assistant'. example: user content: type: array @@ -248,7 +249,7 @@ components: properties: type: type: string - description: "Type of content, e.g., 'text'." + description: Type of content, e.g., 'text'. text: type: object properties: @@ -260,20 +261,20 @@ components: type: array items: type: string - description: "Annotations for the text content, if any." + description: Annotations for the text content, if any. file_ids: type: array items: type: string - description: "Array of file IDs associated with the message, if any." + description: Array of file IDs associated with the message, if any. example: [] assistant_id: type: string - description: "Identifier of the assistant involved in the message, if applicable." + description: Identifier of the assistant involved in the message, if applicable. example: null run_id: type: string - description: "Run ID associated with the message, if applicable." + description: Run ID associated with the message, if applicable. 
example: null metadata: type: object @@ -309,4 +310,4 @@ components: data: type: array items: - $ref: "#/components/schemas/MessageFileObject" \ No newline at end of file + $ref: "#/components/schemas/MessageFileObject" diff --git a/docs/openapi/specs/models.yaml b/docs/openapi/specs/models.yaml index 8113f3ab80..40e6abaaff 100644 --- a/docs/openapi/specs/models.yaml +++ b/docs/openapi/specs/models.yaml @@ -18,114 +18,82 @@ components: Model: type: object properties: - type: + source_url: type: string - default: model - description: The type of the object. - version: - type: string - default: "1" - description: The version number of the model. + format: uri + description: URL to the source of the model. + example: https://huggingface.co/janhq/trinity-v1.2-GGUF/resolve/main/trinity-v1.2.Q4_K_M.gguf id: type: string - description: Unique identifier used in chat-completions model_name, matches + description: + Unique identifier used in chat-completions model_name, matches folder name. - example: zephyr-7b + example: trinity-v1.2-7b + object: + type: string + example: model name: type: string description: Name of the model. - example: Zephyr 7B - owned_by: + example: Trinity-v1.2 7B Q4 + version: type: string - description: Compatibility field for OpenAI. - default: "" - created: - type: integer - format: int64 - description: Unix timestamp representing the creation time. + default: "1.0" + description: The version number of the model. description: type: string description: Description of the model. - state: - type: string - enum: - - null - - downloading - - ready - - starting - - stopping - description: Current state of the model. + example: + Trinity is an experimental model merge using the Slerp method. + Recommended for daily assistance purposes. format: type: string description: State format of the model, distinct from the engine. 
- example: ggufv3 - source: - type: array - items: - type: object - properties: - url: - format: uri - description: URL to the source of the model. - example: https://huggingface.co/TheBloke/zephyr-7B-beta-GGUF/blob/main/zephyr-7b-beta.Q4_K_M.gguf - filename: - type: string - description: Filename of the model. - example: zephyr-7b-beta.Q4_K_M.gguf + example: gguf settings: type: object properties: ctx_len: - type: string + type: integer description: Context length. - example: "4096" - ngl: - type: string - description: Number of layers. - example: "100" - embedding: - type: string - description: Indicates if embedding is enabled. - example: "true" - n_parallel: + example: 4096 + prompt_template: type: string - description: Number of parallel processes. - example: "4" + example: "<|im_start|>system\n{system_message}<|im_end|>\n<|im_start|>user\n{prompt}<|im_end|>\n<|im_start|>assistant" additionalProperties: false parameters: type: object properties: temperature: - type: string - description: Temperature setting for the model. - example: "0.7" - token_limit: - type: string - description: Token limit for the model. - example: "4096" - top_k: - type: string - description: Top-k setting for the model. - example: "0" + example: 0.7 top_p: - type: string - description: Top-p setting for the model. - example: "1" + example: 0.95 stream: - type: string - description: Indicates if streaming is enabled. - example: "true" + example: true + max_tokens: + example: 4096 + stop: + example: [] + frequency_penalty: + example: 0 + presence_penalty: + example: 0 additionalProperties: false metadata: - type: object - description: Additional metadata. - assets: - type: array - items: + author: type: string - description: List of assets related to the model. 
- required: - - source + example: Jan + tags: + example: + - 7B + - Merged + - Featured + size: + example: 4370000000, + cover: + example: https://raw.githubusercontent.com/janhq/jan/main/models/trinity-v1.2-7b/cover.png + engine: + example: nitro ModelObject: type: object properties: @@ -133,7 +101,7 @@ components: type: string description: | The identifier of the model. - example: zephyr-7b + example: trinity-v1.2-7b object: type: string description: | @@ -153,197 +121,89 @@ components: GetModelResponse: type: object properties: + source_url: + type: string + format: uri + description: URL to the source of the model. + example: https://huggingface.co/TheBloke/Mistral-7B-Instruct-v0.2-GGUF/resolve/main/mistral-7b-instruct-v0.2.Q4_K_M.gguf id: type: string - description: The identifier of the model. - example: zephyr-7b + description: + Unique identifier used in chat-completions model_name, matches + folder name. + example: mistral-ins-7b-q4 object: type: string - description: Type of the object, indicating it's a model. - default: model - created: - type: integer - format: int64 - description: Unix timestamp representing the creation time of the model. - owned_by: + example: model + name: type: string - description: The entity that owns the model. - example: _ - state: + description: Name of the model. + example: Mistral Instruct 7B Q4 + version: type: string - enum: - - not_downloaded - - downloaded - - running - - stopped - description: The current state of the model. - source: - type: array - items: - type: object - properties: - url: - format: uri - description: URL to the source of the model. - example: https://huggingface.co/TheBloke/zephyr-7B-beta-GGUF/blob/main/zephyr-7b-beta.Q4_K_M.gguf - filename: - type: string - description: Filename of the model. - example: zephyr-7b-beta.Q4_K_M.gguf - engine_parameters: + default: "1.0" + description: The version number of the model. + description: + type: string + description: Description of the model. 
+ example: + Trinity is an experimental model merge using the Slerp method. + Recommended for daily assistance purposes. + format: + type: string + description: State format of the model, distinct from the engine. + example: gguf + settings: type: object properties: - pre_prompt: - type: string - description: Predefined prompt used for setting up internal configurations. - default: "" - example: Initial setup complete. - system_prompt: - type: string - description: Prefix used for system-level prompts. - default: "SYSTEM: " - user_prompt: - type: string - description: Prefix used for user prompts. - default: "USER: " - ai_prompt: - type: string - description: Prefix used for assistant prompts. - default: "ASSISTANT: " - ngl: - type: integer - description: Number of neural network layers loaded onto the GPU for - acceleration. - minimum: 0 - maximum: 100 - default: 100 - example: 100 ctx_len: type: integer - description: Context length for model operations, varies based on the specific - model. - minimum: 128 - maximum: 4096 - default: 4096 + description: Context length. example: 4096 - n_parallel: - type: integer - description: Number of parallel operations, relevant when continuous batching is - enabled. - minimum: 1 - maximum: 10 - default: 1 - example: 4 - cont_batching: - type: boolean - description: Indicates if continuous batching is used for processing. - default: false - example: false - cpu_threads: - type: integer - description: Number of threads allocated for CPU-based inference. - minimum: 1 - example: 8 - embedding: - type: boolean - description: Indicates if embedding layers are enabled in the model. - default: true - example: true - model_parameters: + prompt_template: + type: string + example: "[INST] {prompt} [/INST]" + additionalProperties: false + parameters: type: object properties: - ctx_len: - type: integer - description: Maximum context length the model can handle. 
- minimum: 0 - maximum: 4096 - default: 4096 - example: 4096 - ngl: - type: integer - description: Number of layers in the neural network. - minimum: 1 - maximum: 100 - default: 100 - example: 100 - embedding: - type: boolean - description: Indicates if embedding layers are used. - default: true - example: true - n_parallel: - type: integer - description: Number of parallel processes the model can run. - minimum: 1 - maximum: 10 - default: 1 - example: 4 temperature: - type: number - description: Controls randomness in model's responses. Higher values lead to - more random responses. - minimum: 0 - maximum: 2 - default: 0.7 example: 0.7 - token_limit: - type: integer - description: Maximum number of tokens the model can generate in a single - response. - minimum: 1 - maximum: 4096 - default: 4096 + top_p: + example: 0.95 + stream: + example: true + max_tokens: example: 4096 - top_k: - type: integer - description: Limits the model to consider only the top k most likely next tokens - at each step. - minimum: 0 - maximum: 100 - default: 0 + stop: + example: [] + frequency_penalty: example: 0 - top_p: - type: number - description: Nucleus sampling parameter. The model considers the smallest set of - tokens whose cumulative probability exceeds the top_p value. - minimum: 0 - maximum: 1 - default: 1 - example: 1 + presence_penalty: + example: 0 + additionalProperties: false metadata: - type: object - properties: - engine: - type: string - description: The engine used by the model. - enum: - - nitro - - openai - - hf_inference - quantization: - type: string - description: Quantization parameter of the model. - example: Q3_K_L - size: - type: string - description: Size of the model. 
- example: 7B - required: - - id - - object - - created - - owned_by - - state - - source - - parameters - - metadata + author: + type: string + example: MistralAI + tags: + example: + - 7B + - Featured + - Foundation Model + size: + example: 4370000000, + cover: + example: https://raw.githubusercontent.com/janhq/jan/main/models/mistral-ins-7b-q4/cover.png + engine: + example: nitro DeleteModelResponse: type: object properties: id: type: string description: The identifier of the model that was deleted. - example: model-zephyr-7B + example: mistral-ins-7b-q4 object: type: string description: Type of the object, indicating it's a model. diff --git a/docs/openapi/specs/threads.yaml b/docs/openapi/specs/threads.yaml index fe00f75884..40b2463fa5 100644 --- a/docs/openapi/specs/threads.yaml +++ b/docs/openapi/specs/threads.yaml @@ -142,7 +142,7 @@ components: example: Jan instructions: type: string - description: | + description: > The instruction of assistant, defaults to "Be my grammar corrector" model: type: object @@ -224,4 +224,4 @@ components: deleted: type: boolean description: Indicates whether the thread was successfully deleted. 
- example: true \ No newline at end of file + example: true diff --git a/electron/.prettierrc b/electron/.prettierrc deleted file mode 100644 index 46f1abcb02..0000000000 --- a/electron/.prettierrc +++ /dev/null @@ -1,8 +0,0 @@ -{ - "semi": false, - "singleQuote": true, - "quoteProps": "consistent", - "trailingComma": "es5", - "endOfLine": "auto", - "plugins": ["prettier-plugin-tailwindcss"] -} diff --git a/electron/handlers/app.ts b/electron/handlers/app.ts deleted file mode 100644 index c1f431ef3c..0000000000 --- a/electron/handlers/app.ts +++ /dev/null @@ -1,173 +0,0 @@ -import { app, ipcMain, dialog, shell } from 'electron' -import { join, basename, relative as getRelative, isAbsolute } from 'path' -import { WindowManager } from './../managers/window' -import { getResourcePath } from './../utils/path' -import { AppRoute, AppConfiguration } from '@janhq/core' -import { ServerConfig, startServer, stopServer } from '@janhq/server' -import { - ModuleManager, - getJanDataFolderPath, - getJanExtensionsPath, - init, - log, - logServer, - getAppConfigurations, - updateAppConfiguration, -} from '@janhq/core/node' - -export function handleAppIPCs() { - /** - * Handles the "openAppDirectory" IPC message by opening the app's user data directory. - * The `shell.openPath` method is used to open the directory in the user's default file explorer. - * @param _event - The IPC event object. - */ - ipcMain.handle(AppRoute.openAppDirectory, async (_event) => { - shell.openPath(getJanDataFolderPath()) - }) - - /** - * Opens a URL in the user's default browser. - * @param _event - The IPC event object. - * @param url - The URL to open. - */ - ipcMain.handle(AppRoute.openExternalUrl, async (_event, url) => { - shell.openExternal(url) - }) - - /** - * Opens a URL in the user's default browser. - * @param _event - The IPC event object. - * @param url - The URL to open. 
- */ - ipcMain.handle(AppRoute.openFileExplore, async (_event, url) => { - shell.openPath(url) - }) - - /** - * Joins multiple paths together, respect to the current OS. - */ - ipcMain.handle(AppRoute.joinPath, async (_event, paths: string[]) => - join(...paths) - ) - - /** - * Checks if the given path is a subdirectory of the given directory. - * - * @param _event - The IPC event object. - * @param from - The path to check. - * @param to - The directory to check against. - * - * @returns {Promise} - A promise that resolves with the result. - */ - ipcMain.handle( - AppRoute.isSubdirectory, - async (_event, from: string, to: string) => { - const relative = getRelative(from, to) - const isSubdir = - relative && !relative.startsWith('..') && !isAbsolute(relative) - - if (isSubdir === '') return false - else return isSubdir - } - ) - - /** - * Retrieve basename from given path, respect to the current OS. - */ - ipcMain.handle(AppRoute.baseName, async (_event, path: string) => - basename(path) - ) - - /** - * Start Jan API Server. - */ - ipcMain.handle(AppRoute.startServer, async (_event, configs?: ServerConfig) => - startServer({ - host: configs?.host, - port: configs?.port, - isCorsEnabled: configs?.isCorsEnabled, - isVerboseEnabled: configs?.isVerboseEnabled, - schemaPath: app.isPackaged - ? join(getResourcePath(), 'docs', 'openapi', 'jan.yaml') - : undefined, - baseDir: app.isPackaged - ? join(getResourcePath(), 'docs', 'openapi') - : undefined, - }) - ) - - /** - * Stop Jan API Server. - */ - ipcMain.handle(AppRoute.stopServer, stopServer) - - /** - * Relaunches the app in production - reload window in development. - * @param _event - The IPC event object. - * @param url - The URL to reload. 
- */ - ipcMain.handle(AppRoute.relaunch, async (_event) => { - ModuleManager.instance.clearImportedModules() - - if (app.isPackaged) { - app.relaunch() - app.exit() - } else { - for (const modulePath in ModuleManager.instance.requiredModules) { - delete require.cache[ - require.resolve(join(getJanExtensionsPath(), modulePath)) - ] - } - init({ - // Function to check from the main process that user wants to install a extension - confirmInstall: async (_extensions: string[]) => { - return true - }, - // Path to install extension to - extensionsPath: getJanExtensionsPath(), - }) - WindowManager.instance.currentWindow?.reload() - } - }) - - /** - * Log message to log file. - */ - ipcMain.handle(AppRoute.log, async (_event, message) => log(message)) - - /** - * Log message to log file. - */ - ipcMain.handle(AppRoute.logServer, async (_event, message) => - logServer(message) - ) - - ipcMain.handle(AppRoute.selectDirectory, async () => { - const mainWindow = WindowManager.instance.currentWindow - if (!mainWindow) { - console.error('No main window found') - return - } - const { canceled, filePaths } = await dialog.showOpenDialog(mainWindow, { - title: 'Select a folder', - buttonLabel: 'Select Folder', - properties: ['openDirectory', 'createDirectory'], - }) - if (canceled) { - return - } else { - return filePaths[0] - } - }) - - ipcMain.handle(AppRoute.getAppConfigurations, async () => - getAppConfigurations() - ) - - ipcMain.handle( - AppRoute.updateAppConfiguration, - async (_event, appConfiguration: AppConfiguration) => { - await updateAppConfiguration(appConfiguration) - } - ) -} diff --git a/electron/handlers/common.ts b/electron/handlers/common.ts new file mode 100644 index 0000000000..5a54a92bdf --- /dev/null +++ b/electron/handlers/common.ts @@ -0,0 +1,25 @@ +import { Handler, RequestHandler } from '@janhq/core/node' +import { ipcMain } from 'electron' +import { WindowManager } from '../managers/window' + +export function injectHandler() { + const ipcWrapper: 
Handler = ( + route: string, + listener: (...args: any[]) => any + ) => { + return ipcMain.handle(route, async (event, ...args: any[]) => { + return listener(...args) + }) + } + + const handler = new RequestHandler( + ipcWrapper, + (channel: string, args: any) => { + return WindowManager.instance.currentWindow?.webContents.send( + channel, + args + ) + } + ) + handler.handle() +} diff --git a/electron/handlers/download.ts b/electron/handlers/download.ts deleted file mode 100644 index f63e56f6bb..0000000000 --- a/electron/handlers/download.ts +++ /dev/null @@ -1,121 +0,0 @@ -import { ipcMain } from 'electron' -import { resolve } from 'path' -import { WindowManager } from './../managers/window' -import request from 'request' -import { createWriteStream, renameSync } from 'fs' -import { DownloadEvent, DownloadRoute } from '@janhq/core' -const progress = require('request-progress') -import { DownloadManager, getJanDataFolderPath, normalizeFilePath } from '@janhq/core/node' - -export function handleDownloaderIPCs() { - /** - * Handles the "pauseDownload" IPC message by pausing the download associated with the provided fileName. - * @param _event - The IPC event object. - * @param fileName - The name of the file being downloaded. - */ - ipcMain.handle(DownloadRoute.pauseDownload, async (_event, fileName) => { - DownloadManager.instance.networkRequests[fileName]?.pause() - }) - - /** - * Handles the "resumeDownload" IPC message by resuming the download associated with the provided fileName. - * @param _event - The IPC event object. - * @param fileName - The name of the file being downloaded. - */ - ipcMain.handle(DownloadRoute.resumeDownload, async (_event, fileName) => { - DownloadManager.instance.networkRequests[fileName]?.resume() - }) - - /** - * Handles the "abortDownload" IPC message by aborting the download associated with the provided fileName. - * The network request associated with the fileName is then removed from the networkRequests object. 
- * @param _event - The IPC event object. - * @param fileName - The name of the file being downloaded. - */ - ipcMain.handle(DownloadRoute.abortDownload, async (_event, fileName) => { - const rq = DownloadManager.instance.networkRequests[fileName] - if (rq) { - DownloadManager.instance.networkRequests[fileName] = undefined - rq?.abort() - } else { - WindowManager?.instance.currentWindow?.webContents.send( - DownloadEvent.onFileDownloadError, - { - fileName, - err: { message: 'aborted' }, - } - ) - } - }) - - /** - * Downloads a file from a given URL. - * @param _event - The IPC event object. - * @param url - The URL to download the file from. - * @param fileName - The name to give the downloaded file. - */ - ipcMain.handle( - DownloadRoute.downloadFile, - async (_event, url, fileName, network) => { - const strictSSL = !network?.ignoreSSL - const proxy = network?.proxy?.startsWith('http') - ? network.proxy - : undefined - - if (typeof fileName === 'string') { - fileName = normalizeFilePath(fileName) - } - const destination = resolve(getJanDataFolderPath(), fileName) - const rq = request({ url, strictSSL, proxy }) - - // Put request to download manager instance - DownloadManager.instance.setRequest(fileName, rq) - - // Downloading file to a temp file first - const downloadingTempFile = `${destination}.download` - - progress(rq, {}) - .on('progress', function (state: any) { - WindowManager?.instance.currentWindow?.webContents.send( - DownloadEvent.onFileDownloadUpdate, - { - ...state, - fileName, - } - ) - }) - .on('error', function (err: Error) { - WindowManager?.instance.currentWindow?.webContents.send( - DownloadEvent.onFileDownloadError, - { - fileName, - err, - } - ) - }) - .on('end', function () { - if (DownloadManager.instance.networkRequests[fileName]) { - // Finished downloading, rename temp file to actual file - renameSync(downloadingTempFile, destination) - - WindowManager?.instance.currentWindow?.webContents.send( - DownloadEvent.onFileDownloadSuccess, - { 
- fileName, - } - ) - DownloadManager.instance.setRequest(fileName, undefined) - } else { - WindowManager?.instance.currentWindow?.webContents.send( - DownloadEvent.onFileDownloadError, - { - fileName, - err: { message: 'aborted' }, - } - ) - } - }) - .pipe(createWriteStream(downloadingTempFile)) - } - ) -} diff --git a/electron/handlers/extension.ts b/electron/handlers/extension.ts deleted file mode 100644 index 763c4cdecb..0000000000 --- a/electron/handlers/extension.ts +++ /dev/null @@ -1,104 +0,0 @@ -import { ipcMain, webContents } from 'electron' -import { readdirSync } from 'fs' -import { join, extname } from 'path' - -import { - installExtensions, - getExtension, - removeExtension, - getActiveExtensions, - ModuleManager, - getJanExtensionsPath, -} from '@janhq/core/node' - -import { getResourcePath } from './../utils/path' -import { ExtensionRoute } from '@janhq/core' - -export function handleExtensionIPCs() { - /**MARK: General handlers */ - /** - * Invokes a function from a extension module in main node process. - * @param _event - The IPC event object. - * @param modulePath - The path to the extension module. - * @param method - The name of the function to invoke. - * @param args - The arguments to pass to the function. - * @returns The result of the invoked function. - */ - ipcMain.handle( - ExtensionRoute.invokeExtensionFunc, - async (_event, modulePath, method, ...args) => { - const module = require( - /* webpackIgnore: true */ join(getJanExtensionsPath(), modulePath) - ) - ModuleManager.instance.setModule(modulePath, module) - - if (typeof module[method] === 'function') { - return module[method](...args) - } else { - console.debug(module[method]) - console.error(`Function "${method}" does not exist in the module.`) - } - } - ) - - /** - * Returns the paths of the base extensions. - * @param _event - The IPC event object. - * @returns An array of paths to the base extensions. 
- */ - ipcMain.handle(ExtensionRoute.baseExtensions, async (_event) => { - const baseExtensionPath = join(getResourcePath(), 'pre-install') - return readdirSync(baseExtensionPath) - .filter((file) => extname(file) === '.tgz') - .map((file) => join(baseExtensionPath, file)) - }) - - /**MARK: Extension Manager handlers */ - ipcMain.handle(ExtensionRoute.installExtension, async (e, extensions) => { - // Install and activate all provided extensions - const installed = await installExtensions(extensions) - return JSON.parse(JSON.stringify(installed)) - }) - - // Register IPC route to uninstall a extension - ipcMain.handle( - ExtensionRoute.uninstallExtension, - async (e, extensions, reload) => { - // Uninstall all provided extensions - for (const ext of extensions) { - const extension = getExtension(ext) - await extension.uninstall() - if (extension.name) removeExtension(extension.name) - } - - // Reload all renderer pages if needed - reload && webContents.getAllWebContents().forEach((wc) => wc.reload()) - return true - } - ) - - // Register IPC route to update a extension - ipcMain.handle( - ExtensionRoute.updateExtension, - async (e, extensions, reload) => { - // Update all provided extensions - const updated: any[] = [] - for (const ext of extensions) { - const extension = getExtension(ext) - const res = await extension.update() - if (res) updated.push(extension) - } - - // Reload all renderer pages if needed - if (updated.length && reload) - webContents.getAllWebContents().forEach((wc) => wc.reload()) - - return JSON.parse(JSON.stringify(updated)) - } - ) - - // Register IPC route to get the list of active extensions - ipcMain.handle(ExtensionRoute.getActiveExtensions, () => { - return JSON.parse(JSON.stringify(getActiveExtensions())) - }) -} diff --git a/electron/handlers/fileManager.ts b/electron/handlers/fileManager.ts deleted file mode 100644 index e328cb53b7..0000000000 --- a/electron/handlers/fileManager.ts +++ /dev/null @@ -1,82 +0,0 @@ -import { ipcMain, app 
} from 'electron' -// @ts-ignore -import reflect from '@alumna/reflect' - -import { FileManagerRoute, FileStat } from '@janhq/core' -import { getResourcePath } from './../utils/path' -import fs from 'fs' -import { join } from 'path' -import { getJanDataFolderPath, normalizeFilePath } from '@janhq/core/node' - -/** - * Handles file system extensions operations. - */ -export function handleFileMangerIPCs() { - // Handles the 'syncFile' IPC event. This event is triggered to synchronize a file from a source path to a destination path. - ipcMain.handle( - FileManagerRoute.syncFile, - async (_event, src: string, dest: string) => { - return reflect({ - src, - dest, - recursive: true, - delete: false, - overwrite: true, - errorOnExist: false, - }) - } - ) - - // Handles the 'getJanDataFolderPath' IPC event. This event is triggered to get the user space path. - ipcMain.handle( - FileManagerRoute.getJanDataFolderPath, - (): Promise => Promise.resolve(getJanDataFolderPath()) - ) - - // Handles the 'getResourcePath' IPC event. This event is triggered to get the resource path. 
- ipcMain.handle(FileManagerRoute.getResourcePath, async (_event) => - getResourcePath() - ) - - ipcMain.handle(FileManagerRoute.getUserHomePath, async (_event) => - app.getPath('home') - ) - - // handle fs is directory here - ipcMain.handle( - FileManagerRoute.fileStat, - async (_event, path: string): Promise => { - const normalizedPath = normalizeFilePath(path) - - const fullPath = join(getJanDataFolderPath(), normalizedPath) - const isExist = fs.existsSync(fullPath) - if (!isExist) return undefined - - const isDirectory = fs.lstatSync(fullPath).isDirectory() - const size = fs.statSync(fullPath).size - - const fileStat: FileStat = { - isDirectory, - size, - } - - return fileStat - } - ) - - ipcMain.handle( - FileManagerRoute.writeBlob, - async (_event, path: string, data: string): Promise => { - try { - const normalizedPath = normalizeFilePath(path) - const dataBuffer = Buffer.from(data, 'base64') - fs.writeFileSync( - join(getJanDataFolderPath(), normalizedPath), - dataBuffer - ) - } catch (err) { - console.error(`writeFile ${path} result: ${err}`) - } - } - ) -} diff --git a/electron/handlers/fs.ts b/electron/handlers/fs.ts deleted file mode 100644 index 34026b9409..0000000000 --- a/electron/handlers/fs.ts +++ /dev/null @@ -1,26 +0,0 @@ -import { ipcMain } from 'electron' - -import { getJanDataFolderPath, normalizeFilePath } from '@janhq/core/node' -import fs from 'fs' -import { FileManagerRoute, FileSystemRoute } from '@janhq/core' -import { join } from 'path' -/** - * Handles file system operations. - */ -export function handleFsIPCs() { - const moduleName = 'fs' - Object.values(FileSystemRoute).forEach((route) => { - ipcMain.handle(route, async (event, ...args) => { - return import(moduleName).then((mdl) => - mdl[route]( - ...args.map((arg) => - typeof arg === 'string' && - (arg.startsWith(`file:/`) || arg.startsWith(`file:\\`)) - ? 
join(getJanDataFolderPath(), normalizeFilePath(arg)) - : arg - ) - ) - ) - }) - }) -} diff --git a/electron/handlers/native.ts b/electron/handlers/native.ts new file mode 100644 index 0000000000..14ead07bd3 --- /dev/null +++ b/electron/handlers/native.ts @@ -0,0 +1,86 @@ +import { app, ipcMain, dialog, shell } from 'electron' +import { join } from 'path' +import { WindowManager } from '../managers/window' +import { + ModuleManager, + getJanDataFolderPath, + getJanExtensionsPath, + init, +} from '@janhq/core/node' +import { NativeRoute } from '@janhq/core' + +export function handleAppIPCs() { + /** + * Handles the "openAppDirectory" IPC message by opening the app's user data directory. + * The `shell.openPath` method is used to open the directory in the user's default file explorer. + * @param _event - The IPC event object. + */ + ipcMain.handle(NativeRoute.openAppDirectory, async (_event) => { + shell.openPath(getJanDataFolderPath()) + }) + + /** + * Opens a URL in the user's default browser. + * @param _event - The IPC event object. + * @param url - The URL to open. + */ + ipcMain.handle(NativeRoute.openExternalUrl, async (_event, url) => { + shell.openExternal(url) + }) + + /** + * Opens a URL in the user's default browser. + * @param _event - The IPC event object. + * @param url - The URL to open. + */ + ipcMain.handle(NativeRoute.openFileExplore, async (_event, url) => { + shell.openPath(url) + }) + + /** + * Relaunches the app in production - reload window in development. + * @param _event - The IPC event object. + * @param url - The URL to reload. 
+ */ + ipcMain.handle(NativeRoute.relaunch, async (_event) => { + ModuleManager.instance.clearImportedModules() + + if (app.isPackaged) { + app.relaunch() + app.exit() + } else { + for (const modulePath in ModuleManager.instance.requiredModules) { + delete require.cache[ + require.resolve(join(getJanExtensionsPath(), modulePath)) + ] + } + init({ + // Function to check from the main process that user wants to install a extension + confirmInstall: async (_extensions: string[]) => { + return true + }, + // Path to install extension to + extensionsPath: getJanExtensionsPath(), + }) + WindowManager.instance.currentWindow?.reload() + } + }) + + ipcMain.handle(NativeRoute.selectDirectory, async () => { + const mainWindow = WindowManager.instance.currentWindow + if (!mainWindow) { + console.error('No main window found') + return + } + const { canceled, filePaths } = await dialog.showOpenDialog(mainWindow, { + title: 'Select a folder', + buttonLabel: 'Select Folder', + properties: ['openDirectory', 'createDirectory'], + }) + if (canceled) { + return + } else { + return filePaths[0] + } + }) +} diff --git a/electron/handlers/update.ts b/electron/handlers/update.ts index cbb34c22b5..0d8cc4cc07 100644 --- a/electron/handlers/update.ts +++ b/electron/handlers/update.ts @@ -11,7 +11,8 @@ export function handleAppUpdates() { /* New Update Available */ autoUpdater.on('update-available', async (_info: any) => { const action = await dialog.showMessageBox({ - message: `Update available. 
Do you want to download the latest update?`, + title: 'Update Available', + message: 'Would you like to download and install it now?', buttons: ['Download', 'Later'], }) if (action.response === 0) await autoUpdater.downloadUpdate() @@ -36,7 +37,7 @@ export function handleAppUpdates() { autoUpdater.on('error', (info: any) => { WindowManager.instance.currentWindow?.webContents.send( AppEvent.onAppUpdateDownloadError, - {} + info ) }) diff --git a/electron/main.ts b/electron/main.ts index 5d7e59c0f3..de18b8f9de 100644 --- a/electron/main.ts +++ b/electron/main.ts @@ -1,4 +1,4 @@ -import { app, BrowserWindow } from 'electron' +import { app, BrowserWindow, shell } from 'electron' import { join } from 'path' /** * Managers @@ -9,12 +9,9 @@ import { log } from '@janhq/core/node' /** * IPC Handlers **/ -import { handleDownloaderIPCs } from './handlers/download' -import { handleExtensionIPCs } from './handlers/extension' -import { handleFileMangerIPCs } from './handlers/fileManager' -import { handleAppIPCs } from './handlers/app' +import { injectHandler } from './handlers/common' import { handleAppUpdates } from './handlers/update' -import { handleFsIPCs } from './handlers/fs' +import { handleAppIPCs } from './handlers/native' /** * Utils @@ -25,25 +22,12 @@ import { migrateExtensions } from './utils/migration' import { cleanUpAndQuit } from './utils/clean' import { setupExtensions } from './utils/extension' import { setupCore } from './utils/setup' +import { setupReactDevTool } from './utils/dev' +import { cleanLogs } from './utils/log' app .whenReady() - .then(async () => { - if (!app.isPackaged) { - // Which means you're running from source code - const { default: installExtension, REACT_DEVELOPER_TOOLS } = await import( - 'electron-devtools-installer' - ) // Don't use import on top level, since the installer package is dev-only - try { - const name = installExtension(REACT_DEVELOPER_TOOLS) - console.log(`Added Extension: ${name}`) - } catch (err) { - console.log('An 
error occurred while installing devtools:') - console.error(err) - // Only log the error and don't throw it because it's not critical - } - } - }) + .then(setupReactDevTool) .then(setupCore) .then(createUserSpace) .then(migrateExtensions) @@ -59,6 +43,7 @@ app } }) }) + .then(() => cleanLogs()) app.once('window-all-closed', () => { cleanUpAndQuit() @@ -92,23 +77,24 @@ function createMainWindow() { /* Open external links in the default browser */ mainWindow.webContents.setWindowOpenHandler(({ url }) => { - require('electron').shell.openExternal(url) + shell.openExternal(url) return { action: 'deny' } }) /* Enable dev tools for development */ if (!app.isPackaged) mainWindow.webContents.openDevTools() + log(`Version: ${app.getVersion()}`) } /** * Handles various IPC messages from the renderer process. */ function handleIPCs() { - handleFsIPCs() - handleDownloaderIPCs() - handleExtensionIPCs() + // Inject core handlers for IPCs + injectHandler() + + // Handle native IPCs handleAppIPCs() - handleFileMangerIPCs() } /* diff --git a/electron/merge-latest-ymls.js b/electron/merge-latest-ymls.js index 8172a31768..ee8caf825d 100644 --- a/electron/merge-latest-ymls.js +++ b/electron/merge-latest-ymls.js @@ -9,7 +9,9 @@ const file3 = args[2] // check that all arguments are present and throw error instead if (!file1 || !file2 || !file3) { - throw new Error('Please provide 3 file paths as arguments: path to file1, to file2 and destination path') + throw new Error( + 'Please provide 3 file paths as arguments: path to file1, to file2 and destination path' + ) } const doc1 = yaml.load(fs.readFileSync(file1, 'utf8')) diff --git a/electron/package.json b/electron/package.json index 08f15b2626..a89803077c 100644 --- a/electron/package.json +++ b/electron/package.json @@ -4,6 +4,7 @@ "main": "./build/main.js", "author": "Jan ", "license": "MIT", + "productName": "Jan", "homepage": "https://github.com/janhq/jan/tree/main/electron", "description": "Use offline LLMs with your own data. 
Run open source models like Llama2 or Falcon on your internal computers/servers.", "build": { @@ -11,7 +12,6 @@ "productName": "Jan", "files": [ "renderer/**/*", - "build/*.{js,map}", "build/**/*.{js,map}", "pre-install", "models/**/*", @@ -57,16 +57,17 @@ "scripts": { "lint": "eslint . --ext \".js,.jsx,.ts,.tsx\"", "test:e2e": "playwright test --workers=1", - "dev": "tsc -p . && electron .", - "build": "run-script-os", - "build:test": "run-script-os", + "copy:assets": "rimraf --glob \"./pre-install/*.tgz\" && cpx \"../pre-install/*.tgz\" \"./pre-install\"", + "dev": "yarn copy:assets && tsc -p . && electron .", + "build": "yarn copy:assets && run-script-os", + "build:test": "yarn copy:assets && run-script-os", "build:test:darwin": "tsc -p . && electron-builder -p never -m --dir", "build:test:win32": "tsc -p . && electron-builder -p never -w --dir", "build:test:linux": "tsc -p . && electron-builder -p never -l --dir", "build:darwin": "tsc -p . && electron-builder -p never -m", "build:win32": "tsc -p . && electron-builder -p never -w", "build:linux": "tsc -p . && electron-builder -p never -l deb -l AppImage", - "build:publish": "run-script-os", + "build:publish": "yarn copy:assets && run-script-os", "build:publish:darwin": "tsc -p . && electron-builder -p always -m", "build:publish:win32": "tsc -p . && electron-builder -p always -w", "build:publish:linux": "tsc -p . 
&& electron-builder -p always -l deb -l AppImage" @@ -76,7 +77,6 @@ "@janhq/core": "link:./core", "@janhq/server": "link:./server", "@npmcli/arborist": "^7.1.0", - "@types/request": "^2.48.12", "@uiball/loaders": "^1.3.0", "electron-store": "^8.1.0", "electron-updater": "^6.1.7", @@ -85,8 +85,6 @@ "pacote": "^17.0.4", "request": "^2.88.2", "request-progress": "^3.0.0", - "rimraf": "^5.0.5", - "typescript": "^5.2.2", "ulid": "^2.3.0", "use-debounce": "^9.0.4" }, @@ -95,6 +93,7 @@ "@playwright/test": "^1.38.1", "@types/npmcli__arborist": "^5.6.4", "@types/pacote": "^11.1.7", + "@types/request": "^2.48.12", "@typescript-eslint/eslint-plugin": "^6.7.3", "@typescript-eslint/parser": "^6.7.3", "electron": "28.0.0", @@ -102,7 +101,9 @@ "electron-devtools-installer": "^3.2.0", "electron-playwright-helpers": "^1.6.0", "eslint-plugin-react": "^7.33.2", - "run-script-os": "^1.1.6" + "rimraf": "^5.0.5", + "run-script-os": "^1.1.6", + "typescript": "^5.2.2" }, "installConfig": { "hoistingLimits": "workspaces" diff --git a/electron/playwright.config.ts b/electron/playwright.config.ts index 1fa3313f27..d3dff40c6a 100644 --- a/electron/playwright.config.ts +++ b/electron/playwright.config.ts @@ -1,9 +1,14 @@ import { PlaywrightTestConfig } from '@playwright/test' const config: PlaywrightTestConfig = { - testDir: './tests', + testDir: './tests/e2e', retries: 0, - globalTimeout: 300000, + globalTimeout: 350000, + use: { + screenshot: 'only-on-failure', + video: 'retain-on-failure', + trace: 'retain-on-failure', + }, + reporter: [['html', { outputFolder: './playwright-report' }]], } - export default config diff --git a/electron/sign.js b/electron/sign.js index 6e973eb6e3..73afedc4ef 100644 --- a/electron/sign.js +++ b/electron/sign.js @@ -1,44 +1,48 @@ -const { exec } = require('child_process'); - - -function sign({ path, name, certUrl, clientId, tenantId, clientSecret, certName, timestampServer, version }) { - return new Promise((resolve, reject) => { - - const command = 
`azuresigntool.exe sign -kvu "${certUrl}" -kvi "${clientId}" -kvt "${tenantId}" -kvs "${clientSecret}" -kvc "${certName}" -tr "${timestampServer}" -v "${path}"`; - - - exec(command, (error, stdout, stderr) => { - if (error) { - console.error(`Error: ${error}`); - return reject(error); - } - console.log(`stdout: ${stdout}`); - console.error(`stderr: ${stderr}`); - resolve(); - }); - }); +const { exec } = require('child_process') + +function sign({ + path, + name, + certUrl, + clientId, + tenantId, + clientSecret, + certName, + timestampServer, + version, +}) { + return new Promise((resolve, reject) => { + const command = `azuresigntool.exe sign -kvu "${certUrl}" -kvi "${clientId}" -kvt "${tenantId}" -kvs "${clientSecret}" -kvc "${certName}" -tr "${timestampServer}" -v "${path}"` + + exec(command, (error, stdout, stderr) => { + if (error) { + console.error(`Error: ${error}`) + return reject(error) + } + console.log(`stdout: ${stdout}`) + console.error(`stderr: ${stderr}`) + resolve() + }) + }) } - -exports.default = async function(options) { - - const certUrl = process.env.AZURE_KEY_VAULT_URI; - const clientId = process.env.AZURE_CLIENT_ID; - const tenantId = process.env.AZURE_TENANT_ID; - const clientSecret = process.env.AZURE_CLIENT_SECRET; - const certName = process.env.AZURE_CERT_NAME; - const timestampServer = 'http://timestamp.globalsign.com/tsa/r6advanced1'; - - - await sign({ - path: options.path, - name: "jan-win-x64", - certUrl, - clientId, - tenantId, - clientSecret, - certName, - timestampServer, - version: options.version - }); -}; +exports.default = async function (options) { + const certUrl = process.env.AZURE_KEY_VAULT_URI + const clientId = process.env.AZURE_CLIENT_ID + const tenantId = process.env.AZURE_TENANT_ID + const clientSecret = process.env.AZURE_CLIENT_SECRET + const certName = process.env.AZURE_CERT_NAME + const timestampServer = 'http://timestamp.globalsign.com/tsa/r6advanced1' + + await sign({ + path: options.path, + name: 'jan-win-x64', 
+ certUrl, + clientId, + tenantId, + clientSecret, + certName, + timestampServer, + version: options.version, + }) +} diff --git a/electron/tests/config/constants.ts b/electron/tests/config/constants.ts new file mode 100644 index 0000000000..7039ad58c3 --- /dev/null +++ b/electron/tests/config/constants.ts @@ -0,0 +1,4 @@ +export const Constants = { + VIDEO_DIR: './playwright-video', + TIMEOUT: '300000', +} diff --git a/electron/tests/config/fixtures.ts b/electron/tests/config/fixtures.ts new file mode 100644 index 0000000000..680b097853 --- /dev/null +++ b/electron/tests/config/fixtures.ts @@ -0,0 +1,119 @@ +import { + _electron as electron, + BrowserContext, + ElectronApplication, + expect, + Page, + test as base, +} from '@playwright/test' +import { + ElectronAppInfo, + findLatestBuild, + parseElectronApp, + stubDialog, +} from 'electron-playwright-helpers' +import { Constants } from './constants' +import { HubPage } from '../pages/hubPage' +import { CommonActions } from '../pages/commonActions' + +export let electronApp: ElectronApplication +export let page: Page +export let appInfo: ElectronAppInfo +export const TIMEOUT = parseInt(process.env.TEST_TIMEOUT || Constants.TIMEOUT) + +export async function setupElectron() { + process.env.CI = 'e2e' + + const latestBuild = findLatestBuild('dist') + expect(latestBuild).toBeTruthy() + + // parse the packaged Electron app and find paths and other info + appInfo = parseElectronApp(latestBuild) + expect(appInfo).toBeTruthy() + + electronApp = await electron.launch({ + args: [appInfo.main], // main file from package.json + executablePath: appInfo.executable, // path to the Electron executable + // recordVideo: { dir: Constants.VIDEO_DIR }, // Specify the directory for video recordings + }) + await stubDialog(electronApp, 'showMessageBox', { response: 1 }) + + page = await electronApp.firstWindow({ + timeout: TIMEOUT, + }) +} + +export async function teardownElectron() { + await page.close() + await electronApp.close() +} 
+ +/** + * this fixture is needed to record and attach videos / screenshot on failed tests when + * tests are run in serial mode (i.e. browser is not closed between tests) + */ +export const test = base.extend< + { + commonActions: CommonActions + hubPage: HubPage + attachVideoPage: Page + attachScreenshotsToReport: void + }, + { createVideoContext: BrowserContext } +>({ + commonActions: async ({ request }, use, testInfo) => { + await use(new CommonActions(page, testInfo)) + }, + hubPage: async ({ commonActions }, use) => { + await use(new HubPage(page, commonActions)) + }, + createVideoContext: [ + async ({ playwright }, use) => { + const context = electronApp.context() + await use(context) + }, + { scope: 'worker' }, + ], + + attachVideoPage: [ + async ({ createVideoContext }, use, testInfo) => { + await use(page) + + if (testInfo.status !== testInfo.expectedStatus) { + const path = await createVideoContext.pages()[0].video()?.path() + await createVideoContext.close() + await testInfo.attach('video', { + path: path, + }) + } + }, + { scope: 'test', auto: true }, + ], + + attachScreenshotsToReport: [ + async ({ commonActions }, use, testInfo) => { + await use() + + // After the test, we can check whether the test passed or failed. 
+ if (testInfo.status !== testInfo.expectedStatus) { + await commonActions.takeScreenshot('') + } + }, + { auto: true }, + ], +}) + +test.setTimeout(TIMEOUT) + +test.beforeAll(async () => { + await setupElectron() + await page.waitForSelector('img[alt="Jan - Logo"]', { + state: 'visible', + timeout: TIMEOUT, + }) +}) + +test.afterAll(async () => { + // temporally disabling this due to the config for parallel testing WIP + // teardownElectron() +}) diff --git a/electron/tests/e2e/hub.e2e.spec.ts b/electron/tests/e2e/hub.e2e.spec.ts new file mode 100644 index 0000000000..d968e76419 --- /dev/null +++ b/electron/tests/e2e/hub.e2e.spec.ts @@ -0,0 +1,19 @@ +import { test, appInfo } from '../config/fixtures' +import { expect } from '@playwright/test' + +test.beforeAll(async () => { + expect(appInfo).toMatchObject({ + asar: true, + executable: expect.anything(), + main: expect.anything(), + name: 'jan', + packageJson: expect.objectContaining({ name: 'jan' }), + platform: process.platform, + resourcesDir: expect.anything(), + }) +}) + +test('explores hub', async ({ hubPage }) => { + await hubPage.navigateByMenu() + await hubPage.verifyContainerVisible() +}) diff --git a/electron/tests/e2e/navigation.e2e.spec.ts b/electron/tests/e2e/navigation.e2e.spec.ts new file mode 100644 index 0000000000..66924ce786 --- /dev/null +++ b/electron/tests/e2e/navigation.e2e.spec.ts @@ -0,0 +1,24 @@ +import { expect } from '@playwright/test' +import { page, test, TIMEOUT } from '../config/fixtures' + +test('renders left navigation panel', async () => { + const systemMonitorBtn = await page + .getByTestId('System Monitor') + .first() + .isEnabled({ + timeout: TIMEOUT, + }) + const settingsBtn = await page + .getByTestId('Thread') + .first() + .isEnabled({ timeout: TIMEOUT }) + expect([systemMonitorBtn, settingsBtn].filter((e) => !e).length).toBe(0) + // Chat section should be there + await page.getByTestId('Local API Server').first().click({ + timeout: TIMEOUT, + }) + const localServer = 
page.getByTestId('local-server-testid').first() + await expect(localServer).toBeVisible({ + timeout: TIMEOUT, + }) +}) diff --git a/electron/tests/e2e/settings.e2e.spec.ts b/electron/tests/e2e/settings.e2e.spec.ts new file mode 100644 index 0000000000..06b4d1accf --- /dev/null +++ b/electron/tests/e2e/settings.e2e.spec.ts @@ -0,0 +1,11 @@ +import { expect } from '@playwright/test' + +import { test, page, TIMEOUT } from '../config/fixtures' + +test('shows settings', async () => { + await page.getByTestId('Settings').first().click({ + timeout: TIMEOUT, + }) + const settingDescription = page.getByTestId('testid-setting-description') + await expect(settingDescription).toBeVisible({ timeout: TIMEOUT }) +}) diff --git a/electron/tests/hub.e2e.spec.ts b/electron/tests/hub.e2e.spec.ts deleted file mode 100644 index cc72e037ea..0000000000 --- a/electron/tests/hub.e2e.spec.ts +++ /dev/null @@ -1,48 +0,0 @@ -import { _electron as electron } from 'playwright' -import { ElectronApplication, Page, expect, test } from '@playwright/test' - -import { - findLatestBuild, - parseElectronApp, - stubDialog, -} from 'electron-playwright-helpers' - -let electronApp: ElectronApplication -let page: Page -const TIMEOUT: number = parseInt(process.env.TEST_TIMEOUT || '300000') - -test.beforeAll(async () => { - process.env.CI = 'e2e' - - const latestBuild = findLatestBuild('dist') - expect(latestBuild).toBeTruthy() - - // parse the packaged Electron app and find paths and other info - const appInfo = parseElectronApp(latestBuild) - expect(appInfo).toBeTruthy() - - electronApp = await electron.launch({ - args: [appInfo.main], // main file from package.json - executablePath: appInfo.executable, // path to the Electron executable - }) - await stubDialog(electronApp, 'showMessageBox', { response: 1 }) - - page = await electronApp.firstWindow({ - timeout: TIMEOUT, - }) -}) - -test.afterAll(async () => { - await electronApp.close() - await page.close() -}) - -test('explores hub', async () => { - 
test.setTimeout(TIMEOUT) - await page.getByTestId('Hub').first().click({ - timeout: TIMEOUT, - }) - await page.getByTestId('hub-container-test-id').isVisible({ - timeout: TIMEOUT, - }) -}) diff --git a/electron/tests/navigation.e2e.spec.ts b/electron/tests/navigation.e2e.spec.ts deleted file mode 100644 index 5c8721c2fa..0000000000 --- a/electron/tests/navigation.e2e.spec.ts +++ /dev/null @@ -1,61 +0,0 @@ -import { _electron as electron } from 'playwright' -import { ElectronApplication, Page, expect, test } from '@playwright/test' - -import { - findLatestBuild, - parseElectronApp, - stubDialog, -} from 'electron-playwright-helpers' - -let electronApp: ElectronApplication -let page: Page -const TIMEOUT: number = parseInt(process.env.TEST_TIMEOUT || '300000') - -test.beforeAll(async () => { - process.env.CI = 'e2e' - - const latestBuild = findLatestBuild('dist') - expect(latestBuild).toBeTruthy() - - // parse the packaged Electron app and find paths and other info - const appInfo = parseElectronApp(latestBuild) - expect(appInfo).toBeTruthy() - - electronApp = await electron.launch({ - args: [appInfo.main], // main file from package.json - executablePath: appInfo.executable, // path to the Electron executable - }) - await stubDialog(electronApp, 'showMessageBox', { response: 1 }) - - page = await electronApp.firstWindow({ - timeout: TIMEOUT, - }) -}) - -test.afterAll(async () => { - await electronApp.close() - await page.close() -}) - -test('renders left navigation panel', async () => { - test.setTimeout(TIMEOUT) - const systemMonitorBtn = await page - .getByTestId('System Monitor') - .first() - .isEnabled({ - timeout: TIMEOUT, - }) - const settingsBtn = await page - .getByTestId('Thread') - .first() - .isEnabled({ timeout: TIMEOUT }) - expect([systemMonitorBtn, settingsBtn].filter((e) => !e).length).toBe(0) - // Chat section should be there - await page.getByTestId('Local API Server').first().click({ - timeout: TIMEOUT, - }) - const localServer = await 
page.getByTestId('local-server-testid').first() - await expect(localServer).toBeVisible({ - timeout: TIMEOUT, - }) -}) diff --git a/electron/tests/pages/basePage.ts b/electron/tests/pages/basePage.ts new file mode 100644 index 0000000000..4e16a3c232 --- /dev/null +++ b/electron/tests/pages/basePage.ts @@ -0,0 +1,49 @@ +import { Page, expect } from '@playwright/test' +import { CommonActions } from './commonActions' +import { TIMEOUT } from '../config/fixtures' + +export class BasePage { + menuId: string + + constructor( + protected readonly page: Page, + readonly action: CommonActions, + protected containerId: string + ) {} + + public getValue(key: string) { + return this.action.getValue(key) + } + + public setValue(key: string, value: string) { + this.action.setValue(key, value) + } + + async takeScreenshot(name: string = '') { + await this.action.takeScreenshot(name) + } + + async navigateByMenu() { + await this.page.getByTestId(this.menuId).first().click() + } + + async verifyContainerVisible() { + const container = this.page.getByTestId(this.containerId) + expect(container.isVisible()).toBeTruthy() + } + + async waitUpdateLoader() { + await this.isElementVisible('img[alt="Jan - Logo"]') + } + + //wait and find a specific element with it's selector and return Visible + async isElementVisible(selector: any) { + let isVisible = true + await this.page + .waitForSelector(selector, { state: 'visible', timeout: TIMEOUT }) + .catch(() => { + isVisible = false + }) + return isVisible + } +} diff --git a/electron/tests/pages/commonActions.ts b/electron/tests/pages/commonActions.ts new file mode 100644 index 0000000000..08ea15f92a --- /dev/null +++ b/electron/tests/pages/commonActions.ts @@ -0,0 +1,34 @@ +import { Page, TestInfo } from '@playwright/test' +import { page } from '../config/fixtures' + +export class CommonActions { + private testData = new Map() + + constructor( + public page: Page, + public testInfo: TestInfo + ) {} + + async takeScreenshot(name: string) { + 
const screenshot = await page.screenshot({ + fullPage: true, + }) + const attachmentName = `${this.testInfo.title}_${name || new Date().toISOString().slice(5, 19).replace(/[-:]/g, '').replace('T', '_')}` + await this.testInfo.attach(attachmentName.replace(/\s+/g, ''), { + body: screenshot, + contentType: 'image/png', + }) + } + + async hooks() { + console.log('hook from the scenario page') + } + + setValue(key: string, value: string) { + this.testData.set(key, value) + } + + getValue(key: string) { + return this.testData.get(key) + } +} diff --git a/electron/tests/pages/hubPage.ts b/electron/tests/pages/hubPage.ts new file mode 100644 index 0000000000..0299ab15d4 --- /dev/null +++ b/electron/tests/pages/hubPage.ts @@ -0,0 +1,15 @@ +import { Page } from '@playwright/test' +import { BasePage } from './basePage' +import { CommonActions } from './commonActions' + +export class HubPage extends BasePage { + readonly menuId: string = 'Hub' + static readonly containerId: string = 'hub-container-test-id' + + constructor( + public page: Page, + readonly action: CommonActions + ) { + super(page, action, HubPage.containerId) + } +} diff --git a/electron/tests/settings.e2e.spec.ts b/electron/tests/settings.e2e.spec.ts deleted file mode 100644 index ad2d7b4a49..0000000000 --- a/electron/tests/settings.e2e.spec.ts +++ /dev/null @@ -1,45 +0,0 @@ -import { _electron as electron } from 'playwright' -import { ElectronApplication, Page, expect, test } from '@playwright/test' - -import { - findLatestBuild, - parseElectronApp, - stubDialog, -} from 'electron-playwright-helpers' - -let electronApp: ElectronApplication -let page: Page -const TIMEOUT: number = parseInt(process.env.TEST_TIMEOUT || '300000') - -test.beforeAll(async () => { - process.env.CI = 'e2e' - - const latestBuild = findLatestBuild('dist') - expect(latestBuild).toBeTruthy() - - // parse the packaged Electron app and find paths and other info - const appInfo = parseElectronApp(latestBuild) - expect(appInfo).toBeTruthy() 
- - electronApp = await electron.launch({ - args: [appInfo.main], // main file from package.json - executablePath: appInfo.executable, // path to the Electron executable - }) - await stubDialog(electronApp, 'showMessageBox', { response: 1 }) - - page = await electronApp.firstWindow({ - timeout: TIMEOUT, - }) -}) - -test.afterAll(async () => { - await electronApp.close() - await page.close() -}) - -test('shows settings', async () => { - test.setTimeout(TIMEOUT) - await page.getByTestId('Settings').first().click({ timeout: TIMEOUT }) - const settingDescription = page.getByTestId('testid-setting-description') - await expect(settingDescription).toBeVisible({ timeout: TIMEOUT }) -}) diff --git a/electron/utils/dev.ts b/electron/utils/dev.ts new file mode 100644 index 0000000000..b2a4928866 --- /dev/null +++ b/electron/utils/dev.ts @@ -0,0 +1,18 @@ +import { app } from 'electron' + +export const setupReactDevTool = async () => { + if (!app.isPackaged) { + // Which means you're running from source code + const { default: installExtension, REACT_DEVELOPER_TOOLS } = await import( + 'electron-devtools-installer' + ) // Don't use import on top level, since the installer package is dev-only + try { + const name = await installExtension(REACT_DEVELOPER_TOOLS) + console.log(`Added Extension: ${name}`) + } catch (err) { + console.log('An error occurred while installing devtools:') + console.error(err) + // Only log the error and don't throw it because it's not critical + } + } +} diff --git a/electron/utils/disposable.ts b/electron/utils/disposable.ts index 462f7e3e51..59018a7751 100644 --- a/electron/utils/disposable.ts +++ b/electron/utils/disposable.ts @@ -1,8 +1,8 @@ export function dispose(requiredModules: Record) { for (const key in requiredModules) { - const module = requiredModules[key]; - if (typeof module["dispose"] === "function") { - module["dispose"](); + const module = requiredModules[key] + if (typeof module['dispose'] === 'function') { + module['dispose']() } } } 
diff --git a/electron/utils/log.ts b/electron/utils/log.ts new file mode 100644 index 0000000000..84c185d754 --- /dev/null +++ b/electron/utils/log.ts @@ -0,0 +1,67 @@ +import { getJanDataFolderPath } from '@janhq/core/node' +import * as fs from 'fs' +import * as path from 'path' + +export function cleanLogs( + maxFileSizeBytes?: number | undefined, + daysToKeep?: number | undefined, + delayMs?: number | undefined +): void { + const size = maxFileSizeBytes ?? 1 * 1024 * 1024 // 1 MB + const days = daysToKeep ?? 7 // 7 days + const delays = delayMs ?? 10000 // 10 seconds + const logDirectory = path.join(getJanDataFolderPath(), 'logs') + + // Perform log cleaning + const currentDate = new Date() + fs.readdir(logDirectory, (err, files) => { + if (err) { + console.error('Error reading log directory:', err) + return + } + + files.forEach((file) => { + const filePath = path.join(logDirectory, file) + fs.stat(filePath, (err, stats) => { + if (err) { + console.error('Error getting file stats:', err) + return + } + + // Check size + if (stats.size > size) { + fs.unlink(filePath, (err) => { + if (err) { + console.error('Error deleting log file:', err) + return + } + console.log( + `Deleted log file due to exceeding size limit: ${filePath}` + ) + }) + } else { + // Check age + const creationDate = new Date(stats.ctime) + const daysDifference = Math.floor( + (currentDate.getTime() - creationDate.getTime()) / + (1000 * 3600 * 24) + ) + if (daysDifference > days) { + fs.unlink(filePath, (err) => { + if (err) { + console.error('Error deleting log file:', err) + return + } + console.log(`Deleted old log file: ${filePath}`) + }) + } + } + }) + }) + }) + + // Schedule the next execution with doubled delays + setTimeout(() => { + cleanLogs(maxFileSizeBytes, daysToKeep, delays * 2) + }, delays) +} diff --git a/electron/utils/menu.ts b/electron/utils/menu.ts index 7721b7c78b..893907c48a 100644 --- a/electron/utils/menu.ts +++ b/electron/utils/menu.ts @@ -1,19 +1,41 @@ // @ts-nocheck 
-import { app, Menu, dialog, shell } from 'electron' -const isMac = process.platform === 'darwin' +import { app, Menu, shell, dialog } from 'electron' import { autoUpdater } from 'electron-updater' -import { compareSemanticVersions } from './versionDiff' +import { log } from '@janhq/core/node' +const isMac = process.platform === 'darwin' const template: (Electron.MenuItemConstructorOptions | Electron.MenuItem)[] = [ { label: app.name, submenu: [ - { role: 'about' }, + { + label: `About ${app.name}`, + click: () => + dialog.showMessageBox({ + title: `Jan`, + message: `Jan Version v${app.getVersion()}\n\nCopyright © 2024 Jan`, + }), + }, { label: 'Check for Updates...', click: () => // Check for updates and notify user if there are any - autoUpdater.checkForUpdatesAndNotify(), + autoUpdater + .checkForUpdatesAndNotify() + .then((updateCheckResult) => { + if ( + !updateCheckResult?.updateInfo || + updateCheckResult?.updateInfo.version === app.getVersion() + ) { + dialog.showMessageBox({ + message: `No updates available.`, + }) + return + } + }) + .catch((error) => { + log('Error checking for updates:' + JSON.stringify(error)) + }), }, { type: 'separator' }, { role: 'services' }, diff --git a/electron/utils/path.ts b/electron/utils/path.ts index 4e47cc312b..4438156bcb 100644 --- a/electron/utils/path.ts +++ b/electron/utils/path.ts @@ -1,5 +1,3 @@ -import { join } from 'path' -import { app } from 'electron' import { mkdir } from 'fs-extra' import { existsSync } from 'fs' import { getJanDataFolderPath } from '@janhq/core/node' @@ -16,13 +14,3 @@ export async function createUserSpace(): Promise { } } } - -export function getResourcePath() { - let appPath = join(app.getAppPath(), '..', 'app.asar.unpacked') - - if (!app.isPackaged) { - // for development mode - appPath = join(__dirname, '..', '..') - } - return appPath -} diff --git a/electron/utils/setup.ts b/electron/utils/setup.ts index 887c3c2b7a..01b0b31da2 100644 --- a/electron/utils/setup.ts +++ 
b/electron/utils/setup.ts @@ -1,9 +1,9 @@ import { app } from 'electron' export const setupCore = async () => { - // Setup core api for main process - global.core = { - // Define appPath function for app to retrieve app path globaly - appPath: () => app.getPath('userData') - } -} \ No newline at end of file + // Setup core api for main process + global.core = { + // Define appPath function for app to retrieve app path globaly + appPath: () => app.getPath('userData'), + } +} diff --git a/electron/utils/versionDiff.ts b/electron/utils/versionDiff.ts deleted file mode 100644 index 25934e87f0..0000000000 --- a/electron/utils/versionDiff.ts +++ /dev/null @@ -1,21 +0,0 @@ -export const compareSemanticVersions = (a: string, b: string) => { - - // 1. Split the strings into their parts. - const a1 = a.split('.'); - const b1 = b.split('.'); - // 2. Contingency in case there's a 4th or 5th version - const len = Math.min(a1.length, b1.length); - // 3. Look through each version number and compare. - for (let i = 0; i < len; i++) { - const a2 = +a1[ i ] || 0; - const b2 = +b1[ i ] || 0; - - if (a2 !== b2) { - return a2 > b2 ? 1 : -1; - } - } - - // 4. 
We hit this if the all checked versions so far are equal - // - return b1.length - a1.length; -}; \ No newline at end of file diff --git a/extensions/assistant-extension/package.json b/extensions/assistant-extension/package.json index 84bcdf47e2..baa8586557 100644 --- a/extensions/assistant-extension/package.json +++ b/extensions/assistant-extension/package.json @@ -1,16 +1,17 @@ { "name": "@janhq/assistant-extension", - "version": "1.0.0", + "version": "1.0.1", "description": "This extension enables assistants, including Jan, a default assistant that can call all downloaded models", "main": "dist/index.js", "node": "dist/node/index.js", "author": "Jan ", "license": "AGPL-3.0", "scripts": { - "build": "tsc --module commonjs && rollup -c rollup.config.ts", - "build:publish:linux": "rimraf *.tgz --glob && npm run build && npm pack && cpx *.tgz ../../electron/pre-install", - "build:publish:darwin": "rimraf *.tgz --glob && npm run build && ../../.github/scripts/auto-sign.sh && npm pack && cpx *.tgz ../../electron/pre-install", - "build:publish:win32": "rimraf *.tgz --glob && npm run build && npm pack && cpx *.tgz ../../electron/pre-install", + "clean:modules": "rimraf node_modules/pdf-parse/test && cd node_modules/pdf-parse/lib/pdf.js && rimraf v1.9.426 v1.10.88 v2.0.550", + "build": "yarn clean:modules && tsc --module commonjs && rollup -c rollup.config.ts", + "build:publish:linux": "rimraf *.tgz --glob && npm run build && npm pack && cpx *.tgz ../../pre-install", + "build:publish:darwin": "rimraf *.tgz --glob && npm run build && ../../.github/scripts/auto-sign.sh && npm pack && cpx *.tgz ../../pre-install", + "build:publish:win32": "rimraf *.tgz --glob && npm run build && npm pack && cpx *.tgz ../../pre-install", "build:publish": "run-script-os" }, "devDependencies": { @@ -25,7 +26,7 @@ "rollup-plugin-define": "^1.0.1", "rollup-plugin-sourcemaps": "^0.6.3", "rollup-plugin-typescript2": "^0.36.0", - "typescript": "^5.3.3", + "typescript": "^5.2.2", "run-script-os": 
"^1.1.6" }, "dependencies": { @@ -44,9 +45,6 @@ ], "bundleDependencies": [ "@janhq/core", - "@langchain/community", - "hnswlib-node", - "langchain", - "pdf-parse" + "hnswlib-node" ] } diff --git a/extensions/assistant-extension/rollup.config.ts b/extensions/assistant-extension/rollup.config.ts index 7916ef9c82..d3c39cab2d 100644 --- a/extensions/assistant-extension/rollup.config.ts +++ b/extensions/assistant-extension/rollup.config.ts @@ -1,22 +1,22 @@ -import resolve from "@rollup/plugin-node-resolve"; -import commonjs from "@rollup/plugin-commonjs"; -import sourceMaps from "rollup-plugin-sourcemaps"; -import typescript from "rollup-plugin-typescript2"; -import json from "@rollup/plugin-json"; -import replace from "@rollup/plugin-replace"; +import resolve from '@rollup/plugin-node-resolve' +import commonjs from '@rollup/plugin-commonjs' +import sourceMaps from 'rollup-plugin-sourcemaps' +import typescript from 'rollup-plugin-typescript2' +import json from '@rollup/plugin-json' +import replace from '@rollup/plugin-replace' -const packageJson = require("./package.json"); +const packageJson = require('./package.json') -const pkg = require("./package.json"); +const pkg = require('./package.json') export default [ { input: `src/index.ts`, - output: [{ file: pkg.main, format: "es", sourcemap: true }], + output: [{ file: pkg.main, format: 'es', sourcemap: true }], // Indicate here external modules you don't wanna include in your bundle (i.e.: 'lodash') external: [], watch: { - include: "src/**", + include: 'src/**', }, plugins: [ replace({ @@ -35,7 +35,7 @@ export default [ // which external modules to include in the bundle // https://github.com/rollup/rollup-plugin-node-resolve#usage resolve({ - extensions: [".js", ".ts", ".svelte"], + extensions: ['.js', '.ts', '.svelte'], }), // Resolve source maps to the original source @@ -44,18 +44,11 @@ export default [ }, { input: `src/node/index.ts`, - output: [{ dir: "dist/node", format: "cjs", sourcemap: false }], + output: [{ 
dir: 'dist/node', format: 'cjs', sourcemap: false }], // Indicate here external modules you don't wanna include in your bundle (i.e.: 'lodash') - external: [ - "@janhq/core/node", - "@langchain/community", - "langchain", - "langsmith", - "path", - "hnswlib-node", - ], + external: ['@janhq/core/node', 'path', 'hnswlib-node'], watch: { - include: "src/node/**", + include: 'src/node/**', }, // inlineDynamicImports: true, plugins: [ @@ -71,11 +64,11 @@ export default [ // which external modules to include in the bundle // https://github.com/rollup/rollup-plugin-node-resolve#usage resolve({ - extensions: [".ts", ".js", ".json"], + extensions: ['.ts', '.js', '.json'], }), // Resolve source maps to the original source // sourceMaps(), ], }, -]; +] diff --git a/extensions/assistant-extension/src/@types/global.d.ts b/extensions/assistant-extension/src/@types/global.d.ts index dc11709a4f..bc97157cdf 100644 --- a/extensions/assistant-extension/src/@types/global.d.ts +++ b/extensions/assistant-extension/src/@types/global.d.ts @@ -1,3 +1,3 @@ -declare const NODE: string; -declare const EXTENSION_NAME: string; -declare const VERSION: string; +declare const NODE: string +declare const EXTENSION_NAME: string +declare const VERSION: string diff --git a/extensions/assistant-extension/src/index.ts b/extensions/assistant-extension/src/index.ts index 6495ea7869..0a5319c8a7 100644 --- a/extensions/assistant-extension/src/index.ts +++ b/extensions/assistant-extension/src/index.ts @@ -9,143 +9,169 @@ import { joinPath, executeOnMain, AssistantExtension, -} from "@janhq/core"; + AssistantEvent, +} from '@janhq/core' export default class JanAssistantExtension extends AssistantExtension { - private static readonly _homeDir = "file://assistants"; + private static readonly _homeDir = 'file://assistants' + private static readonly _threadDir = 'file://threads' - controller = new AbortController(); - isCancelled = false; - retrievalThreadId: string | undefined = undefined; + controller = new 
AbortController() + isCancelled = false + retrievalThreadId: string | undefined = undefined async onLoad() { // making the assistant directory const assistantDirExist = await fs.existsSync( - JanAssistantExtension._homeDir, - ); + JanAssistantExtension._homeDir + ) if ( localStorage.getItem(`${EXTENSION_NAME}-version`) !== VERSION || !assistantDirExist ) { - if (!assistantDirExist) - await fs.mkdirSync(JanAssistantExtension._homeDir); + if (!assistantDirExist) await fs.mkdirSync(JanAssistantExtension._homeDir) // Write assistant metadata - this.createJanAssistant(); + await this.createJanAssistant() // Finished migration - localStorage.setItem(`${EXTENSION_NAME}-version`, VERSION); + localStorage.setItem(`${EXTENSION_NAME}-version`, VERSION) + // Update the assistant list + events.emit(AssistantEvent.OnAssistantsUpdate, {}) } // Events subscription events.on(MessageEvent.OnMessageSent, (data: MessageRequest) => - JanAssistantExtension.handleMessageRequest(data, this), - ); + JanAssistantExtension.handleMessageRequest(data, this) + ) events.on(InferenceEvent.OnInferenceStopped, () => { - JanAssistantExtension.handleInferenceStopped(this); - }); + JanAssistantExtension.handleInferenceStopped(this) + }) } private static async handleInferenceStopped(instance: JanAssistantExtension) { - instance.isCancelled = true; - instance.controller?.abort(); + instance.isCancelled = true + instance.controller?.abort() } private static async handleMessageRequest( data: MessageRequest, - instance: JanAssistantExtension, + instance: JanAssistantExtension ) { - instance.isCancelled = false; - instance.controller = new AbortController(); + instance.isCancelled = false + instance.controller = new AbortController() if ( data.model?.engine !== InferenceEngine.tool_retrieval_enabled || !data.messages || + // TODO: Since the engine is defined, its unsafe to assume that assistant tools are defined + // That could lead to an issue where thread stuck at generating response 
!data.thread?.assistants[0]?.tools ) { - return; + return } - const latestMessage = data.messages[data.messages.length - 1]; + const latestMessage = data.messages[data.messages.length - 1] - // Ingest the document if needed + // 1. Ingest the document if needed if ( latestMessage && latestMessage.content && - typeof latestMessage.content !== "string" + typeof latestMessage.content !== 'string' && + latestMessage.content.length > 1 ) { - const docFile = latestMessage.content[1]?.doc_url?.url; + const docFile = latestMessage.content[1]?.doc_url?.url if (docFile) { await executeOnMain( NODE, - "toolRetrievalIngestNewDocument", + 'toolRetrievalIngestNewDocument', docFile, - data.model?.proxyEngine, - ); + data.model?.proxyEngine + ) + } + } else if ( + // Check whether we need to ingest document or not + // Otherwise wrong context will be sent + !(await fs.existsSync( + await joinPath([ + JanAssistantExtension._threadDir, + data.threadId, + 'memory', + ]) + )) + ) { + // No document ingested, reroute the result to inference engine + const output = { + ...data, + model: { + ...data.model, + engine: data.model.proxyEngine, + }, } + events.emit(MessageEvent.OnMessageSent, output) + return } - - // Load agent on thread changed + // 2. Load agent on thread changed if (instance.retrievalThreadId !== data.threadId) { - await executeOnMain(NODE, "toolRetrievalLoadThreadMemory", data.threadId); + await executeOnMain(NODE, 'toolRetrievalLoadThreadMemory', data.threadId) - instance.retrievalThreadId = data.threadId; + instance.retrievalThreadId = data.threadId // Update the text splitter await executeOnMain( NODE, - "toolRetrievalUpdateTextSplitter", + 'toolRetrievalUpdateTextSplitter', data.thread.assistants[0].tools[0]?.settings?.chunk_size ?? 4000, - data.thread.assistants[0].tools[0]?.settings?.chunk_overlap ?? 200, - ); + data.thread.assistants[0].tools[0]?.settings?.chunk_overlap ?? 200 + ) } + // 3. 
Using the retrieval template with the result and query if (latestMessage.content) { const prompt = - typeof latestMessage.content === "string" + typeof latestMessage.content === 'string' ? latestMessage.content - : latestMessage.content[0].text; + : latestMessage.content[0].text // Retrieve the result - console.debug("toolRetrievalQuery", latestMessage.content); const retrievalResult = await executeOnMain( NODE, - "toolRetrievalQueryResult", - prompt, - ); + 'toolRetrievalQueryResult', + prompt + ) + console.debug('toolRetrievalQueryResult', retrievalResult) - // Update the message content - // Using the retrieval template with the result and query - if (data.thread?.assistants[0].tools) + // Update message content + if (data.thread?.assistants[0]?.tools && retrievalResult) data.messages[data.messages.length - 1].content = data.thread.assistants[0].tools[0].settings?.retrieval_template - ?.replace("{CONTEXT}", retrievalResult) - .replace("{QUESTION}", prompt); + ?.replace('{CONTEXT}', retrievalResult) + .replace('{QUESTION}', prompt) } // Filter out all the messages that are not text data.messages = data.messages.map((message) => { if ( message.content && - typeof message.content !== "string" && + typeof message.content !== 'string' && (message.content.length ?? 0) > 0 ) { return { ...message, content: [message.content[0]], - }; + } } - return message; - }); + return message + }) - // Reroute the result to inference engine + // 4. 
Reroute the result to inference engine const output = { ...data, model: { ...data.model, engine: data.model.proxyEngine, }, - }; - events.emit(MessageEvent.OnMessageSent, output); + } + events.emit(MessageEvent.OnMessageSent, output) } /** @@ -157,107 +183,107 @@ export default class JanAssistantExtension extends AssistantExtension { const assistantDir = await joinPath([ JanAssistantExtension._homeDir, assistant.id, - ]); - if (!(await fs.existsSync(assistantDir))) await fs.mkdirSync(assistantDir); + ]) + if (!(await fs.existsSync(assistantDir))) await fs.mkdirSync(assistantDir) // store the assistant metadata json const assistantMetadataPath = await joinPath([ assistantDir, - "assistant.json", - ]); + 'assistant.json', + ]) try { await fs.writeFileSync( assistantMetadataPath, - JSON.stringify(assistant, null, 2), - ); + JSON.stringify(assistant, null, 2) + ) } catch (err) { - console.error(err); + console.error(err) } } async getAssistants(): Promise { // get all the assistant directories // get all the assistant metadata json - const results: Assistant[] = []; + const results: Assistant[] = [] const allFileName: string[] = await fs.readdirSync( - JanAssistantExtension._homeDir, - ); + JanAssistantExtension._homeDir + ) for (const fileName of allFileName) { const filePath = await joinPath([ JanAssistantExtension._homeDir, fileName, - ]); + ]) - if (filePath.includes(".DS_Store")) continue; + if (filePath.includes('.DS_Store')) continue const jsonFiles: string[] = (await fs.readdirSync(filePath)).filter( - (file: string) => file === "assistant.json", - ); + (file: string) => file === 'assistant.json' + ) if (jsonFiles.length !== 1) { // has more than one assistant file -> ignore - continue; + continue } const content = await fs.readFileSync( await joinPath([filePath, jsonFiles[0]]), - "utf-8", - ); + 'utf-8' + ) const assistant: Assistant = - typeof content === "object" ? content : JSON.parse(content); + typeof content === 'object' ? 
content : JSON.parse(content) - results.push(assistant); + results.push(assistant) } - return results; + return results } async deleteAssistant(assistant: Assistant): Promise { - if (assistant.id === "jan") { - return Promise.reject("Cannot delete Jan Assistant"); + if (assistant.id === 'jan') { + return Promise.reject('Cannot delete Jan Assistant') } // remove the directory const assistantDir = await joinPath([ JanAssistantExtension._homeDir, assistant.id, - ]); - await fs.rmdirSync(assistantDir); - return Promise.resolve(); + ]) + await fs.rmdirSync(assistantDir) + return Promise.resolve() } private async createJanAssistant(): Promise { const janAssistant: Assistant = { - avatar: "", + avatar: '', thread_location: undefined, - id: "jan", - object: "assistant", + id: 'jan', + object: 'assistant', created_at: Date.now(), - name: "Jan", - description: "A default assistant that can use all downloaded models", - model: "*", - instructions: "", + name: 'Jan', + description: 'A default assistant that can use all downloaded models', + model: '*', + instructions: '', tools: [ { - type: "retrieval", + type: 'retrieval', enabled: false, settings: { top_k: 2, chunk_size: 1024, chunk_overlap: 64, retrieval_template: `Use the following pieces of context to answer the question at the end. If you don't know the answer, just say that you don't know, don't try to make up an answer. 
- ---------------- - CONTEXT: {CONTEXT} - ---------------- - QUESTION: {QUESTION} - ---------------- - Helpful Answer:`, +---------------- +CONTEXT: {CONTEXT} +---------------- +QUESTION: {QUESTION} +---------------- +Helpful Answer:`, }, }, ], file_ids: [], metadata: undefined, - }; + } - await this.createAssistant(janAssistant); + await this.createAssistant(janAssistant) } } diff --git a/extensions/assistant-extension/src/node/engine.ts b/extensions/assistant-extension/src/node/engine.ts index 54b2a6ba16..70d02af1f5 100644 --- a/extensions/assistant-extension/src/node/engine.ts +++ b/extensions/assistant-extension/src/node/engine.ts @@ -1,13 +1,13 @@ -import fs from "fs"; -import path from "path"; -import { getJanDataFolderPath } from "@janhq/core/node"; +import fs from 'fs' +import path from 'path' +import { getJanDataFolderPath } from '@janhq/core/node' // Sec: Do not send engine settings over requests // Read it manually instead export const readEmbeddingEngine = (engineName: string) => { const engineSettings = fs.readFileSync( - path.join(getJanDataFolderPath(), "engines", `${engineName}.json`), - "utf-8", - ); - return JSON.parse(engineSettings); -}; + path.join(getJanDataFolderPath(), 'engines', `${engineName}.json`), + 'utf-8' + ) + return JSON.parse(engineSettings) +} diff --git a/extensions/assistant-extension/src/node/index.ts b/extensions/assistant-extension/src/node/index.ts index 95a7243a43..d52a4b23e3 100644 --- a/extensions/assistant-extension/src/node/index.ts +++ b/extensions/assistant-extension/src/node/index.ts @@ -1,39 +1,39 @@ -import { getJanDataFolderPath, normalizeFilePath } from "@janhq/core/node"; -import { Retrieval } from "./tools/retrieval"; -import path from "path"; +import { getJanDataFolderPath, normalizeFilePath } from '@janhq/core/node' +import { retrieval } from './tools/retrieval' +import path from 'path' -const retrieval = new Retrieval(); - -export async function toolRetrievalUpdateTextSplitter( +export function 
toolRetrievalUpdateTextSplitter( chunkSize: number, - chunkOverlap: number, + chunkOverlap: number ) { - retrieval.updateTextSplitter(chunkSize, chunkOverlap); - return Promise.resolve(); + retrieval.updateTextSplitter(chunkSize, chunkOverlap) } export async function toolRetrievalIngestNewDocument( file: string, - engine: string, + engine: string ) { - const filePath = path.join(getJanDataFolderPath(), normalizeFilePath(file)); - const threadPath = path.dirname(filePath.replace("files", "")); - retrieval.updateEmbeddingEngine(engine); - await retrieval.ingestAgentKnowledge(filePath, `${threadPath}/memory`); - return Promise.resolve(); + const filePath = path.join(getJanDataFolderPath(), normalizeFilePath(file)) + const threadPath = path.dirname(filePath.replace('files', '')) + retrieval.updateEmbeddingEngine(engine) + return retrieval + .ingestAgentKnowledge(filePath, `${threadPath}/memory`) + .catch((err) => { + console.error(err) + }) } export async function toolRetrievalLoadThreadMemory(threadId: string) { - try { - await retrieval.loadRetrievalAgent( - path.join(getJanDataFolderPath(), "threads", threadId, "memory"), - ); - return Promise.resolve(); - } catch (err) { - console.debug(err); - } + return retrieval + .loadRetrievalAgent( + path.join(getJanDataFolderPath(), 'threads', threadId, 'memory') + ) + .catch((err) => { + console.error(err) + }) } export async function toolRetrievalQueryResult(query: string) { - const res = await retrieval.generateResult(query); - return Promise.resolve(res); + return retrieval.generateResult(query).catch((err) => { + console.error(err) + }) } diff --git a/extensions/assistant-extension/src/node/tools/retrieval/index.ts b/extensions/assistant-extension/src/node/tools/retrieval/index.ts index 8c7a6aa2bc..e58ec0c46c 100644 --- a/extensions/assistant-extension/src/node/tools/retrieval/index.ts +++ b/extensions/assistant-extension/src/node/tools/retrieval/index.ts @@ -1,77 +1,80 @@ -import { RecursiveCharacterTextSplitter } from 
"langchain/text_splitter"; -import { formatDocumentsAsString } from "langchain/util/document"; -import { PDFLoader } from "langchain/document_loaders/fs/pdf"; +import { RecursiveCharacterTextSplitter } from 'langchain/text_splitter' +import { formatDocumentsAsString } from 'langchain/util/document' +import { PDFLoader } from 'langchain/document_loaders/fs/pdf' -import { HNSWLib } from "langchain/vectorstores/hnswlib"; +import { HNSWLib } from 'langchain/vectorstores/hnswlib' -import { OpenAIEmbeddings } from "langchain/embeddings/openai"; -import { readEmbeddingEngine } from "../../engine"; +import { OpenAIEmbeddings } from 'langchain/embeddings/openai' +import { readEmbeddingEngine } from '../../engine' export class Retrieval { - public chunkSize: number = 100; - public chunkOverlap?: number = 0; - private retriever: any; + public chunkSize: number = 100 + public chunkOverlap?: number = 0 + private retriever: any - private embeddingModel?: OpenAIEmbeddings = undefined; - private textSplitter?: RecursiveCharacterTextSplitter; + private embeddingModel?: OpenAIEmbeddings = undefined + private textSplitter?: RecursiveCharacterTextSplitter constructor(chunkSize: number = 4000, chunkOverlap: number = 200) { - this.updateTextSplitter(chunkSize, chunkOverlap); + this.updateTextSplitter(chunkSize, chunkOverlap) } public updateTextSplitter(chunkSize: number, chunkOverlap: number): void { - this.chunkSize = chunkSize; - this.chunkOverlap = chunkOverlap; + this.chunkSize = chunkSize + this.chunkOverlap = chunkOverlap this.textSplitter = new RecursiveCharacterTextSplitter({ chunkSize: chunkSize, chunkOverlap: chunkOverlap, - }); + }) } public updateEmbeddingEngine(engine: string): void { // Engine settings are not compatible with the current embedding model params // Switch case manually for now - const settings = readEmbeddingEngine(engine); - if (engine === "nitro") { + const settings = readEmbeddingEngine(engine) + if (engine === 'nitro') { this.embeddingModel = new 
OpenAIEmbeddings( - { openAIApiKey: "nitro-embedding" }, - { basePath: "http://127.0.0.1:3928/v1" }, - ); + { openAIApiKey: 'nitro-embedding' }, + // TODO: Raw settings + { basePath: 'http://127.0.0.1:3928/v1' } + ) } else { // Fallback to OpenAI Settings this.embeddingModel = new OpenAIEmbeddings({ openAIApiKey: settings.api_key, - }); + }) } } public ingestAgentKnowledge = async ( filePath: string, - memoryPath: string, + memoryPath: string ): Promise => { const loader = new PDFLoader(filePath, { splitPages: true, - }); - if (!this.embeddingModel) return Promise.reject(); - const doc = await loader.load(); - const docs = await this.textSplitter!.splitDocuments(doc); - const vectorStore = await HNSWLib.fromDocuments(docs, this.embeddingModel); - return vectorStore.save(memoryPath); - }; + }) + if (!this.embeddingModel) return Promise.reject() + const doc = await loader.load() + const docs = await this.textSplitter!.splitDocuments(doc) + const vectorStore = await HNSWLib.fromDocuments(docs, this.embeddingModel) + return vectorStore.save(memoryPath) + } public loadRetrievalAgent = async (memoryPath: string): Promise => { - if (!this.embeddingModel) return Promise.reject(); - const vectorStore = await HNSWLib.load(memoryPath, this.embeddingModel); - this.retriever = vectorStore.asRetriever(2); - return Promise.resolve(); - }; + if (!this.embeddingModel) return Promise.reject() + const vectorStore = await HNSWLib.load(memoryPath, this.embeddingModel) + this.retriever = vectorStore.asRetriever(2) + return Promise.resolve() + } public generateResult = async (query: string): Promise => { if (!this.retriever) { - return Promise.resolve(" "); + return Promise.resolve(' ') } - const relevantDocs = await this.retriever.getRelevantDocuments(query); - const serializedDoc = formatDocumentsAsString(relevantDocs); - return Promise.resolve(serializedDoc); - }; + const relevantDocs = await this.retriever.getRelevantDocuments(query) + const serializedDoc = 
formatDocumentsAsString(relevantDocs) + return Promise.resolve(serializedDoc) + } } + +export const retrieval = new Retrieval() diff --git a/extensions/assistant-extension/tsconfig.json b/extensions/assistant-extension/tsconfig.json index d3794cace9..e425358c35 100644 --- a/extensions/assistant-extension/tsconfig.json +++ b/extensions/assistant-extension/tsconfig.json @@ -14,7 +14,7 @@ "outDir": "dist", "importHelpers": true, "typeRoots": ["node_modules/@types"], - "skipLibCheck": true, + "skipLibCheck": true }, - "include": ["src"], + "include": ["src"] } diff --git a/extensions/conversational-extension/.prettierrc b/extensions/conversational-extension/.prettierrc deleted file mode 100644 index 46f1abcb02..0000000000 --- a/extensions/conversational-extension/.prettierrc +++ /dev/null @@ -1,8 +0,0 @@ -{ - "semi": false, - "singleQuote": true, - "quoteProps": "consistent", - "trailingComma": "es5", - "endOfLine": "auto", - "plugins": ["prettier-plugin-tailwindcss"] -} diff --git a/extensions/conversational-extension/package.json b/extensions/conversational-extension/package.json index a60c12339f..8a6da14e50 100644 --- a/extensions/conversational-extension/package.json +++ b/extensions/conversational-extension/package.json @@ -7,7 +7,7 @@ "license": "MIT", "scripts": { "build": "tsc -b . 
&& webpack --config webpack.config.js", - "build:publish": "rimraf *.tgz --glob && npm run build && npm pack && cpx *.tgz ../../electron/pre-install" + "build:publish": "rimraf *.tgz --glob && npm run build && npm pack && cpx *.tgz ../../pre-install" }, "exports": { ".": "./dist/index.js", @@ -17,12 +17,12 @@ "cpx": "^1.5.0", "rimraf": "^3.0.2", "webpack": "^5.88.2", - "webpack-cli": "^5.1.4" + "webpack-cli": "^5.1.4", + "ts-loader": "^9.5.0" }, "dependencies": { "@janhq/core": "file:../../core", - "path-browserify": "^1.0.1", - "ts-loader": "^9.5.0" + "path-browserify": "^1.0.1" }, "engines": { "node": ">=18.0.0" diff --git a/extensions/conversational-extension/src/index.ts b/extensions/conversational-extension/src/index.ts index 3d28a9c1d5..bf8c213add 100644 --- a/extensions/conversational-extension/src/index.ts +++ b/extensions/conversational-extension/src/index.ts @@ -12,7 +12,7 @@ import { * functionality for managing threads. */ export default class JSONConversationalExtension extends ConversationalExtension { - private static readonly _homeDir = 'file://threads' + private static readonly _threadFolder = 'file://threads' private static readonly _threadInfoFileName = 'thread.json' private static readonly _threadMessagesFileName = 'messages.jsonl' @@ -20,8 +20,8 @@ export default class JSONConversationalExtension extends ConversationalExtension * Called when the extension is loaded. 
*/ async onLoad() { - if (!(await fs.existsSync(JSONConversationalExtension._homeDir))) - await fs.mkdirSync(JSONConversationalExtension._homeDir) + if (!(await fs.existsSync(JSONConversationalExtension._threadFolder))) + await fs.mkdirSync(JSONConversationalExtension._threadFolder) console.debug('JSONConversationalExtension loaded') } @@ -68,7 +68,7 @@ export default class JSONConversationalExtension extends ConversationalExtension async saveThread(thread: Thread): Promise { try { const threadDirPath = await joinPath([ - JSONConversationalExtension._homeDir, + JSONConversationalExtension._threadFolder, thread.id, ]) const threadJsonPath = await joinPath([ @@ -92,7 +92,7 @@ export default class JSONConversationalExtension extends ConversationalExtension */ async deleteThread(threadId: string): Promise { const path = await joinPath([ - JSONConversationalExtension._homeDir, + JSONConversationalExtension._threadFolder, `${threadId}`, ]) try { @@ -109,7 +109,7 @@ export default class JSONConversationalExtension extends ConversationalExtension async addNewMessage(message: ThreadMessage): Promise { try { const threadDirPath = await joinPath([ - JSONConversationalExtension._homeDir, + JSONConversationalExtension._threadFolder, message.thread_id, ]) const threadMessagePath = await joinPath([ @@ -177,7 +177,7 @@ export default class JSONConversationalExtension extends ConversationalExtension ): Promise { try { const threadDirPath = await joinPath([ - JSONConversationalExtension._homeDir, + JSONConversationalExtension._threadFolder, threadId, ]) const threadMessagePath = await joinPath([ @@ -205,7 +205,7 @@ export default class JSONConversationalExtension extends ConversationalExtension private async readThread(threadDirName: string): Promise { return fs.readFileSync( await joinPath([ - JSONConversationalExtension._homeDir, + JSONConversationalExtension._threadFolder, threadDirName, JSONConversationalExtension._threadInfoFileName, ]), @@ -219,14 +219,14 @@ export default 
class JSONConversationalExtension extends ConversationalExtension */ private async getValidThreadDirs(): Promise { const fileInsideThread: string[] = await fs.readdirSync( - JSONConversationalExtension._homeDir + JSONConversationalExtension._threadFolder ) const threadDirs: string[] = [] for (let i = 0; i < fileInsideThread.length; i++) { if (fileInsideThread[i].includes('.DS_Store')) continue const path = await joinPath([ - JSONConversationalExtension._homeDir, + JSONConversationalExtension._threadFolder, fileInsideThread[i], ]) @@ -246,7 +246,7 @@ export default class JSONConversationalExtension extends ConversationalExtension async getAllMessages(threadId: string): Promise { try { const threadDirPath = await joinPath([ - JSONConversationalExtension._homeDir, + JSONConversationalExtension._threadFolder, threadId, ]) @@ -263,22 +263,17 @@ export default class JSONConversationalExtension extends ConversationalExtension JSONConversationalExtension._threadMessagesFileName, ]) - const result = await fs - .readFileSync(messageFilePath, 'utf-8') - .then((content) => - content - .toString() - .split('\n') - .filter((line) => line !== '') - ) + let readResult = await fs.readFileSync(messageFilePath, 'utf-8') + + if (typeof readResult === 'object') { + readResult = JSON.stringify(readResult) + } + + const result = readResult.split('\n').filter((line) => line !== '') const messages: ThreadMessage[] = [] result.forEach((line: string) => { - try { - messages.push(JSON.parse(line) as ThreadMessage) - } catch (err) { - console.error(err) - } + messages.push(JSON.parse(line)) }) return messages } catch (err) { diff --git a/extensions/conversational-extension/webpack.config.js b/extensions/conversational-extension/webpack.config.js index 36e3382953..a3eb873d71 100644 --- a/extensions/conversational-extension/webpack.config.js +++ b/extensions/conversational-extension/webpack.config.js @@ -1,27 +1,27 @@ -const path = require("path"); -const webpack = require("webpack"); +const 
path = require('path') +const webpack = require('webpack') module.exports = { experiments: { outputModule: true }, - entry: "./src/index.ts", // Adjust the entry point to match your project's main file - mode: "production", + entry: './src/index.ts', // Adjust the entry point to match your project's main file + mode: 'production', module: { rules: [ { test: /\.tsx?$/, - use: "ts-loader", + use: 'ts-loader', exclude: /node_modules/, }, ], }, output: { - filename: "index.js", // Adjust the output file name as needed - path: path.resolve(__dirname, "dist"), - library: { type: "module" }, // Specify ESM output format + filename: 'index.js', // Adjust the output file name as needed + path: path.resolve(__dirname, 'dist'), + library: { type: 'module' }, // Specify ESM output format }, plugins: [new webpack.DefinePlugin({})], resolve: { - extensions: [".ts", ".js"], + extensions: ['.ts', '.js'], fallback: { path: require.resolve('path-browserify'), }, @@ -31,4 +31,4 @@ module.exports = { minimize: false, }, // Add loaders and other configuration as needed for your project -}; +} diff --git a/extensions/inference-nitro-extension/README.md b/extensions/inference-nitro-extension/README.md index 455783efb1..f499e0b9c5 100644 --- a/extensions/inference-nitro-extension/README.md +++ b/extensions/inference-nitro-extension/README.md @@ -64,10 +64,10 @@ There are a few things to keep in mind when writing your plugin code: In `index.ts`, you will see that the extension function will return a `Promise`. ```typescript - import { core } from "@janhq/core"; + import { core } from '@janhq/core' function onStart(): Promise { - return core.invokePluginFunc(MODULE_PATH, "run", 0); + return core.invokePluginFunc(MODULE_PATH, 'run', 0) } ``` @@ -75,4 +75,3 @@ There are a few things to keep in mind when writing your plugin code: [documentation](https://github.com/janhq/jan/blob/main/core/README.md). So, what are you waiting for? Go ahead and start customizing your plugin! 
- diff --git a/extensions/inference-nitro-extension/bin/version.txt b/extensions/inference-nitro-extension/bin/version.txt index c2c0004f0e..0b9c019963 100644 --- a/extensions/inference-nitro-extension/bin/version.txt +++ b/extensions/inference-nitro-extension/bin/version.txt @@ -1 +1 @@ -0.3.5 +0.3.12 diff --git a/extensions/inference-nitro-extension/download.bat b/extensions/inference-nitro-extension/download.bat index 22e1c85b35..2ef3165c16 100644 --- a/extensions/inference-nitro-extension/download.bat +++ b/extensions/inference-nitro-extension/download.bat @@ -1,3 +1,3 @@ @echo off set /p NITRO_VERSION=<./bin/version.txt -.\node_modules\.bin\download https://github.com/janhq/nitro/releases/download/v%NITRO_VERSION%/nitro-%NITRO_VERSION%-win-amd64-cuda-12-0.tar.gz -e --strip 1 -o ./bin/win-cuda-12-0 && .\node_modules\.bin\download https://github.com/janhq/nitro/releases/download/v%NITRO_VERSION%/nitro-%NITRO_VERSION%-win-amd64-cuda-11-7.tar.gz -e --strip 1 -o ./bin/win-cuda-11-7 && .\node_modules\.bin\download https://github.com/janhq/nitro/releases/download/v%NITRO_VERSION%/nitro-%NITRO_VERSION%-win-amd64.tar.gz -e --strip 1 -o ./bin/win-cpu +.\node_modules\.bin\download https://github.com/janhq/nitro/releases/download/v%NITRO_VERSION%/nitro-%NITRO_VERSION%-win-amd64-cuda-12-0.tar.gz -e --strip 1 -o ./bin/win-cuda-12-0 && .\node_modules\.bin\download https://github.com/janhq/nitro/releases/download/v%NITRO_VERSION%/nitro-%NITRO_VERSION%-win-amd64-cuda-11-7.tar.gz -e --strip 1 -o ./bin/win-cuda-11-7 && .\node_modules\.bin\download https://github.com/janhq/nitro/releases/download/v%NITRO_VERSION%/nitro-%NITRO_VERSION%-win-amd64.tar.gz -e --strip 1 -o ./bin/win-cpu && .\node_modules\.bin\download https://github.com/janhq/nitro/releases/download/v%NITRO_VERSION%/nitro-%NITRO_VERSION%-win-amd64-vulkan.tar.gz -e --strip 1 -o ./bin/win-vulkan && .\node_modules\.bin\download https://delta.jan.ai/vulkaninfoSDK.exe -o ./bin diff --git 
a/extensions/inference-nitro-extension/package.json b/extensions/inference-nitro-extension/package.json index 8ad516ad98..ba6b473ebf 100644 --- a/extensions/inference-nitro-extension/package.json +++ b/extensions/inference-nitro-extension/package.json @@ -8,13 +8,13 @@ "license": "AGPL-3.0", "scripts": { "build": "tsc --module commonjs && rollup -c rollup.config.ts", - "downloadnitro:linux": "NITRO_VERSION=$(cat ./bin/version.txt) && download https://github.com/janhq/nitro/releases/download/v${NITRO_VERSION}/nitro-${NITRO_VERSION}-linux-amd64.tar.gz -e --strip 1 -o ./bin/linux-cpu && chmod +x ./bin/linux-cpu/nitro && download https://github.com/janhq/nitro/releases/download/v${NITRO_VERSION}/nitro-${NITRO_VERSION}-linux-amd64-cuda-12-0.tar.gz -e --strip 1 -o ./bin/linux-cuda-12-0 && chmod +x ./bin/linux-cuda-12-0/nitro && download https://github.com/janhq/nitro/releases/download/v${NITRO_VERSION}/nitro-${NITRO_VERSION}-linux-amd64-cuda-11-7.tar.gz -e --strip 1 -o ./bin/linux-cuda-11-7 && chmod +x ./bin/linux-cuda-11-7/nitro", + "downloadnitro:linux": "NITRO_VERSION=$(cat ./bin/version.txt) && download https://github.com/janhq/nitro/releases/download/v${NITRO_VERSION}/nitro-${NITRO_VERSION}-linux-amd64.tar.gz -e --strip 1 -o ./bin/linux-cpu && chmod +x ./bin/linux-cpu/nitro && download https://github.com/janhq/nitro/releases/download/v${NITRO_VERSION}/nitro-${NITRO_VERSION}-linux-amd64-cuda-12-0.tar.gz -e --strip 1 -o ./bin/linux-cuda-12-0 && chmod +x ./bin/linux-cuda-12-0/nitro && download https://github.com/janhq/nitro/releases/download/v${NITRO_VERSION}/nitro-${NITRO_VERSION}-linux-amd64-cuda-11-7.tar.gz -e --strip 1 -o ./bin/linux-cuda-11-7 && chmod +x ./bin/linux-cuda-11-7/nitro && download https://github.com/janhq/nitro/releases/download/v${NITRO_VERSION}/nitro-${NITRO_VERSION}-linux-amd64-vulkan.tar.gz -e --strip 1 -o ./bin/linux-vulkan && chmod +x ./bin/linux-vulkan/nitro && download https://delta.jan.ai/vulkaninfo -o ./bin && chmod +x ./bin/vulkaninfo", 
"downloadnitro:darwin": "NITRO_VERSION=$(cat ./bin/version.txt) && download https://github.com/janhq/nitro/releases/download/v${NITRO_VERSION}/nitro-${NITRO_VERSION}-mac-arm64.tar.gz -e --strip 1 -o ./bin/mac-arm64 && chmod +x ./bin/mac-arm64/nitro && download https://github.com/janhq/nitro/releases/download/v${NITRO_VERSION}/nitro-${NITRO_VERSION}-mac-amd64.tar.gz -e --strip 1 -o ./bin/mac-x64 && chmod +x ./bin/mac-x64/nitro", "downloadnitro:win32": "download.bat", "downloadnitro": "run-script-os", - "build:publish:darwin": "rimraf *.tgz --glob && npm run build && npm run downloadnitro && ../../.github/scripts/auto-sign.sh && cpx \"bin/**\" \"dist/bin\" && npm pack && cpx *.tgz ../../electron/pre-install", - "build:publish:win32": "rimraf *.tgz --glob && npm run build && npm run downloadnitro && cpx \"bin/**\" \"dist/bin\" && npm pack && cpx *.tgz ../../electron/pre-install", - "build:publish:linux": "rimraf *.tgz --glob && npm run build && npm run downloadnitro && cpx \"bin/**\" \"dist/bin\" && npm pack && cpx *.tgz ../../electron/pre-install", + "build:publish:darwin": "rimraf *.tgz --glob && npm run build && npm run downloadnitro && ../../.github/scripts/auto-sign.sh && cpx \"bin/**\" \"dist/bin\" && npm pack && cpx *.tgz ../../pre-install", + "build:publish:win32": "rimraf *.tgz --glob && npm run build && npm run downloadnitro && cpx \"bin/**\" \"dist/bin\" && npm pack && cpx *.tgz ../../pre-install", + "build:publish:linux": "rimraf *.tgz --glob && npm run build && npm run downloadnitro && cpx \"bin/**\" \"dist/bin\" && npm pack && cpx *.tgz ../../pre-install", "build:publish": "run-script-os" }, "exports": { @@ -35,12 +35,12 @@ "rollup-plugin-sourcemaps": "^0.6.3", "rollup-plugin-typescript2": "^0.36.0", "run-script-os": "^1.1.6", - "typescript": "^5.2.2" + "typescript": "^5.2.2", + "@types/os-utils": "^0.0.4", + "@rollup/plugin-replace": "^5.0.5" }, "dependencies": { "@janhq/core": "file:../../core", - "@rollup/plugin-replace": "^5.0.5", - 
"@types/os-utils": "^0.0.4", "fetch-retry": "^5.0.6", "path-browserify": "^1.0.1", "rxjs": "^7.8.1", diff --git a/extensions/inference-nitro-extension/rollup.config.ts b/extensions/inference-nitro-extension/rollup.config.ts index 374a054cd5..ec8943f9cd 100644 --- a/extensions/inference-nitro-extension/rollup.config.ts +++ b/extensions/inference-nitro-extension/rollup.config.ts @@ -1,31 +1,34 @@ -import resolve from "@rollup/plugin-node-resolve"; -import commonjs from "@rollup/plugin-commonjs"; -import sourceMaps from "rollup-plugin-sourcemaps"; -import typescript from "rollup-plugin-typescript2"; -import json from "@rollup/plugin-json"; -import replace from "@rollup/plugin-replace"; -const packageJson = require("./package.json"); +import resolve from '@rollup/plugin-node-resolve' +import commonjs from '@rollup/plugin-commonjs' +import sourceMaps from 'rollup-plugin-sourcemaps' +import typescript from 'rollup-plugin-typescript2' +import json from '@rollup/plugin-json' +import replace from '@rollup/plugin-replace' +const packageJson = require('./package.json') -const pkg = require("./package.json"); +const pkg = require('./package.json') export default [ { input: `src/index.ts`, - output: [{ file: pkg.main, format: "es", sourcemap: true }], + output: [{ file: pkg.main, format: 'es', sourcemap: true }], // Indicate here external modules you don't wanna include in your bundle (i.e.: 'lodash') external: [], watch: { - include: "src/**", + include: 'src/**', }, plugins: [ replace({ NODE: JSON.stringify(`${packageJson.name}/${packageJson.node}`), INFERENCE_URL: JSON.stringify( process.env.INFERENCE_URL || - "http://127.0.0.1:3928/inferences/llamacpp/chat_completion" + 'http://127.0.0.1:3928/inferences/llamacpp/chat_completion' ), TROUBLESHOOTING_URL: JSON.stringify( - "https://jan.ai/guides/troubleshooting" + 'https://jan.ai/guides/troubleshooting' + ), + JAN_SERVER_INFERENCE_URL: JSON.stringify( + 'http://localhost:1337/v1/chat/completions' ), }), // Allow json 
resolution @@ -39,7 +42,7 @@ export default [ // which external modules to include in the bundle // https://github.com/rollup/rollup-plugin-node-resolve#usage resolve({ - extensions: [".js", ".ts", ".svelte"], + extensions: ['.js', '.ts', '.svelte'], }), // Resolve source maps to the original source @@ -49,12 +52,12 @@ export default [ { input: `src/node/index.ts`, output: [ - { file: "dist/node/index.cjs.js", format: "cjs", sourcemap: true }, + { file: 'dist/node/index.cjs.js', format: 'cjs', sourcemap: true }, ], // Indicate here external modules you don't wanna include in your bundle (i.e.: 'lodash') - external: ["@janhq/core/node"], + external: ['@janhq/core/node'], watch: { - include: "src/node/**", + include: 'src/node/**', }, plugins: [ // Allow json resolution @@ -67,11 +70,11 @@ export default [ // which external modules to include in the bundle // https://github.com/rollup/rollup-plugin-node-resolve#usage resolve({ - extensions: [".ts", ".js", ".json"], + extensions: ['.ts', '.js', '.json'], }), // Resolve source maps to the original source sourceMaps(), ], }, -]; +] diff --git a/extensions/inference-nitro-extension/src/@types/global.d.ts b/extensions/inference-nitro-extension/src/@types/global.d.ts index bc126337f6..3a3d2aa325 100644 --- a/extensions/inference-nitro-extension/src/@types/global.d.ts +++ b/extensions/inference-nitro-extension/src/@types/global.d.ts @@ -1,12 +1,13 @@ -declare const NODE: string; -declare const INFERENCE_URL: string; -declare const TROUBLESHOOTING_URL: string; +declare const NODE: string +declare const INFERENCE_URL: string +declare const TROUBLESHOOTING_URL: string +declare const JAN_SERVER_INFERENCE_URL: string /** * The response from the initModel function. * @property error - An error message if the model fails to load. 
*/ interface ModelOperationResponse { - error?: any; - modelFile?: string; + error?: any + modelFile?: string } diff --git a/extensions/inference-nitro-extension/src/helpers/sse.ts b/extensions/inference-nitro-extension/src/helpers/sse.ts index c6352383d4..06176c9b9d 100644 --- a/extensions/inference-nitro-extension/src/helpers/sse.ts +++ b/extensions/inference-nitro-extension/src/helpers/sse.ts @@ -1,11 +1,12 @@ -import { Model } from "@janhq/core"; -import { Observable } from "rxjs"; +import { Model } from '@janhq/core' +import { Observable } from 'rxjs' /** * Sends a request to the inference server to generate a response based on the recent messages. * @param recentMessages - An array of recent messages to use as context for the inference. * @returns An Observable that emits the generated response as a string. */ export function requestInference( + inferenceUrl: string, recentMessages: any[], model: Model, controller?: AbortController @@ -16,50 +17,50 @@ export function requestInference( model: model.id, stream: true, ...model.parameters, - }); - fetch(INFERENCE_URL, { - method: "POST", + }) + fetch(inferenceUrl, { + method: 'POST', headers: { - "Content-Type": "application/json", - "Access-Control-Allow-Origin": "*", - Accept: model.parameters.stream - ? "text/event-stream" - : "application/json", + 'Content-Type': 'application/json', + 'Access-Control-Allow-Origin': '*', + 'Accept': model.parameters.stream + ? 'text/event-stream' + : 'application/json', }, body: requestBody, signal: controller?.signal, }) .then(async (response) => { if (model.parameters.stream === false) { - const data = await response.json(); - subscriber.next(data.choices[0]?.message?.content ?? ""); + const data = await response.json() + subscriber.next(data.choices[0]?.message?.content ?? 
'') } else { - const stream = response.body; - const decoder = new TextDecoder("utf-8"); - const reader = stream?.getReader(); - let content = ""; + const stream = response.body + const decoder = new TextDecoder('utf-8') + const reader = stream?.getReader() + let content = '' while (true && reader) { - const { done, value } = await reader.read(); + const { done, value } = await reader.read() if (done) { - break; + break } - const text = decoder.decode(value); - const lines = text.trim().split("\n"); + const text = decoder.decode(value) + const lines = text.trim().split('\n') for (const line of lines) { - if (line.startsWith("data: ") && !line.includes("data: [DONE]")) { - const data = JSON.parse(line.replace("data: ", "")); - content += data.choices[0]?.delta?.content ?? ""; - if (content.startsWith("assistant: ")) { - content = content.replace("assistant: ", ""); + if (line.startsWith('data: ') && !line.includes('data: [DONE]')) { + const data = JSON.parse(line.replace('data: ', '')) + content += data.choices[0]?.delta?.content ?? 
'' + if (content.startsWith('assistant: ')) { + content = content.replace('assistant: ', '') } - subscriber.next(content); + subscriber.next(content) } } } } - subscriber.complete(); + subscriber.complete() }) - .catch((err) => subscriber.error(err)); - }); + .catch((err) => subscriber.error(err)) + }) } diff --git a/extensions/inference-nitro-extension/src/index.ts b/extensions/inference-nitro-extension/src/index.ts index 2b0021ba0b..979b4cfac9 100644 --- a/extensions/inference-nitro-extension/src/index.ts +++ b/extensions/inference-nitro-extension/src/index.ts @@ -10,6 +10,7 @@ import { ChatCompletionRole, ContentType, MessageRequest, + MessageRequestType, MessageStatus, ThreadContent, ThreadMessage, @@ -25,9 +26,10 @@ import { ModelEvent, InferenceEvent, ModelSettingParams, -} from "@janhq/core"; -import { requestInference } from "./helpers/sse"; -import { ulid } from "ulid"; + getJanDataFolderPath, +} from '@janhq/core' +import { requestInference } from './helpers/sse' +import { ulid } from 'ulid' /** * A class that implements the InferenceExtension interface from the @janhq/core package. @@ -35,16 +37,16 @@ import { ulid } from "ulid"; * It also subscribes to events emitted by the @janhq/core package and handles new message requests. */ export default class JanInferenceNitroExtension extends InferenceExtension { - private static readonly _homeDir = "file://engines"; - private static readonly _settingsDir = "file://settings"; - private static readonly _engineMetadataFileName = "nitro.json"; + private static readonly _homeDir = 'file://engines' + private static readonly _settingsDir = 'file://settings' + private static readonly _engineMetadataFileName = 'nitro.json' /** * Checking the health for Nitro's process each 5 secs. 
*/ - private static readonly _intervalHealthCheck = 5 * 1000; + private static readonly _intervalHealthCheck = 5 * 1000 - private _currentModel: Model | undefined; + private _currentModel: Model | undefined private _engineSettings: ModelSettingParams = { ctx_len: 2048, @@ -52,55 +54,63 @@ export default class JanInferenceNitroExtension extends InferenceExtension { cpu_threads: 1, cont_batching: false, embedding: true, - }; + } - controller = new AbortController(); - isCancelled = false; + controller = new AbortController() + isCancelled = false /** * The interval id for the health check. Used to stop the health check. */ - private getNitroProcesHealthIntervalId: NodeJS.Timeout | undefined = - undefined; + private getNitroProcesHealthIntervalId: NodeJS.Timeout | undefined = undefined /** * Tracking the current state of nitro process. */ - private nitroProcessInfo: any = undefined; + private nitroProcessInfo: any = undefined + + private inferenceUrl = '' /** * Subscribes to events emitted by the @janhq/core package. 
*/ async onLoad() { if (!(await fs.existsSync(JanInferenceNitroExtension._homeDir))) { - await fs - .mkdirSync(JanInferenceNitroExtension._homeDir) - .catch((err: Error) => console.debug(err)); + try { + await fs.mkdirSync(JanInferenceNitroExtension._homeDir) + } catch (e) { + console.debug(e) + } + } + + // init inference url + // @ts-ignore + const electronApi = window?.electronAPI + this.inferenceUrl = INFERENCE_URL + if (!electronApi) { + this.inferenceUrl = `${window.core?.api?.baseApiUrl}/v1/chat/completions` } + console.debug('Inference url: ', this.inferenceUrl) if (!(await fs.existsSync(JanInferenceNitroExtension._settingsDir))) - await fs.mkdirSync(JanInferenceNitroExtension._settingsDir); - this.writeDefaultEngineSettings(); + await fs.mkdirSync(JanInferenceNitroExtension._settingsDir) + this.writeDefaultEngineSettings() // Events subscription events.on(MessageEvent.OnMessageSent, (data: MessageRequest) => - this.onMessageRequest(data), - ); + this.onMessageRequest(data) + ) - events.on(ModelEvent.OnModelInit, (model: Model) => - this.onModelInit(model), - ); + events.on(ModelEvent.OnModelInit, (model: Model) => this.onModelInit(model)) - events.on(ModelEvent.OnModelStop, (model: Model) => - this.onModelStop(model), - ); + events.on(ModelEvent.OnModelStop, (model: Model) => this.onModelStop(model)) events.on(InferenceEvent.OnInferenceStopped, () => - this.onInferenceStopped(), - ); + this.onInferenceStopped() + ) // Attempt to fetch nvidia info - await executeOnMain(NODE, "updateNvidiaInfo", {}); + await executeOnMain(NODE, 'updateNvidiaInfo', {}) } /** @@ -113,56 +123,62 @@ export default class JanInferenceNitroExtension extends InferenceExtension { const engineFile = await joinPath([ JanInferenceNitroExtension._homeDir, JanInferenceNitroExtension._engineMetadataFileName, - ]); + ]) if (await fs.existsSync(engineFile)) { - const engine = await fs.readFileSync(engineFile, "utf-8"); + const engine = await fs.readFileSync(engineFile, 'utf-8') 
this._engineSettings = - typeof engine === "object" ? engine : JSON.parse(engine); + typeof engine === 'object' ? engine : JSON.parse(engine) } else { await fs.writeFileSync( engineFile, - JSON.stringify(this._engineSettings, null, 2), - ); + JSON.stringify(this._engineSettings, null, 2) + ) } } catch (err) { - console.error(err); + console.error(err) } } private async onModelInit(model: Model) { - if (model.engine !== InferenceEngine.nitro) return; - - const modelFullPath = await joinPath(["models", model.id]); - - this._currentModel = model; - const nitroInitResult = await executeOnMain(NODE, "runModel", { - modelFullPath, + if (model.engine !== InferenceEngine.nitro) return + + const modelFolder = await joinPath([ + await getJanDataFolderPath(), + 'models', + model.id, + ]) + this._currentModel = model + const nitroInitResult = await executeOnMain(NODE, 'runModel', { + modelFolder, model, - }); + }) if (nitroInitResult?.error) { - events.emit(ModelEvent.OnModelFail, model); - return; + events.emit(ModelEvent.OnModelFail, { + ...model, + error: nitroInitResult.error, + }) + return } - events.emit(ModelEvent.OnModelReady, model); + events.emit(ModelEvent.OnModelReady, model) this.getNitroProcesHealthIntervalId = setInterval( () => this.periodicallyGetNitroHealth(), - JanInferenceNitroExtension._intervalHealthCheck, - ); + JanInferenceNitroExtension._intervalHealthCheck + ) } private async onModelStop(model: Model) { - if (model.engine !== "nitro") return; + if (model.engine !== 'nitro') return - await executeOnMain(NODE, "stopModel"); - events.emit(ModelEvent.OnModelStopped, {}); + await executeOnMain(NODE, 'stopModel') + events.emit(ModelEvent.OnModelStopped, {}) // stop the periocally health check if (this.getNitroProcesHealthIntervalId) { - clearInterval(this.getNitroProcesHealthIntervalId); - this.getNitroProcesHealthIntervalId = undefined; + clearInterval(this.getNitroProcesHealthIntervalId) + this.getNitroProcesHealthIntervalId = undefined } } @@ -170,19 
+186,19 @@ export default class JanInferenceNitroExtension extends InferenceExtension { * Periodically check for nitro process's health. */ private async periodicallyGetNitroHealth(): Promise { - const health = await executeOnMain(NODE, "getCurrentNitroProcessInfo"); + const health = await executeOnMain(NODE, 'getCurrentNitroProcessInfo') - const isRunning = this.nitroProcessInfo?.isRunning ?? false; + const isRunning = this.nitroProcessInfo?.isRunning ?? false if (isRunning && health.isRunning === false) { - console.debug("Nitro process is stopped"); - events.emit(ModelEvent.OnModelStopped, {}); + console.debug('Nitro process is stopped') + events.emit(ModelEvent.OnModelStopped, {}) } - this.nitroProcessInfo = health; + this.nitroProcessInfo = health } private async onInferenceStopped() { - this.isCancelled = true; - this.controller?.abort(); + this.isCancelled = true + this.controller?.abort() } /** @@ -191,31 +207,35 @@ export default class JanInferenceNitroExtension extends InferenceExtension { * @returns {Promise} A promise that resolves with the inference response. */ async inference(data: MessageRequest): Promise { - const timestamp = Date.now(); + const timestamp = Date.now() const message: ThreadMessage = { thread_id: data.threadId, created: timestamp, updated: timestamp, status: MessageStatus.Ready, - id: "", + id: '', role: ChatCompletionRole.Assistant, - object: "thread.message", + object: 'thread.message', content: [], - }; + } return new Promise(async (resolve, reject) => { - if (!this._currentModel) return Promise.reject("No model loaded"); + if (!this._currentModel) return Promise.reject('No model loaded') - requestInference(data.messages ?? [], this._currentModel).subscribe({ + requestInference( + this.inferenceUrl, + data.messages ?? 
[], + this._currentModel + ).subscribe({ next: (_content: any) => {}, complete: async () => { - resolve(message); + resolve(message) }, error: async (err: any) => { - reject(err); + reject(err) }, - }); - }); + }) + }) } /** @@ -226,32 +246,41 @@ export default class JanInferenceNitroExtension extends InferenceExtension { */ private async onMessageRequest(data: MessageRequest) { if (data.model?.engine !== InferenceEngine.nitro || !this._currentModel) { - return; + return } - const timestamp = Date.now(); + const timestamp = Date.now() const message: ThreadMessage = { id: ulid(), thread_id: data.threadId, + type: data.type, assistant_id: data.assistantId, role: ChatCompletionRole.Assistant, content: [], status: MessageStatus.Pending, created: timestamp, updated: timestamp, - object: "thread.message", - }; - events.emit(MessageEvent.OnMessageResponse, message); + object: 'thread.message', + } + + if (data.type !== MessageRequestType.Summary) { + events.emit(MessageEvent.OnMessageResponse, message) + } - this.isCancelled = false; - this.controller = new AbortController(); + this.isCancelled = false + this.controller = new AbortController() // @ts-ignore const model: Model = { ...(this._currentModel || {}), ...(data.model || {}), - }; - requestInference(data.messages ?? [], model, this.controller).subscribe({ + } + requestInference( + this.inferenceUrl, + data.messages ?? [], + model, + this.controller + ).subscribe({ next: (content: any) => { const messageContent: ThreadContent = { type: ContentType.Text, @@ -259,26 +288,26 @@ export default class JanInferenceNitroExtension extends InferenceExtension { value: content.trim(), annotations: [], }, - }; - message.content = [messageContent]; - events.emit(MessageEvent.OnMessageUpdate, message); + } + message.content = [messageContent] + events.emit(MessageEvent.OnMessageUpdate, message) }, complete: async () => { message.status = message.content.length ? 
MessageStatus.Ready - : MessageStatus.Error; - events.emit(MessageEvent.OnMessageUpdate, message); + : MessageStatus.Error + events.emit(MessageEvent.OnMessageUpdate, message) }, error: async (err: any) => { if (this.isCancelled || message.content.length) { - message.status = MessageStatus.Stopped; - events.emit(MessageEvent.OnMessageUpdate, message); - return; + message.status = MessageStatus.Stopped + events.emit(MessageEvent.OnMessageUpdate, message) + return } - message.status = MessageStatus.Error; - events.emit(MessageEvent.OnMessageUpdate, message); - log(`[APP]::Error: ${err.message}`); + message.status = MessageStatus.Error + events.emit(MessageEvent.OnMessageUpdate, message) + log(`[APP]::Error: ${err.message}`) }, - }); + }) } } diff --git a/extensions/inference-nitro-extension/src/node/accelerator.ts b/extensions/inference-nitro-extension/src/node/accelerator.ts new file mode 100644 index 0000000000..972f88681b --- /dev/null +++ b/extensions/inference-nitro-extension/src/node/accelerator.ts @@ -0,0 +1,240 @@ +import { writeFileSync, existsSync, readFileSync } from 'fs' +import { exec, spawn } from 'child_process' +import path from 'path' +import { getJanDataFolderPath, log } from '@janhq/core/node' + +/** + * Default GPU settings + * TODO: This needs to be refactored to support multiple accelerators + **/ +const DEFALT_SETTINGS = { + notify: true, + run_mode: 'cpu', + nvidia_driver: { + exist: false, + version: '', + }, + cuda: { + exist: false, + version: '', + }, + gpus: [], + gpu_highest_vram: '', + gpus_in_use: [], + is_initial: true, + // TODO: This needs to be set based on user toggle in settings + vulkan: { + enabled: true, + gpu_in_use: '1', + }, +} + +/** + * Path to the settings file + **/ +export const GPU_INFO_FILE = path.join( + getJanDataFolderPath(), + 'settings', + 'settings.json' +) + +/** + * Current nitro process + */ +let nitroProcessInfo: NitroProcessInfo | undefined = undefined + +/** + * Nitro process info + */ +export interface 
NitroProcessInfo { + isRunning: boolean +} + +/** + * This will retrive GPU informations and persist settings.json + * Will be called when the extension is loaded to turn on GPU acceleration if supported + */ +export async function updateNvidiaInfo() { + if (process.platform !== 'darwin') { + let data + try { + data = JSON.parse(readFileSync(GPU_INFO_FILE, 'utf-8')) + } catch (error) { + data = DEFALT_SETTINGS + writeFileSync(GPU_INFO_FILE, JSON.stringify(data, null, 2)) + } + updateNvidiaDriverInfo() + updateGpuInfo() + } +} + +/** + * Retrieve current nitro process + */ +export const getNitroProcessInfo = (subprocess: any): NitroProcessInfo => { + nitroProcessInfo = { + isRunning: subprocess != null, + } + return nitroProcessInfo +} + +/** + * Validate nvidia and cuda for linux and windows + */ +export async function updateNvidiaDriverInfo(): Promise { + exec( + 'nvidia-smi --query-gpu=driver_version --format=csv,noheader', + (error, stdout) => { + let data = JSON.parse(readFileSync(GPU_INFO_FILE, 'utf-8')) + + if (!error) { + const firstLine = stdout.split('\n')[0].trim() + data['nvidia_driver'].exist = true + data['nvidia_driver'].version = firstLine + } else { + data['nvidia_driver'].exist = false + } + + writeFileSync(GPU_INFO_FILE, JSON.stringify(data, null, 2)) + Promise.resolve() + } + ) +} + +/** + * Check if file exists in paths + */ +export function checkFileExistenceInPaths( + file: string, + paths: string[] +): boolean { + return paths.some((p) => existsSync(path.join(p, file))) +} + +/** + * Validate cuda for linux and windows + */ +export function updateCudaExistence( + data: Record = DEFALT_SETTINGS +): Record { + let filesCuda12: string[] + let filesCuda11: string[] + let paths: string[] + let cudaVersion: string = '' + + if (process.platform === 'win32') { + filesCuda12 = ['cublas64_12.dll', 'cudart64_12.dll', 'cublasLt64_12.dll'] + filesCuda11 = ['cublas64_11.dll', 'cudart64_11.dll', 'cublasLt64_11.dll'] + paths = process.env.PATH ? 
process.env.PATH.split(path.delimiter) : [] + } else { + filesCuda12 = ['libcudart.so.12', 'libcublas.so.12', 'libcublasLt.so.12'] + filesCuda11 = ['libcudart.so.11.0', 'libcublas.so.11', 'libcublasLt.so.11'] + paths = process.env.LD_LIBRARY_PATH + ? process.env.LD_LIBRARY_PATH.split(path.delimiter) + : [] + paths.push('/usr/lib/x86_64-linux-gnu/') + } + + let cudaExists = filesCuda12.every( + (file) => existsSync(file) || checkFileExistenceInPaths(file, paths) + ) + + if (!cudaExists) { + cudaExists = filesCuda11.every( + (file) => existsSync(file) || checkFileExistenceInPaths(file, paths) + ) + if (cudaExists) { + cudaVersion = '11' + } + } else { + cudaVersion = '12' + } + + data['cuda'].exist = cudaExists + data['cuda'].version = cudaVersion + console.log(data['is_initial'], data['gpus_in_use']) + if (cudaExists && data['is_initial'] && data['gpus_in_use'].length > 0) { + data.run_mode = 'gpu' + } + data.is_initial = false + return data +} + +/** + * Get GPU information + */ +export async function updateGpuInfo(): Promise { + let data = JSON.parse(readFileSync(GPU_INFO_FILE, 'utf-8')) + + // Cuda + if (data['vulkan'] === true) { + // Vulkan + exec( + process.platform === 'win32' + ? `${__dirname}\\..\\bin\\vulkaninfoSDK.exe --summary` + : `${__dirname}/../bin/vulkaninfo --summary`, + (error, stdout) => { + if (!error) { + const output = stdout.toString() + log(output) + const gpuRegex = /GPU(\d+):(?:[\s\S]*?)deviceName\s*=\s*(.*)/g + + let gpus = [] + let match + while ((match = gpuRegex.exec(output)) !== null) { + const id = match[1] + const name = match[2] + gpus.push({ id, vram: 0, name }) + } + data.gpus = gpus + + if (!data['gpus_in_use'] || data['gpus_in_use'].length === 0) { + data.gpus_in_use = [data.gpus.length > 1 ? 
'1' : '0'] + } + + data = updateCudaExistence(data) + writeFileSync(GPU_INFO_FILE, JSON.stringify(data, null, 2)) + } + Promise.resolve() + } + ) + } else { + exec( + 'nvidia-smi --query-gpu=index,memory.total,name --format=csv,noheader,nounits', + (error, stdout) => { + if (!error) { + log(stdout) + // Get GPU info and gpu has higher memory first + let highestVram = 0 + let highestVramId = '0' + let gpus = stdout + .trim() + .split('\n') + .map((line) => { + let [id, vram, name] = line.split(', ') + vram = vram.replace(/\r/g, '') + if (parseFloat(vram) > highestVram) { + highestVram = parseFloat(vram) + highestVramId = id + } + return { id, vram, name } + }) + + data.gpus = gpus + data.gpu_highest_vram = highestVramId + } else { + data.gpus = [] + data.gpu_highest_vram = '' + } + + if (!data['gpus_in_use'] || data['gpus_in_use'].length === 0) { + data.gpus_in_use = [data['gpu_highest_vram']] + } + + data = updateCudaExistence(data) + writeFileSync(GPU_INFO_FILE, JSON.stringify(data, null, 2)) + Promise.resolve() + } + ) + } +} diff --git a/extensions/inference-nitro-extension/src/node/execute.ts b/extensions/inference-nitro-extension/src/node/execute.ts index ca266639c6..08baba0d53 100644 --- a/extensions/inference-nitro-extension/src/node/execute.ts +++ b/extensions/inference-nitro-extension/src/node/execute.ts @@ -1,65 +1,79 @@ -import { readFileSync } from "fs"; -import * as path from "path"; -import { NVIDIA_INFO_FILE } from "./nvidia"; +import { readFileSync } from 'fs' +import * as path from 'path' +import { GPU_INFO_FILE } from './accelerator' export interface NitroExecutableOptions { - executablePath: string; - cudaVisibleDevices: string; + executablePath: string + cudaVisibleDevices: string + vkVisibleDevices: string } /** * Find which executable file to run based on the current platform. * @returns The name of the executable file to run. 
*/ export const executableNitroFile = (): NitroExecutableOptions => { - let binaryFolder = path.join(__dirname, "..", "bin"); // Current directory by default - let cudaVisibleDevices = ""; - let binaryName = "nitro"; + let binaryFolder = path.join(__dirname, '..', 'bin') // Current directory by default + let cudaVisibleDevices = '' + let vkVisibleDevices = '' + let binaryName = 'nitro' /** * The binary folder is different for each platform. */ - if (process.platform === "win32") { + if (process.platform === 'win32') { /** - * For Windows: win-cpu, win-cuda-11-7, win-cuda-12-0 + * For Windows: win-cpu, win-vulkan, win-cuda-11-7, win-cuda-12-0 */ - let nvidiaInfo = JSON.parse(readFileSync(NVIDIA_INFO_FILE, "utf-8")); - if (nvidiaInfo["run_mode"] === "cpu") { - binaryFolder = path.join(binaryFolder, "win-cpu"); + let gpuInfo = JSON.parse(readFileSync(GPU_INFO_FILE, 'utf-8')) + if (gpuInfo['run_mode'] === 'cpu') { + binaryFolder = path.join(binaryFolder, 'win-cpu') } else { - if (nvidiaInfo["cuda"].version === "12") { - binaryFolder = path.join(binaryFolder, "win-cuda-12-0"); + if (gpuInfo['cuda']?.version === '11') { + binaryFolder = path.join(binaryFolder, 'win-cuda-11-7') } else { - binaryFolder = path.join(binaryFolder, "win-cuda-11-7"); + binaryFolder = path.join(binaryFolder, 'win-cuda-12-0') } - cudaVisibleDevices = nvidiaInfo["gpu_highest_vram"]; + cudaVisibleDevices = gpuInfo['gpus_in_use'].join(',') } - binaryName = "nitro.exe"; - } else if (process.platform === "darwin") { + if (gpuInfo['vulkan'] === true) { + binaryFolder = path.join(__dirname, '..', 'bin') + binaryFolder = path.join(binaryFolder, 'win-vulkan') + vkVisibleDevices = gpuInfo['gpus_in_use'].toString() + } + binaryName = 'nitro.exe' + } else if (process.platform === 'darwin') { /** * For MacOS: mac-arm64 (Silicon), mac-x64 (InteL) */ - if (process.arch === "arm64") { - binaryFolder = path.join(binaryFolder, "mac-arm64"); + if (process.arch === 'arm64') { + binaryFolder = path.join(binaryFolder, 
'mac-arm64') } else { - binaryFolder = path.join(binaryFolder, "mac-x64"); + binaryFolder = path.join(binaryFolder, 'mac-x64') } } else { /** - * For Linux: linux-cpu, linux-cuda-11-7, linux-cuda-12-0 + * For Linux: linux-cpu, linux-vulkan, linux-cuda-11-7, linux-cuda-12-0 */ - let nvidiaInfo = JSON.parse(readFileSync(NVIDIA_INFO_FILE, "utf-8")); - if (nvidiaInfo["run_mode"] === "cpu") { - binaryFolder = path.join(binaryFolder, "linux-cpu"); + let gpuInfo = JSON.parse(readFileSync(GPU_INFO_FILE, 'utf-8')) + if (gpuInfo['run_mode'] === 'cpu') { + binaryFolder = path.join(binaryFolder, 'linux-cpu') } else { - if (nvidiaInfo["cuda"].version === "12") { - binaryFolder = path.join(binaryFolder, "linux-cuda-12-0"); + if (gpuInfo['cuda']?.version === '11') { + binaryFolder = path.join(binaryFolder, 'linux-cuda-11-7') } else { - binaryFolder = path.join(binaryFolder, "linux-cuda-11-7"); + binaryFolder = path.join(binaryFolder, 'linux-cuda-12-0') } - cudaVisibleDevices = nvidiaInfo["gpu_highest_vram"]; + cudaVisibleDevices = gpuInfo['gpus_in_use'].join(',') + } + + if (gpuInfo['vulkan'] === true) { + binaryFolder = path.join(__dirname, '..', 'bin') + binaryFolder = path.join(binaryFolder, 'win-vulkan') + vkVisibleDevices = gpuInfo['gpus_in_use'].toString() } } return { executablePath: path.join(binaryFolder, binaryName), cudaVisibleDevices, - }; -}; + vkVisibleDevices, + } +} diff --git a/extensions/inference-nitro-extension/src/node/index.ts b/extensions/inference-nitro-extension/src/node/index.ts index 7ba90b556b..9b2684a6c5 100644 --- a/extensions/inference-nitro-extension/src/node/index.ts +++ b/extensions/inference-nitro-extension/src/node/index.ts @@ -1,55 +1,50 @@ -import fs from "fs"; -import path from "path"; -import { ChildProcessWithoutNullStreams, spawn } from "child_process"; -import tcpPortUsed from "tcp-port-used"; -import fetchRT from "fetch-retry"; -import { - log, - getJanDataFolderPath, - getSystemResourceInfo, -} from "@janhq/core/node"; -import { 
getNitroProcessInfo, updateNvidiaInfo } from "./nvidia"; +import fs from 'fs' +import path from 'path' +import { ChildProcessWithoutNullStreams, spawn } from 'child_process' +import tcpPortUsed from 'tcp-port-used' +import fetchRT from 'fetch-retry' +import { log, getSystemResourceInfo } from '@janhq/core/node' +import { getNitroProcessInfo, updateNvidiaInfo } from './accelerator' import { Model, InferenceEngine, ModelSettingParams, PromptTemplate, -} from "@janhq/core"; -import { executableNitroFile } from "./execute"; +} from '@janhq/core' +import { executableNitroFile } from './execute' // Polyfill fetch with retry -const fetchRetry = fetchRT(fetch); +const fetchRetry = fetchRT(fetch) /** * The response object for model init operation. */ interface ModelInitOptions { - modelFullPath: string; - model: Model; + modelFolder: string + model: Model } // The PORT to use for the Nitro subprocess -const PORT = 3928; +const PORT = 3928 // The HOST address to use for the Nitro subprocess -const LOCAL_HOST = "127.0.0.1"; +const LOCAL_HOST = '127.0.0.1' // The URL for the Nitro subprocess -const NITRO_HTTP_SERVER_URL = `http://${LOCAL_HOST}:${PORT}`; +const NITRO_HTTP_SERVER_URL = `http://${LOCAL_HOST}:${PORT}` // The URL for the Nitro subprocess to load a model -const NITRO_HTTP_LOAD_MODEL_URL = `${NITRO_HTTP_SERVER_URL}/inferences/llamacpp/loadmodel`; +const NITRO_HTTP_LOAD_MODEL_URL = `${NITRO_HTTP_SERVER_URL}/inferences/llamacpp/loadmodel` // The URL for the Nitro subprocess to validate a model -const NITRO_HTTP_VALIDATE_MODEL_URL = `${NITRO_HTTP_SERVER_URL}/inferences/llamacpp/modelstatus`; +const NITRO_HTTP_VALIDATE_MODEL_URL = `${NITRO_HTTP_SERVER_URL}/inferences/llamacpp/modelstatus` // The URL for the Nitro subprocess to kill itself -const NITRO_HTTP_KILL_URL = `${NITRO_HTTP_SERVER_URL}/processmanager/destroy`; +const NITRO_HTTP_KILL_URL = `${NITRO_HTTP_SERVER_URL}/processmanager/destroy` // The supported model format // TODO: Should be an array to support more 
models -const SUPPORTED_MODEL_FORMAT = ".gguf"; +const SUPPORTED_MODEL_FORMAT = '.gguf' // The subprocess instance for Nitro -let subprocess: ChildProcessWithoutNullStreams | undefined = undefined; -// The current model file url -let currentModelFile: string = ""; +let subprocess: ChildProcessWithoutNullStreams | undefined = undefined + // The current model settings -let currentSettings: ModelSettingParams | undefined = undefined; +let currentSettings: ModelSettingParams | undefined = undefined /** * Stops a Nitro subprocess. @@ -57,7 +52,7 @@ let currentSettings: ModelSettingParams | undefined = undefined; * @returns A Promise that resolves when the subprocess is terminated successfully, or rejects with an error message if the subprocess fails to terminate. */ function stopModel(): Promise { - return killSubprocess(); + return killSubprocess() } /** @@ -67,62 +62,79 @@ function stopModel(): Promise { * TODO: Should pass absolute of the model file instead of just the name - So we can modurize the module.ts to npm package */ async function runModel( - wrapper: ModelInitOptions, + wrapper: ModelInitOptions ): Promise { if (wrapper.model.engine !== InferenceEngine.nitro) { // Not a nitro model - return Promise.resolve(); + return Promise.resolve() } - currentModelFile = wrapper.modelFullPath; - const janRoot = await getJanDataFolderPath(); - if (!currentModelFile.includes(janRoot)) { - currentModelFile = path.join(janRoot, currentModelFile); - } - const files: string[] = fs.readdirSync(currentModelFile); - - // Look for GGUF model file - const ggufBinFile = files.find( - (file) => - file === path.basename(currentModelFile) || - file.toLowerCase().includes(SUPPORTED_MODEL_FORMAT), - ); - - if (!ggufBinFile) return Promise.reject("No GGUF model file found"); - - currentModelFile = path.join(currentModelFile, ggufBinFile); - if (wrapper.model.engine !== InferenceEngine.nitro) { - return Promise.reject("Not a nitro model"); + return Promise.reject('Not a nitro model') } 
else { - const nitroResourceProbe = await getSystemResourceInfo(); + const nitroResourceProbe = await getSystemResourceInfo() // Convert settings.prompt_template to system_prompt, user_prompt, ai_prompt if (wrapper.model.settings.prompt_template) { - const promptTemplate = wrapper.model.settings.prompt_template; - const prompt = promptTemplateConverter(promptTemplate); + const promptTemplate = wrapper.model.settings.prompt_template + const prompt = promptTemplateConverter(promptTemplate) if (prompt?.error) { - return Promise.reject(prompt.error); + return Promise.reject(prompt.error) } - wrapper.model.settings.system_prompt = prompt.system_prompt; - wrapper.model.settings.user_prompt = prompt.user_prompt; - wrapper.model.settings.ai_prompt = prompt.ai_prompt; + wrapper.model.settings.system_prompt = prompt.system_prompt + wrapper.model.settings.user_prompt = prompt.user_prompt + wrapper.model.settings.ai_prompt = prompt.ai_prompt + } + + // modelFolder is the absolute path to the running model folder + // e.g. ~/jan/models/llama-2 + let modelFolder = wrapper.modelFolder + + let llama_model_path = wrapper.model.settings.llama_model_path + + // Absolute model path support + if ( + wrapper.model?.sources.length && + wrapper.model.sources.every((e) => fs.existsSync(e.url)) + ) { + llama_model_path = + wrapper.model.sources.length === 1 + ? wrapper.model.sources[0].url + : wrapper.model.sources.find((e) => + e.url.includes(llama_model_path ?? wrapper.model.id) + )?.url } - const modelFolderPath = path.join(janRoot, "models", wrapper.model.id); - const modelPath = wrapper.model.settings.llama_model_path - ? path.join(modelFolderPath, wrapper.model.settings.llama_model_path) - : currentModelFile; + if (!llama_model_path || !path.isAbsolute(llama_model_path)) { + // Look for GGUF model file + const modelFiles: string[] = fs.readdirSync(modelFolder) + const ggufBinFile = modelFiles.find( + (file) => + // 1. 
Prioritize llama_model_path (predefined) + (llama_model_path && file === llama_model_path) || + // 2. Prioritize GGUF File (manual import) + file.toLowerCase().includes(SUPPORTED_MODEL_FORMAT) || + // 3. Fallback Model ID (for backward compatibility) + file === wrapper.model.id + ) + if (ggufBinFile) llama_model_path = path.join(modelFolder, ggufBinFile) + } + + // Look for absolute source path for single model + + if (!llama_model_path) return Promise.reject('No GGUF model file found') currentSettings = { ...wrapper.model.settings, - llama_model_path: modelPath, + llama_model_path, // This is critical and requires real CPU physical core count (or performance core) cpu_threads: Math.max(1, nitroResourceProbe.numCpuPhysicalCore), ...(wrapper.model.settings.mmproj && { - mmproj: path.join(modelFolderPath, wrapper.model.settings.mmproj), + mmproj: path.isAbsolute(wrapper.model.settings.mmproj) + ? wrapper.model.settings.mmproj + : path.join(modelFolder, wrapper.model.settings.mmproj), }), - }; - return runNitroAndLoadModel(); + } + return runNitroAndLoadModel() } } @@ -142,10 +154,10 @@ async function runNitroAndLoadModel() { * Should wait for awhile to make sure the port is free and subprocess is killed * The tested threshold is 500ms **/ - if (process.platform === "win32") { - return new Promise((resolve) => setTimeout(resolve, 500)); + if (process.platform === 'win32') { + return new Promise((resolve) => setTimeout(resolve, 500)) } else { - return Promise.resolve(); + return Promise.resolve() } }) .then(spawnNitroProcess) @@ -153,9 +165,9 @@ async function runNitroAndLoadModel() { .then(validateModelStatus) .catch((err) => { // TODO: Broadcast error so app could display proper error message - log(`[NITRO]::Error: ${err}`); - return { error: err }; - }); + log(`[NITRO]::Error: ${err}`) + return { error: err } + }) } /** @@ -165,43 +177,43 @@ async function runNitroAndLoadModel() { */ function promptTemplateConverter(promptTemplate: string): PromptTemplate { // Split 
the string using the markers - const systemMarker = "{system_message}"; - const promptMarker = "{prompt}"; + const systemMarker = '{system_message}' + const promptMarker = '{prompt}' if ( promptTemplate.includes(systemMarker) && promptTemplate.includes(promptMarker) ) { // Find the indices of the markers - const systemIndex = promptTemplate.indexOf(systemMarker); - const promptIndex = promptTemplate.indexOf(promptMarker); + const systemIndex = promptTemplate.indexOf(systemMarker) + const promptIndex = promptTemplate.indexOf(promptMarker) // Extract the parts of the string - const system_prompt = promptTemplate.substring(0, systemIndex); + const system_prompt = promptTemplate.substring(0, systemIndex) const user_prompt = promptTemplate.substring( systemIndex + systemMarker.length, - promptIndex, - ); + promptIndex + ) const ai_prompt = promptTemplate.substring( - promptIndex + promptMarker.length, - ); + promptIndex + promptMarker.length + ) // Return the split parts - return { system_prompt, user_prompt, ai_prompt }; + return { system_prompt, user_prompt, ai_prompt } } else if (promptTemplate.includes(promptMarker)) { // Extract the parts of the string for the case where only promptMarker is present - const promptIndex = promptTemplate.indexOf(promptMarker); - const user_prompt = promptTemplate.substring(0, promptIndex); + const promptIndex = promptTemplate.indexOf(promptMarker) + const user_prompt = promptTemplate.substring(0, promptIndex) const ai_prompt = promptTemplate.substring( - promptIndex + promptMarker.length, - ); + promptIndex + promptMarker.length + ) // Return the split parts - return { user_prompt, ai_prompt }; + return { user_prompt, ai_prompt } } // Return an error if none of the conditions are met - return { error: "Cannot split prompt template" }; + return { error: 'Cannot split prompt template' } } /** @@ -210,13 +222,13 @@ function promptTemplateConverter(promptTemplate: string): PromptTemplate { */ function loadLLMModel(settings: any): Promise 
{ if (!settings?.ngl) { - settings.ngl = 100; + settings.ngl = 100 } - log(`[NITRO]::Debug: Loading model with params ${JSON.stringify(settings)}`); + log(`[NITRO]::Debug: Loading model with params ${JSON.stringify(settings)}`) return fetchRetry(NITRO_HTTP_LOAD_MODEL_URL, { - method: "POST", + method: 'POST', headers: { - "Content-Type": "application/json", + 'Content-Type': 'application/json', }, body: JSON.stringify(settings), retries: 3, @@ -225,15 +237,15 @@ function loadLLMModel(settings: any): Promise { .then((res) => { log( `[NITRO]::Debug: Load model success with response ${JSON.stringify( - res, - )}`, - ); - return Promise.resolve(res); + res + )}` + ) + return Promise.resolve(res) }) .catch((err) => { - log(`[NITRO]::Error: Load model failed with error ${err}`); - return Promise.reject(err); - }); + log(`[NITRO]::Error: Load model failed with error ${err}`) + return Promise.reject(err) + }) } /** @@ -246,9 +258,9 @@ async function validateModelStatus(): Promise { // Send a GET request to the validation URL. // Retry the request up to 3 times if it fails, with a delay of 500 milliseconds between retries. return fetchRetry(NITRO_HTTP_VALIDATE_MODEL_URL, { - method: "GET", + method: 'GET', headers: { - "Content-Type": "application/json", + 'Content-Type': 'application/json', }, retries: 5, retryDelay: 500, @@ -257,10 +269,10 @@ async function validateModelStatus(): Promise { `[NITRO]::Debug: Validate model state with response ${JSON.stringify( res.status )}` - ); + ) // If the response is OK, check model_loaded status. if (res.ok) { - const body = await res.json(); + const body = await res.json() // If the model is loaded, return an empty object. // Otherwise, return an object with an error message. 
if (body.model_loaded) { @@ -268,17 +280,17 @@ async function validateModelStatus(): Promise { `[NITRO]::Debug: Validate model state success with response ${JSON.stringify( body )}` - ); - return Promise.resolve(); + ) + return Promise.resolve() } } log( `[NITRO]::Debug: Validate model state failed with response ${JSON.stringify( res.statusText )}` - ); - return Promise.reject("Validate model status failed"); - }); + ) + return Promise.reject('Validate model status failed') + }) } /** @@ -286,21 +298,27 @@ async function validateModelStatus(): Promise { * @returns A Promise that resolves when the subprocess is terminated successfully, or rejects with an error message if the subprocess fails to terminate. */ async function killSubprocess(): Promise { - const controller = new AbortController(); - setTimeout(() => controller.abort(), 5000); - log(`[NITRO]::Debug: Request to kill Nitro`); + const controller = new AbortController() + setTimeout(() => controller.abort(), 5000) + log(`[NITRO]::Debug: Request to kill Nitro`) return fetch(NITRO_HTTP_KILL_URL, { - method: "DELETE", + method: 'DELETE', signal: controller.signal, }) .then(() => { - subprocess?.kill(); - subprocess = undefined; + subprocess?.kill() + subprocess = undefined }) - .catch(() => {}) + .catch(() => {}) // Do nothing with this attempt .then(() => tcpPortUsed.waitUntilFree(PORT, 300, 5000)) - .then(() => log(`[NITRO]::Debug: Nitro process is terminated`)); + .then(() => log(`[NITRO]::Debug: Nitro process is terminated`)) + .catch((err) => { + log( + `[NITRO]::Debug: Could not kill running process on port ${PORT}. Might be another process running on the same port? ${err}` + ) + throw 'PORT_NOT_AVAILABLE' + }) } /** @@ -308,49 +326,53 @@ async function killSubprocess(): Promise { * @returns A promise that resolves when the Nitro subprocess is started. 
*/ function spawnNitroProcess(): Promise { - log(`[NITRO]::Debug: Spawning Nitro subprocess...`); + log(`[NITRO]::Debug: Spawning Nitro subprocess...`) return new Promise(async (resolve, reject) => { - let binaryFolder = path.join(__dirname, "..", "bin"); // Current directory by default - let executableOptions = executableNitroFile(); + let binaryFolder = path.join(__dirname, '..', 'bin') // Current directory by default + let executableOptions = executableNitroFile() - const args: string[] = ["1", LOCAL_HOST, PORT.toString()]; + const args: string[] = ['1', LOCAL_HOST, PORT.toString()] // Execute the binary log( - `[NITRO]::Debug: Spawn nitro at path: ${executableOptions.executablePath}, and args: ${args}`, - ); + `[NITRO]::Debug: Spawn nitro at path: ${executableOptions.executablePath}, and args: ${args}` + ) subprocess = spawn( executableOptions.executablePath, - ["1", LOCAL_HOST, PORT.toString()], + ['1', LOCAL_HOST, PORT.toString()], { cwd: binaryFolder, env: { ...process.env, CUDA_VISIBLE_DEVICES: executableOptions.cudaVisibleDevices, + // Vulkan - Support 1 device at a time for now + ...(executableOptions.vkVisibleDevices?.length > 0 && { + GGML_VULKAN_DEVICE: executableOptions.vkVisibleDevices[0], + }), }, - }, - ); + } + ) // Handle subprocess output - subprocess.stdout.on("data", (data: any) => { - log(`[NITRO]::Debug: ${data}`); - }); + subprocess.stdout.on('data', (data: any) => { + log(`[NITRO]::Debug: ${data}`) + }) - subprocess.stderr.on("data", (data: any) => { - log(`[NITRO]::Error: ${data}`); - }); + subprocess.stderr.on('data', (data: any) => { + log(`[NITRO]::Error: ${data}`) + }) - subprocess.on("close", (code: any) => { - log(`[NITRO]::Debug: Nitro exited with code: ${code}`); - subprocess = undefined; - reject(`child process exited with code ${code}`); - }); + subprocess.on('close', (code: any) => { + log(`[NITRO]::Debug: Nitro exited with code: ${code}`) + subprocess = undefined + reject(`child process exited with code ${code}`) + }) 
tcpPortUsed.waitUntilUsed(PORT, 300, 30000).then(() => { - log(`[NITRO]::Debug: Nitro is ready`); - resolve(); - }); - }); + log(`[NITRO]::Debug: Nitro is ready`) + resolve() + }) + }) } /** @@ -360,7 +382,7 @@ function spawnNitroProcess(): Promise { */ function dispose() { // clean other registered resources here - killSubprocess(); + killSubprocess() } export default { @@ -370,4 +392,4 @@ export default { dispose, updateNvidiaInfo, getCurrentNitroProcessInfo: () => getNitroProcessInfo(subprocess), -}; +} diff --git a/extensions/inference-nitro-extension/src/node/nvidia.ts b/extensions/inference-nitro-extension/src/node/nvidia.ts deleted file mode 100644 index 13e43290b6..0000000000 --- a/extensions/inference-nitro-extension/src/node/nvidia.ts +++ /dev/null @@ -1,200 +0,0 @@ -import { writeFileSync, existsSync, readFileSync } from "fs"; -import { exec } from "child_process"; -import path from "path"; -import { getJanDataFolderPath } from "@janhq/core/node"; - -/** - * Default GPU settings - **/ -const DEFALT_SETTINGS = { - notify: true, - run_mode: "cpu", - nvidia_driver: { - exist: false, - version: "", - }, - cuda: { - exist: false, - version: "", - }, - gpus: [], - gpu_highest_vram: "", -}; - -/** - * Path to the settings file - **/ -export const NVIDIA_INFO_FILE = path.join( - getJanDataFolderPath(), - "settings", - "settings.json" -); - -/** - * Current nitro process - */ -let nitroProcessInfo: NitroProcessInfo | undefined = undefined; - -/** - * Nitro process info - */ -export interface NitroProcessInfo { - isRunning: boolean; -} - -/** - * This will retrive GPU informations and persist settings.json - * Will be called when the extension is loaded to turn on GPU acceleration if supported - */ -export async function updateNvidiaInfo() { - if (process.platform !== "darwin") { - await Promise.all([ - updateNvidiaDriverInfo(), - updateCudaExistence(), - updateGpuInfo(), - ]); - } -} - -/** - * Retrieve current nitro process - */ -export const getNitroProcessInfo 
= (subprocess: any): NitroProcessInfo => { - nitroProcessInfo = { - isRunning: subprocess != null, - }; - return nitroProcessInfo; -}; - -/** - * Validate nvidia and cuda for linux and windows - */ -export async function updateNvidiaDriverInfo(): Promise { - exec( - "nvidia-smi --query-gpu=driver_version --format=csv,noheader", - (error, stdout) => { - let data; - try { - data = JSON.parse(readFileSync(NVIDIA_INFO_FILE, "utf-8")); - } catch (error) { - data = DEFALT_SETTINGS; - } - - if (!error) { - const firstLine = stdout.split("\n")[0].trim(); - data["nvidia_driver"].exist = true; - data["nvidia_driver"].version = firstLine; - } else { - data["nvidia_driver"].exist = false; - } - - writeFileSync(NVIDIA_INFO_FILE, JSON.stringify(data, null, 2)); - Promise.resolve(); - } - ); -} - -/** - * Check if file exists in paths - */ -export function checkFileExistenceInPaths( - file: string, - paths: string[] -): boolean { - return paths.some((p) => existsSync(path.join(p, file))); -} - -/** - * Validate cuda for linux and windows - */ -export function updateCudaExistence() { - let filesCuda12: string[]; - let filesCuda11: string[]; - let paths: string[]; - let cudaVersion: string = ""; - - if (process.platform === "win32") { - filesCuda12 = ["cublas64_12.dll", "cudart64_12.dll", "cublasLt64_12.dll"]; - filesCuda11 = ["cublas64_11.dll", "cudart64_11.dll", "cublasLt64_11.dll"]; - paths = process.env.PATH ? process.env.PATH.split(path.delimiter) : []; - } else { - filesCuda12 = ["libcudart.so.12", "libcublas.so.12", "libcublasLt.so.12"]; - filesCuda11 = ["libcudart.so.11.0", "libcublas.so.11", "libcublasLt.so.11"]; - paths = process.env.LD_LIBRARY_PATH - ? 
process.env.LD_LIBRARY_PATH.split(path.delimiter) - : []; - paths.push("/usr/lib/x86_64-linux-gnu/"); - } - - let cudaExists = filesCuda12.every( - (file) => existsSync(file) || checkFileExistenceInPaths(file, paths) - ); - - if (!cudaExists) { - cudaExists = filesCuda11.every( - (file) => existsSync(file) || checkFileExistenceInPaths(file, paths) - ); - if (cudaExists) { - cudaVersion = "11"; - } - } else { - cudaVersion = "12"; - } - - let data; - try { - data = JSON.parse(readFileSync(NVIDIA_INFO_FILE, "utf-8")); - } catch (error) { - data = DEFALT_SETTINGS; - } - - data["cuda"].exist = cudaExists; - data["cuda"].version = cudaVersion; - if (cudaExists) { - data.run_mode = "gpu"; - } - writeFileSync(NVIDIA_INFO_FILE, JSON.stringify(data, null, 2)); -} - -/** - * Get GPU information - */ -export async function updateGpuInfo(): Promise { - exec( - "nvidia-smi --query-gpu=index,memory.total --format=csv,noheader,nounits", - (error, stdout) => { - let data; - try { - data = JSON.parse(readFileSync(NVIDIA_INFO_FILE, "utf-8")); - } catch (error) { - data = DEFALT_SETTINGS; - } - - if (!error) { - // Get GPU info and gpu has higher memory first - let highestVram = 0; - let highestVramId = "0"; - let gpus = stdout - .trim() - .split("\n") - .map((line) => { - let [id, vram] = line.split(", "); - vram = vram.replace(/\r/g, ""); - if (parseFloat(vram) > highestVram) { - highestVram = parseFloat(vram); - highestVramId = id; - } - return { id, vram }; - }); - - data["gpus"] = gpus; - data["gpu_highest_vram"] = highestVramId; - } else { - data["gpus"] = []; - } - - writeFileSync(NVIDIA_INFO_FILE, JSON.stringify(data, null, 2)); - Promise.resolve(); - } - ); -} diff --git a/extensions/inference-openai-extension/package.json b/extensions/inference-openai-extension/package.json index 5fa0ce974f..5efdbf874f 100644 --- a/extensions/inference-openai-extension/package.json +++ b/extensions/inference-openai-extension/package.json @@ -8,7 +8,7 @@ "license": "AGPL-3.0", "scripts": { 
"build": "tsc -b . && webpack --config webpack.config.js", - "build:publish": "rimraf *.tgz --glob && npm run build && npm pack && cpx *.tgz ../../electron/pre-install" + "build:publish": "rimraf *.tgz --glob && npm run build && npm pack && cpx *.tgz ../../pre-install" }, "exports": { ".": "./dist/index.js", @@ -18,13 +18,13 @@ "cpx": "^1.5.0", "rimraf": "^3.0.2", "webpack": "^5.88.2", - "webpack-cli": "^5.1.4" + "webpack-cli": "^5.1.4", + "ts-loader": "^9.5.0" }, "dependencies": { "@janhq/core": "file:../../core", "fetch-retry": "^5.0.6", "path-browserify": "^1.0.1", - "ts-loader": "^9.5.0", "ulid": "^2.3.0" }, "engines": { diff --git a/extensions/inference-openai-extension/src/@types/global.d.ts b/extensions/inference-openai-extension/src/@types/global.d.ts index 84f86c1458..a49bb5a2f2 100644 --- a/extensions/inference-openai-extension/src/@types/global.d.ts +++ b/extensions/inference-openai-extension/src/@types/global.d.ts @@ -1,26 +1,26 @@ -declare const MODULE: string; -declare const OPENAI_DOMAIN: string; +declare const MODULE: string +declare const OPENAI_DOMAIN: string declare interface EngineSettings { - full_url?: string; - api_key?: string; + full_url?: string + api_key?: string } enum OpenAIChatCompletionModelName { - "gpt-3.5-turbo-instruct" = "gpt-3.5-turbo-instruct", - "gpt-3.5-turbo-instruct-0914" = "gpt-3.5-turbo-instruct-0914", - "gpt-4-1106-preview" = "gpt-4-1106-preview", - "gpt-3.5-turbo-0613" = "gpt-3.5-turbo-0613", - "gpt-3.5-turbo-0301" = "gpt-3.5-turbo-0301", - "gpt-3.5-turbo" = "gpt-3.5-turbo", - "gpt-3.5-turbo-16k-0613" = "gpt-3.5-turbo-16k-0613", - "gpt-3.5-turbo-1106" = "gpt-3.5-turbo-1106", - "gpt-4-vision-preview" = "gpt-4-vision-preview", - "gpt-4" = "gpt-4", - "gpt-4-0314" = "gpt-4-0314", - "gpt-4-0613" = "gpt-4-0613", + 'gpt-3.5-turbo-instruct' = 'gpt-3.5-turbo-instruct', + 'gpt-3.5-turbo-instruct-0914' = 'gpt-3.5-turbo-instruct-0914', + 'gpt-4-1106-preview' = 'gpt-4-1106-preview', + 'gpt-3.5-turbo-0613' = 'gpt-3.5-turbo-0613', + 
'gpt-3.5-turbo-0301' = 'gpt-3.5-turbo-0301', + 'gpt-3.5-turbo' = 'gpt-3.5-turbo', + 'gpt-3.5-turbo-16k-0613' = 'gpt-3.5-turbo-16k-0613', + 'gpt-3.5-turbo-1106' = 'gpt-3.5-turbo-1106', + 'gpt-4-vision-preview' = 'gpt-4-vision-preview', + 'gpt-4' = 'gpt-4', + 'gpt-4-0314' = 'gpt-4-0314', + 'gpt-4-0613' = 'gpt-4-0613', } -declare type OpenAIModel = Omit & { - id: OpenAIChatCompletionModelName; -}; +declare type OpenAIModel = Omit & { + id: OpenAIChatCompletionModelName +} diff --git a/extensions/inference-openai-extension/src/helpers/sse.ts b/extensions/inference-openai-extension/src/helpers/sse.ts index fb75816e7e..11db382827 100644 --- a/extensions/inference-openai-extension/src/helpers/sse.ts +++ b/extensions/inference-openai-extension/src/helpers/sse.ts @@ -1,4 +1,4 @@ -import { Observable } from "rxjs"; +import { Observable } from 'rxjs' /** * Sends a request to the inference server to generate a response based on the recent messages. @@ -14,26 +14,26 @@ export function requestInference( controller?: AbortController ): Observable { return new Observable((subscriber) => { - let model_id: string = model.id; + let model_id: string = model.id if (engine.full_url.includes(OPENAI_DOMAIN)) { - model_id = engine.full_url.split("/")[5]; + model_id = engine.full_url.split('/')[5] } const requestBody = JSON.stringify({ messages: recentMessages, stream: true, model: model_id, ...model.parameters, - }); + }) fetch(`${engine.full_url}`, { - method: "POST", + method: 'POST', headers: { - "Content-Type": "application/json", - Accept: model.parameters.stream - ? "text/event-stream" - : "application/json", - "Access-Control-Allow-Origin": "*", - Authorization: `Bearer ${engine.api_key}`, - "api-key": `${engine.api_key}`, + 'Content-Type': 'application/json', + 'Accept': model.parameters.stream + ? 
'text/event-stream' + : 'application/json', + 'Access-Control-Allow-Origin': '*', + 'Authorization': `Bearer ${engine.api_key}`, + 'api-key': `${engine.api_key}`, }, body: requestBody, signal: controller?.signal, @@ -41,41 +41,41 @@ export function requestInference( .then(async (response) => { if (!response.ok) { subscriber.next( - (await response.json()).error?.message ?? "Error occured" - ); - subscriber.complete(); - return; + (await response.json()).error?.message ?? 'Error occurred.' + ) + subscriber.complete() + return } if (model.parameters.stream === false) { - const data = await response.json(); - subscriber.next(data.choices[0]?.message?.content ?? ""); + const data = await response.json() + subscriber.next(data.choices[0]?.message?.content ?? '') } else { - const stream = response.body; - const decoder = new TextDecoder("utf-8"); - const reader = stream?.getReader(); - let content = ""; + const stream = response.body + const decoder = new TextDecoder('utf-8') + const reader = stream?.getReader() + let content = '' while (true && reader) { - const { done, value } = await reader.read(); + const { done, value } = await reader.read() if (done) { - break; + break } - const text = decoder.decode(value); - const lines = text.trim().split("\n"); + const text = decoder.decode(value) + const lines = text.trim().split('\n') for (const line of lines) { - if (line.startsWith("data: ") && !line.includes("data: [DONE]")) { - const data = JSON.parse(line.replace("data: ", "")); - content += data.choices[0]?.delta?.content ?? ""; - if (content.startsWith("assistant: ")) { - content = content.replace("assistant: ", ""); + if (line.startsWith('data: ') && !line.includes('data: [DONE]')) { + const data = JSON.parse(line.replace('data: ', '')) + content += data.choices[0]?.delta?.content ?? 
'' + if (content.startsWith('assistant: ')) { + content = content.replace('assistant: ', '') } - subscriber.next(content); + subscriber.next(content) } } } } - subscriber.complete(); + subscriber.complete() }) - .catch((err) => subscriber.error(err)); - }); + .catch((err) => subscriber.error(err)) + }) } diff --git a/extensions/inference-openai-extension/src/index.ts b/extensions/inference-openai-extension/src/index.ts index fd1230bc7e..4811717421 100644 --- a/extensions/inference-openai-extension/src/index.ts +++ b/extensions/inference-openai-extension/src/index.ts @@ -18,14 +18,15 @@ import { InferenceEngine, BaseExtension, MessageEvent, + MessageRequestType, ModelEvent, InferenceEvent, AppConfigurationEventName, joinPath, -} from "@janhq/core"; -import { requestInference } from "./helpers/sse"; -import { ulid } from "ulid"; -import { join } from "path"; +} from '@janhq/core' +import { requestInference } from './helpers/sse' +import { ulid } from 'ulid' +import { join } from 'path' /** * A class that implements the InferenceExtension interface from the @janhq/core package. @@ -33,18 +34,18 @@ import { join } from "path"; * It also subscribes to events emitted by the @janhq/core package and handles new message requests. 
*/ export default class JanInferenceOpenAIExtension extends BaseExtension { - private static readonly _engineDir = "file://engines"; - private static readonly _engineMetadataFileName = "openai.json"; + private static readonly _engineDir = 'file://engines' + private static readonly _engineMetadataFileName = 'openai.json' - private static _currentModel: OpenAIModel; + private static _currentModel: OpenAIModel private static _engineSettings: EngineSettings = { - full_url: "https://api.openai.com/v1/chat/completions", - api_key: "sk-", - }; + full_url: 'https://api.openai.com/v1/chat/completions', + api_key: 'sk-', + } - controller = new AbortController(); - isCancelled = false; + controller = new AbortController() + isCancelled = false /** * Subscribes to events emitted by the @janhq/core package. @@ -53,40 +54,40 @@ export default class JanInferenceOpenAIExtension extends BaseExtension { if (!(await fs.existsSync(JanInferenceOpenAIExtension._engineDir))) { await fs .mkdirSync(JanInferenceOpenAIExtension._engineDir) - .catch((err) => console.debug(err)); + .catch((err) => console.debug(err)) } - JanInferenceOpenAIExtension.writeDefaultEngineSettings(); + JanInferenceOpenAIExtension.writeDefaultEngineSettings() // Events subscription events.on(MessageEvent.OnMessageSent, (data) => - JanInferenceOpenAIExtension.handleMessageRequest(data, this), - ); + JanInferenceOpenAIExtension.handleMessageRequest(data, this) + ) events.on(ModelEvent.OnModelInit, (model: OpenAIModel) => { - JanInferenceOpenAIExtension.handleModelInit(model); - }); + JanInferenceOpenAIExtension.handleModelInit(model) + }) events.on(ModelEvent.OnModelStop, (model: OpenAIModel) => { - JanInferenceOpenAIExtension.handleModelStop(model); - }); + JanInferenceOpenAIExtension.handleModelStop(model) + }) events.on(InferenceEvent.OnInferenceStopped, () => { - JanInferenceOpenAIExtension.handleInferenceStopped(this); - }); + JanInferenceOpenAIExtension.handleInferenceStopped(this) + }) const settingsFilePath = 
await joinPath([ JanInferenceOpenAIExtension._engineDir, JanInferenceOpenAIExtension._engineMetadataFileName, - ]); + ]) events.on( AppConfigurationEventName.OnConfigurationUpdate, (settingsKey: string) => { // Update settings on changes if (settingsKey === settingsFilePath) - JanInferenceOpenAIExtension.writeDefaultEngineSettings(); - }, - ); + JanInferenceOpenAIExtension.writeDefaultEngineSettings() + } + ) } /** @@ -98,45 +99,45 @@ export default class JanInferenceOpenAIExtension extends BaseExtension { try { const engineFile = join( JanInferenceOpenAIExtension._engineDir, - JanInferenceOpenAIExtension._engineMetadataFileName, - ); + JanInferenceOpenAIExtension._engineMetadataFileName + ) if (await fs.existsSync(engineFile)) { - const engine = await fs.readFileSync(engineFile, "utf-8"); + const engine = await fs.readFileSync(engineFile, 'utf-8') JanInferenceOpenAIExtension._engineSettings = - typeof engine === "object" ? engine : JSON.parse(engine); + typeof engine === 'object' ? engine : JSON.parse(engine) } else { await fs.writeFileSync( engineFile, - JSON.stringify(JanInferenceOpenAIExtension._engineSettings, null, 2), - ); + JSON.stringify(JanInferenceOpenAIExtension._engineSettings, null, 2) + ) } } catch (err) { - console.error(err); + console.error(err) } } private static async handleModelInit(model: OpenAIModel) { if (model.engine !== InferenceEngine.openai) { - return; + return } else { - JanInferenceOpenAIExtension._currentModel = model; - JanInferenceOpenAIExtension.writeDefaultEngineSettings(); + JanInferenceOpenAIExtension._currentModel = model + JanInferenceOpenAIExtension.writeDefaultEngineSettings() // Todo: Check model list with API key - events.emit(ModelEvent.OnModelReady, model); + events.emit(ModelEvent.OnModelReady, model) } } private static async handleModelStop(model: OpenAIModel) { - if (model.engine !== "openai") { - return; + if (model.engine !== 'openai') { + return } - events.emit(ModelEvent.OnModelStopped, model); + 
events.emit(ModelEvent.OnModelStopped, model) } private static async handleInferenceStopped( - instance: JanInferenceOpenAIExtension, + instance: JanInferenceOpenAIExtension ) { - instance.isCancelled = true; - instance.controller?.abort(); + instance.isCancelled = true + instance.controller?.abort() } /** @@ -147,28 +148,32 @@ export default class JanInferenceOpenAIExtension extends BaseExtension { */ private static async handleMessageRequest( data: MessageRequest, - instance: JanInferenceOpenAIExtension, + instance: JanInferenceOpenAIExtension ) { - if (data.model.engine !== "openai") { - return; + if (data.model.engine !== 'openai') { + return } - const timestamp = Date.now(); + const timestamp = Date.now() const message: ThreadMessage = { id: ulid(), thread_id: data.threadId, + type: data.type, assistant_id: data.assistantId, role: ChatCompletionRole.Assistant, content: [], status: MessageStatus.Pending, created: timestamp, updated: timestamp, - object: "thread.message", - }; - events.emit(MessageEvent.OnMessageResponse, message); + object: 'thread.message', + } - instance.isCancelled = false; - instance.controller = new AbortController(); + if (data.type !== MessageRequestType.Summary) { + events.emit(MessageEvent.OnMessageResponse, message) + } + + instance.isCancelled = false + instance.controller = new AbortController() requestInference( data?.messages ?? 
[], @@ -177,7 +182,7 @@ export default class JanInferenceOpenAIExtension extends BaseExtension { ...JanInferenceOpenAIExtension._currentModel, parameters: data.model.parameters, }, - instance.controller, + instance.controller ).subscribe({ next: (content) => { const messageContent: ThreadContent = { @@ -186,33 +191,33 @@ export default class JanInferenceOpenAIExtension extends BaseExtension { value: content.trim(), annotations: [], }, - }; - message.content = [messageContent]; - events.emit(MessageEvent.OnMessageUpdate, message); + } + message.content = [messageContent] + events.emit(MessageEvent.OnMessageUpdate, message) }, complete: async () => { message.status = message.content.length ? MessageStatus.Ready - : MessageStatus.Error; - events.emit(MessageEvent.OnMessageUpdate, message); + : MessageStatus.Error + events.emit(MessageEvent.OnMessageUpdate, message) }, error: async (err) => { if (instance.isCancelled || message.content.length > 0) { - message.status = MessageStatus.Stopped; - events.emit(MessageEvent.OnMessageUpdate, message); - return; + message.status = MessageStatus.Stopped + events.emit(MessageEvent.OnMessageUpdate, message) + return } const messageContent: ThreadContent = { type: ContentType.Text, text: { - value: "Error occurred: " + err.message, + value: 'Error occurred: ' + err.message, annotations: [], }, - }; - message.content = [messageContent]; - message.status = MessageStatus.Error; - events.emit(MessageEvent.OnMessageUpdate, message); + } + message.content = [messageContent] + message.status = MessageStatus.Error + events.emit(MessageEvent.OnMessageUpdate, message) }, - }); + }) } } diff --git a/extensions/inference-openai-extension/tsconfig.json b/extensions/inference-openai-extension/tsconfig.json index 7bfdd90096..2477d58ce5 100644 --- a/extensions/inference-openai-extension/tsconfig.json +++ b/extensions/inference-openai-extension/tsconfig.json @@ -8,7 +8,7 @@ "forceConsistentCasingInFileNames": true, "strict": false, "skipLibCheck": 
true, - "rootDir": "./src", + "rootDir": "./src" }, - "include": ["./src"], + "include": ["./src"] } diff --git a/extensions/inference-openai-extension/webpack.config.js b/extensions/inference-openai-extension/webpack.config.js index 72b7d90c10..ee2e3b6243 100644 --- a/extensions/inference-openai-extension/webpack.config.js +++ b/extensions/inference-openai-extension/webpack.config.js @@ -1,16 +1,16 @@ -const path = require("path"); -const webpack = require("webpack"); -const packageJson = require("./package.json"); +const path = require('path') +const webpack = require('webpack') +const packageJson = require('./package.json') module.exports = { experiments: { outputModule: true }, - entry: "./src/index.ts", // Adjust the entry point to match your project's main file - mode: "production", + entry: './src/index.ts', // Adjust the entry point to match your project's main file + mode: 'production', module: { rules: [ { test: /\.tsx?$/, - use: "ts-loader", + use: 'ts-loader', exclude: /node_modules/, }, ], @@ -18,22 +18,22 @@ module.exports = { plugins: [ new webpack.DefinePlugin({ MODULE: JSON.stringify(`${packageJson.name}/${packageJson.module}`), - OPENAI_DOMAIN: JSON.stringify("openai.azure.com"), + OPENAI_DOMAIN: JSON.stringify('openai.azure.com'), }), ], output: { - filename: "index.js", // Adjust the output file name as needed - path: path.resolve(__dirname, "dist"), - library: { type: "module" }, // Specify ESM output format + filename: 'index.js', // Adjust the output file name as needed + path: path.resolve(__dirname, 'dist'), + library: { type: 'module' }, // Specify ESM output format }, resolve: { - extensions: [".ts", ".js"], + extensions: ['.ts', '.js'], fallback: { - path: require.resolve("path-browserify"), + path: require.resolve('path-browserify'), }, }, optimization: { minimize: false, }, // Add loaders and other configuration as needed for your project -}; +} diff --git a/extensions/inference-triton-trtllm-extension/package.json 
b/extensions/inference-triton-trtllm-extension/package.json index 1d27f9f188..455f8030e2 100644 --- a/extensions/inference-triton-trtllm-extension/package.json +++ b/extensions/inference-triton-trtllm-extension/package.json @@ -8,7 +8,7 @@ "license": "AGPL-3.0", "scripts": { "build": "tsc -b . && webpack --config webpack.config.js", - "build:publish": "rimraf *.tgz --glob && npm run build && npm pack && cpx *.tgz ../../electron/pre-install" + "build:publish": "rimraf *.tgz --glob && npm run build && npm pack && cpx *.tgz ../../pre-install" }, "exports": { ".": "./dist/index.js", @@ -18,13 +18,13 @@ "cpx": "^1.5.0", "rimraf": "^3.0.2", "webpack": "^5.88.2", - "webpack-cli": "^5.1.4" + "webpack-cli": "^5.1.4", + "ts-loader": "^9.5.0" }, "dependencies": { "@janhq/core": "file:../../core", "fetch-retry": "^5.0.6", "path-browserify": "^1.0.1", - "ts-loader": "^9.5.0", "ulid": "^2.3.0", "rxjs": "^7.8.1" }, diff --git a/extensions/inference-triton-trtllm-extension/src/@types/global.d.ts b/extensions/inference-triton-trtllm-extension/src/@types/global.d.ts index 6224b8e68c..c834feba01 100644 --- a/extensions/inference-triton-trtllm-extension/src/@types/global.d.ts +++ b/extensions/inference-triton-trtllm-extension/src/@types/global.d.ts @@ -1,5 +1,5 @@ -import { Model } from "@janhq/core"; +import { Model } from '@janhq/core' declare interface EngineSettings { - base_url?: string; + base_url?: string } diff --git a/extensions/inference-triton-trtllm-extension/src/helpers/sse.ts b/extensions/inference-triton-trtllm-extension/src/helpers/sse.ts index da20fa32d9..9aff612654 100644 --- a/extensions/inference-triton-trtllm-extension/src/helpers/sse.ts +++ b/extensions/inference-triton-trtllm-extension/src/helpers/sse.ts @@ -1,6 +1,6 @@ -import { Observable } from "rxjs"; -import { EngineSettings } from "../@types/global"; -import { Model } from "@janhq/core"; +import { Observable } from 'rxjs' +import { EngineSettings } from '../@types/global' +import { Model } from 
'@janhq/core' /** * Sends a request to the inference server to generate a response based on the recent messages. @@ -16,48 +16,48 @@ export function requestInference( controller?: AbortController ): Observable { return new Observable((subscriber) => { - const text_input = recentMessages.map((message) => message.text).join("\n"); + const text_input = recentMessages.map((message) => message.text).join('\n') const requestBody = JSON.stringify({ text_input: text_input, max_tokens: 4096, temperature: 0, - bad_words: "", - stop_words: "[DONE]", - stream: true - }); + bad_words: '', + stop_words: '[DONE]', + stream: true, + }) fetch(`${engine.base_url}/v2/models/ensemble/generate_stream`, { - method: "POST", + method: 'POST', headers: { - "Content-Type": "application/json", - Accept: "text/event-stream", - "Access-Control-Allow-Origin": "*", + 'Content-Type': 'application/json', + 'Accept': 'text/event-stream', + 'Access-Control-Allow-Origin': '*', }, body: requestBody, signal: controller?.signal, }) .then(async (response) => { - const stream = response.body; - const decoder = new TextDecoder("utf-8"); - const reader = stream?.getReader(); - let content = ""; + const stream = response.body + const decoder = new TextDecoder('utf-8') + const reader = stream?.getReader() + let content = '' while (true && reader) { - const { done, value } = await reader.read(); + const { done, value } = await reader.read() if (done) { - break; + break } - const text = decoder.decode(value); - const lines = text.trim().split("\n"); + const text = decoder.decode(value) + const lines = text.trim().split('\n') for (const line of lines) { - if (line.startsWith("data: ") && !line.includes("data: [DONE]")) { - const data = JSON.parse(line.replace("data: ", "")); - content += data.choices[0]?.delta?.content ?? 
""; - subscriber.next(content); + if (line.startsWith('data: ') && !line.includes('data: [DONE]')) { + const data = JSON.parse(line.replace('data: ', '')) + content += data.choices[0]?.delta?.content ?? '' + subscriber.next(content) } } } - subscriber.complete(); + subscriber.complete() }) - .catch((err) => subscriber.error(err)); - }); + .catch((err) => subscriber.error(err)) + }) } diff --git a/extensions/inference-triton-trtllm-extension/src/index.ts b/extensions/inference-triton-trtllm-extension/src/index.ts index 11ddf78933..f009a81e03 100644 --- a/extensions/inference-triton-trtllm-extension/src/index.ts +++ b/extensions/inference-triton-trtllm-extension/src/index.ts @@ -20,51 +20,49 @@ import { BaseExtension, MessageEvent, ModelEvent, -} from "@janhq/core"; -import { requestInference } from "./helpers/sse"; -import { ulid } from "ulid"; -import { join } from "path"; -import { EngineSettings } from "./@types/global"; +} from '@janhq/core' +import { requestInference } from './helpers/sse' +import { ulid } from 'ulid' +import { join } from 'path' +import { EngineSettings } from './@types/global' /** * A class that implements the InferenceExtension interface from the @janhq/core package. * The class provides methods for initializing and stopping a model, and for making inference requests. * It also subscribes to events emitted by the @janhq/core package and handles new message requests. 
*/ -export default class JanInferenceTritonTrtLLMExtension - extends BaseExtension -{ - private static readonly _homeDir = "file://engines"; - private static readonly _engineMetadataFileName = "triton_trtllm.json"; +export default class JanInferenceTritonTrtLLMExtension extends BaseExtension { + private static readonly _homeDir = 'file://engines' + private static readonly _engineMetadataFileName = 'triton_trtllm.json' - static _currentModel: Model; + static _currentModel: Model static _engineSettings: EngineSettings = { - base_url: "", - }; + base_url: '', + } - controller = new AbortController(); - isCancelled = false; + controller = new AbortController() + isCancelled = false /** * Subscribes to events emitted by the @janhq/core package. */ async onLoad() { if (!(await fs.existsSync(JanInferenceTritonTrtLLMExtension._homeDir))) - JanInferenceTritonTrtLLMExtension.writeDefaultEngineSettings(); + JanInferenceTritonTrtLLMExtension.writeDefaultEngineSettings() // Events subscription events.on(MessageEvent.OnMessageSent, (data) => JanInferenceTritonTrtLLMExtension.handleMessageRequest(data, this) - ); + ) events.on(ModelEvent.OnModelInit, (model: Model) => { - JanInferenceTritonTrtLLMExtension.handleModelInit(model); - }); + JanInferenceTritonTrtLLMExtension.handleModelInit(model) + }) events.on(ModelEvent.OnModelStop, (model: Model) => { - JanInferenceTritonTrtLLMExtension.handleModelStop(model); - }); + JanInferenceTritonTrtLLMExtension.handleModelStop(model) + }) } /** @@ -81,7 +79,7 @@ export default class JanInferenceTritonTrtLLMExtension modelId: string, settings?: ModelSettingParams ): Promise { - return; + return } static async writeDefaultEngineSettings() { @@ -89,11 +87,11 @@ export default class JanInferenceTritonTrtLLMExtension const engine_json = join( JanInferenceTritonTrtLLMExtension._homeDir, JanInferenceTritonTrtLLMExtension._engineMetadataFileName - ); + ) if (await fs.existsSync(engine_json)) { - const engine = await fs.readFileSync(engine_json, 
"utf-8"); + const engine = await fs.readFileSync(engine_json, 'utf-8') JanInferenceTritonTrtLLMExtension._engineSettings = - typeof engine === "object" ? engine : JSON.parse(engine); + typeof engine === 'object' ? engine : JSON.parse(engine) } else { await fs.writeFileSync( engine_json, @@ -102,10 +100,10 @@ export default class JanInferenceTritonTrtLLMExtension null, 2 ) - ); + ) } } catch (err) { - console.error(err); + console.error(err) } } /** @@ -119,26 +117,26 @@ export default class JanInferenceTritonTrtLLMExtension * @returns {Promise} A promise that resolves when the streaming is stopped. */ async stopInference(): Promise { - this.isCancelled = true; - this.controller?.abort(); + this.isCancelled = true + this.controller?.abort() } private static async handleModelInit(model: Model) { - if (model.engine !== "triton_trtllm") { - return; + if (model.engine !== 'triton_trtllm') { + return } else { - JanInferenceTritonTrtLLMExtension._currentModel = model; - JanInferenceTritonTrtLLMExtension.writeDefaultEngineSettings(); + JanInferenceTritonTrtLLMExtension._currentModel = model + JanInferenceTritonTrtLLMExtension.writeDefaultEngineSettings() // Todo: Check model list with API key - events.emit(ModelEvent.OnModelReady, model); + events.emit(ModelEvent.OnModelReady, model) } } private static async handleModelStop(model: Model) { - if (model.engine !== "triton_trtllm") { - return; + if (model.engine !== 'triton_trtllm') { + return } - events.emit(ModelEvent.OnModelStopped, model); + events.emit(ModelEvent.OnModelStopped, model) } /** @@ -151,11 +149,11 @@ export default class JanInferenceTritonTrtLLMExtension data: MessageRequest, instance: JanInferenceTritonTrtLLMExtension ) { - if (data.model.engine !== "triton_trtllm") { - return; + if (data.model.engine !== 'triton_trtllm') { + return } - const timestamp = Date.now(); + const timestamp = Date.now() const message: ThreadMessage = { id: ulid(), thread_id: data.threadId, @@ -165,12 +163,12 @@ export default 
class JanInferenceTritonTrtLLMExtension status: MessageStatus.Pending, created: timestamp, updated: timestamp, - object: "thread.message", - }; - events.emit(MessageEvent.OnMessageResponse, message); + object: 'thread.message', + } + events.emit(MessageEvent.OnMessageResponse, message) - instance.isCancelled = false; - instance.controller = new AbortController(); + instance.isCancelled = false + instance.controller = new AbortController() requestInference( data?.messages ?? [], @@ -188,33 +186,33 @@ export default class JanInferenceTritonTrtLLMExtension value: content.trim(), annotations: [], }, - }; - message.content = [messageContent]; - events.emit(MessageEvent.OnMessageUpdate, message); + } + message.content = [messageContent] + events.emit(MessageEvent.OnMessageUpdate, message) }, complete: async () => { message.status = message.content.length ? MessageStatus.Ready - : MessageStatus.Error; - events.emit(MessageEvent.OnMessageUpdate, message); + : MessageStatus.Error + events.emit(MessageEvent.OnMessageUpdate, message) }, error: async (err) => { if (instance.isCancelled || message.content.length) { - message.status = MessageStatus.Error; - events.emit(MessageEvent.OnMessageUpdate, message); - return; + message.status = MessageStatus.Error + events.emit(MessageEvent.OnMessageUpdate, message) + return } const messageContent: ThreadContent = { type: ContentType.Text, text: { - value: "Error occurred: " + err.message, + value: 'Error occurred: ' + err.message, annotations: [], }, - }; - message.content = [messageContent]; - message.status = MessageStatus.Ready; - events.emit(MessageEvent.OnMessageUpdate, message); + } + message.content = [messageContent] + message.status = MessageStatus.Ready + events.emit(MessageEvent.OnMessageUpdate, message) }, - }); + }) } } diff --git a/extensions/inference-triton-trtllm-extension/tsconfig.json b/extensions/inference-triton-trtllm-extension/tsconfig.json index 7bfdd90096..2477d58ce5 100644 --- 
a/extensions/inference-triton-trtllm-extension/tsconfig.json +++ b/extensions/inference-triton-trtllm-extension/tsconfig.json @@ -8,7 +8,7 @@ "forceConsistentCasingInFileNames": true, "strict": false, "skipLibCheck": true, - "rootDir": "./src", + "rootDir": "./src" }, - "include": ["./src"], + "include": ["./src"] } diff --git a/extensions/inference-triton-trtllm-extension/webpack.config.js b/extensions/inference-triton-trtllm-extension/webpack.config.js index 57a0adb0a2..e83370a1ac 100644 --- a/extensions/inference-triton-trtllm-extension/webpack.config.js +++ b/extensions/inference-triton-trtllm-extension/webpack.config.js @@ -1,16 +1,16 @@ -const path = require("path"); -const webpack = require("webpack"); -const packageJson = require("./package.json"); +const path = require('path') +const webpack = require('webpack') +const packageJson = require('./package.json') module.exports = { experiments: { outputModule: true }, - entry: "./src/index.ts", // Adjust the entry point to match your project's main file - mode: "production", + entry: './src/index.ts', // Adjust the entry point to match your project's main file + mode: 'production', module: { rules: [ { test: /\.tsx?$/, - use: "ts-loader", + use: 'ts-loader', exclude: /node_modules/, }, ], @@ -21,18 +21,18 @@ module.exports = { }), ], output: { - filename: "index.js", // Adjust the output file name as needed - path: path.resolve(__dirname, "dist"), - library: { type: "module" }, // Specify ESM output format + filename: 'index.js', // Adjust the output file name as needed + path: path.resolve(__dirname, 'dist'), + library: { type: 'module' }, // Specify ESM output format }, resolve: { - extensions: [".ts", ".js"], + extensions: ['.ts', '.js'], fallback: { - path: require.resolve("path-browserify"), + path: require.resolve('path-browserify'), }, }, optimization: { minimize: false, }, // Add loaders and other configuration as needed for your project -}; +} diff --git a/extensions/model-extension/.prettierrc 
b/extensions/model-extension/.prettierrc deleted file mode 100644 index 46f1abcb02..0000000000 --- a/extensions/model-extension/.prettierrc +++ /dev/null @@ -1,8 +0,0 @@ -{ - "semi": false, - "singleQuote": true, - "quoteProps": "consistent", - "trailingComma": "es5", - "endOfLine": "auto", - "plugins": ["prettier-plugin-tailwindcss"] -} diff --git a/extensions/model-extension/package.json b/extensions/model-extension/package.json index 86f177d149..e99122bcf6 100644 --- a/extensions/model-extension/package.json +++ b/extensions/model-extension/package.json @@ -1,6 +1,6 @@ { "name": "@janhq/model-extension", - "version": "1.0.23", + "version": "1.0.25", "description": "Model Management Extension provides model exploration and seamless downloads", "main": "dist/index.js", "module": "dist/module.js", @@ -8,13 +8,14 @@ "license": "AGPL-3.0", "scripts": { "build": "tsc -b . && webpack --config webpack.config.js", - "build:publish": "rimraf *.tgz --glob && npm run build && npm pack && cpx *.tgz ../../electron/pre-install" + "build:publish": "rimraf *.tgz --glob && npm run build && npm pack && cpx *.tgz ../../pre-install" }, "devDependencies": { "cpx": "^1.5.0", "rimraf": "^3.0.2", "webpack": "^5.88.2", - "webpack-cli": "^5.1.4" + "webpack-cli": "^5.1.4", + "ts-loader": "^9.5.0" }, "files": [ "dist/*", @@ -23,7 +24,6 @@ ], "dependencies": { "@janhq/core": "file:../../core", - "path-browserify": "^1.0.1", - "ts-loader": "^9.5.0" + "path-browserify": "^1.0.1" } } diff --git a/extensions/model-extension/src/@types/global.d.ts b/extensions/model-extension/src/@types/global.d.ts index e998455f2e..7a9202a627 100644 --- a/extensions/model-extension/src/@types/global.d.ts +++ b/extensions/model-extension/src/@types/global.d.ts @@ -1,3 +1,15 @@ -declare const EXTENSION_NAME: string -declare const MODULE_PATH: string -declare const VERSION: stringå +export {} +declare global { + declare const EXTENSION_NAME: string + declare const MODULE_PATH: string + declare const VERSION: string 
+ + interface Core { + api: APIFunctions + events: EventEmitter + } + interface Window { + core?: Core | undefined + electronAPI?: any | undefined + } +} diff --git a/extensions/model-extension/src/helpers/path.ts b/extensions/model-extension/src/helpers/path.ts new file mode 100644 index 0000000000..cbb151aa6c --- /dev/null +++ b/extensions/model-extension/src/helpers/path.ts @@ -0,0 +1,11 @@ +/** + * try to retrieve the download file name from the source url + */ + +export function extractFileName(url: string, fileExtension: string): string { + const extractedFileName = url.split('/').pop() + const fileName = extractedFileName.toLowerCase().endsWith(fileExtension) + ? extractedFileName + : extractedFileName + fileExtension + return fileName +} diff --git a/extensions/model-extension/src/index.ts b/extensions/model-extension/src/index.ts index b9fa7731e2..926e65ee50 100644 --- a/extensions/model-extension/src/index.ts +++ b/extensions/model-extension/src/index.ts @@ -8,8 +8,15 @@ import { ModelExtension, Model, getJanDataFolderPath, + events, + DownloadEvent, + DownloadRoute, + ModelEvent, + DownloadState, } from '@janhq/core' +import { extractFileName } from './helpers/path' + /** * A extension for models */ @@ -29,6 +36,8 @@ export default class JanModelExtension extends ModelExtension { */ async onLoad() { this.copyModelsToHomeDir() + // Handle Desktop Events + this.handleDesktopEvents() } /** @@ -61,6 +70,8 @@ export default class JanModelExtension extends ModelExtension { // Finished migration localStorage.setItem(`${EXTENSION_NAME}-version`, VERSION) + + events.emit(ModelEvent.OnModelsUpdate, {}) } catch (err) { console.error(err) } @@ -83,31 +94,66 @@ export default class JanModelExtension extends ModelExtension { if (model.sources.length > 1) { // path to model binaries for (const source of model.sources) { - let path = this.extractFileName(source.url) + let path = extractFileName( + source.url, + JanModelExtension._supportedModelFormat + ) if 
(source.filename) { path = await joinPath([modelDirPath, source.filename]) } downloadFile(source.url, path, network) } + // TODO: handle multiple binaries for web later } else { - const fileName = this.extractFileName(model.sources[0]?.url) + const fileName = extractFileName( + model.sources[0]?.url, + JanModelExtension._supportedModelFormat + ) const path = await joinPath([modelDirPath, fileName]) downloadFile(model.sources[0]?.url, path, network) + + if (window && window.core?.api && window.core.api.baseApiUrl) { + this.startPollingDownloadProgress(model.id) + } } } /** - * try to retrieve the download file name from the source url + * Specifically for Jan server. */ - private extractFileName(url: string): string { - const extractedFileName = url.split('/').pop() - const fileName = extractedFileName - .toLowerCase() - .endsWith(JanModelExtension._supportedModelFormat) - ? extractedFileName - : extractedFileName + JanModelExtension._supportedModelFormat - return fileName + private async startPollingDownloadProgress(modelId: string): Promise { + // wait for some seconds before polling + await new Promise((resolve) => setTimeout(resolve, 3000)) + + return new Promise((resolve) => { + const interval = setInterval(async () => { + fetch( + `${window.core.api.baseApiUrl}/v1/download/${DownloadRoute.getDownloadProgress}/${modelId}`, + { + method: 'GET', + headers: { contentType: 'application/json' }, + } + ).then(async (res) => { + const state: DownloadState = await res.json() + if (state.downloadState === 'end') { + events.emit(DownloadEvent.onFileDownloadSuccess, state) + clearInterval(interval) + resolve() + return + } + + if (state.downloadState === 'error') { + events.emit(DownloadEvent.onFileDownloadError, state) + clearInterval(interval) + resolve() + return + } + + events.emit(DownloadEvent.onFileDownloadUpdate, state) + }) + }, 1000) + }) } /** @@ -174,15 +220,20 @@ export default class JanModelExtension extends ModelExtension { async getDownloadedModels(): 
Promise { return await this.getModelsMetadata( async (modelDir: string, model: Model) => { - if (model.engine !== JanModelExtension._offlineInferenceEngine) { + if (model.engine !== JanModelExtension._offlineInferenceEngine) return true - } + + // model binaries (sources) are absolute path & exist + const existFiles = await Promise.all( + model.sources.map((source) => fs.existsSync(source.url)) + ) + if (existFiles.every((exist) => exist)) return true + return await fs .readdirSync(await joinPath([JanModelExtension._homeDir, modelDir])) .then((files: string[]) => { - // or model binary exists in the directory - // model binary name can match model ID or be a .gguf file and not be an incompleted model file - // TODO: Check diff between urls, filenames + // Model binary exists in the directory + // Model binary name can match model ID or be a .gguf file and not be an incompleted model file return ( files.includes(modelDir) || files.filter( @@ -228,8 +279,19 @@ export default class JanModelExtension extends ModelExtension { if (await fs.existsSync(jsonPath)) { // if we have the model.json file, read it let model = await this.readModelMetadata(jsonPath) + model = typeof model === 'object' ? model : JSON.parse(model) + // This to ensure backward compatibility with `model.json` with `source_url` + if (model['source_url'] != null) { + model['sources'] = [ + { + filename: model.id, + url: model['source_url'], + }, + ] + } + if (selector && !(await selector?.(dirName, model))) { return } @@ -243,31 +305,18 @@ export default class JanModelExtension extends ModelExtension { }) const results = await Promise.allSettled(readJsonPromises) const modelData = results.map((result) => { - if (result.status === 'fulfilled') { + if (result.status === 'fulfilled' && result.value) { try { - // This to ensure backward compatibility with `model.json` with `source_url` - const tmpModel = + const model = typeof result.value === 'object' ? 
result.value : JSON.parse(result.value) - if (tmpModel['source_url'] != null) { - tmpModel['source'] = [ - { - filename: tmpModel.id, - url: tmpModel['source_url'], - }, - ] - } - - return tmpModel as Model + return model as Model } catch { console.debug(`Unable to parse model metadata: ${result.value}`) - return undefined } - } else { - console.error(result.reason) - return undefined } + return undefined }) return modelData.filter((e) => !!e) @@ -318,7 +367,7 @@ export default class JanModelExtension extends ModelExtension { return } - const defaultModel = await this.getDefaultModel() as Model + const defaultModel = (await this.getDefaultModel()) as Model if (!defaultModel) { console.error('Unable to find default model') return @@ -382,4 +431,28 @@ export default class JanModelExtension extends ModelExtension { async getConfiguredModels(): Promise { return this.getModelsMetadata() } + + handleDesktopEvents() { + if (window && window.electronAPI) { + window.electronAPI.onFileDownloadUpdate( + async (_event: string, state: DownloadState | undefined) => { + if (!state) return + state.downloadState = 'downloading' + events.emit(DownloadEvent.onFileDownloadUpdate, state) + } + ) + window.electronAPI.onFileDownloadError( + async (_event: string, state: DownloadState) => { + state.downloadState = 'error' + events.emit(DownloadEvent.onFileDownloadError, state) + } + ) + window.electronAPI.onFileDownloadSuccess( + async (_event: string, state: DownloadState) => { + state.downloadState = 'end' + events.emit(DownloadEvent.onFileDownloadSuccess, state) + } + ) + } + } } diff --git a/extensions/monitoring-extension/package.json b/extensions/monitoring-extension/package.json index 9935e536ee..582f7cd7b8 100644 --- a/extensions/monitoring-extension/package.json +++ b/extensions/monitoring-extension/package.json @@ -1,6 +1,6 @@ { "name": "@janhq/monitoring-extension", - "version": "1.0.9", + "version": "1.0.10", "description": "This extension provides system health and OS level 
data", "main": "dist/index.js", "module": "dist/module.js", @@ -8,17 +8,17 @@ "license": "AGPL-3.0", "scripts": { "build": "tsc -b . && webpack --config webpack.config.js", - "build:publish": "rimraf *.tgz --glob && npm run build && npm pack && cpx *.tgz ../../electron/pre-install" + "build:publish": "rimraf *.tgz --glob && npm run build && npm pack && cpx *.tgz ../../pre-install" }, "devDependencies": { "rimraf": "^3.0.2", "webpack": "^5.88.2", - "webpack-cli": "^5.1.4" + "webpack-cli": "^5.1.4", + "ts-loader": "^9.5.0" }, "dependencies": { "@janhq/core": "file:../../core", - "node-os-utils": "^1.3.7", - "ts-loader": "^9.5.0" + "node-os-utils": "^1.3.7" }, "files": [ "dist/*", @@ -26,6 +26,7 @@ "README.md" ], "bundleDependencies": [ - "node-os-utils" + "node-os-utils", + "@janhq/core" ] } diff --git a/extensions/monitoring-extension/src/@types/global.d.ts b/extensions/monitoring-extension/src/@types/global.d.ts index 3b45ccc5ad..8106353cfc 100644 --- a/extensions/monitoring-extension/src/@types/global.d.ts +++ b/extensions/monitoring-extension/src/@types/global.d.ts @@ -1 +1 @@ -declare const MODULE: string; +declare const MODULE: string diff --git a/extensions/monitoring-extension/src/index.ts b/extensions/monitoring-extension/src/index.ts index 9297a770f5..ce9b2fc148 100644 --- a/extensions/monitoring-extension/src/index.ts +++ b/extensions/monitoring-extension/src/index.ts @@ -1,4 +1,4 @@ -import { MonitoringExtension, executeOnMain } from "@janhq/core"; +import { MonitoringExtension, executeOnMain } from '@janhq/core' /** * JanMonitoringExtension is a extension that provides system monitoring functionality. @@ -20,7 +20,7 @@ export default class JanMonitoringExtension extends MonitoringExtension { * @returns A Promise that resolves to an object containing information about the system resources. 
*/ getResourcesInfo(): Promise { - return executeOnMain(MODULE, "getResourcesInfo"); + return executeOnMain(MODULE, 'getResourcesInfo') } /** @@ -28,6 +28,6 @@ export default class JanMonitoringExtension extends MonitoringExtension { * @returns A Promise that resolves to an object containing information about the current system load. */ getCurrentLoad(): Promise { - return executeOnMain(MODULE, "getCurrentLoad"); + return executeOnMain(MODULE, 'getCurrentLoad') } } diff --git a/extensions/monitoring-extension/src/module.ts b/extensions/monitoring-extension/src/module.ts index 86b553d526..27781a5d6f 100644 --- a/extensions/monitoring-extension/src/module.ts +++ b/extensions/monitoring-extension/src/module.ts @@ -1,33 +1,92 @@ -const nodeOsUtils = require("node-os-utils"); +const nodeOsUtils = require('node-os-utils') +const getJanDataFolderPath = require('@janhq/core/node').getJanDataFolderPath +const path = require('path') +const { readFileSync } = require('fs') +const exec = require('child_process').exec + +const NVIDIA_INFO_FILE = path.join( + getJanDataFolderPath(), + 'settings', + 'settings.json' +) const getResourcesInfo = () => new Promise((resolve) => { nodeOsUtils.mem.used().then((ramUsedInfo) => { - const totalMemory = ramUsedInfo.totalMemMb * 1024 * 1024; - const usedMemory = ramUsedInfo.usedMemMb * 1024 * 1024; + const totalMemory = ramUsedInfo.totalMemMb * 1024 * 1024 + const usedMemory = ramUsedInfo.usedMemMb * 1024 * 1024 const response = { mem: { totalMemory, usedMemory, }, - }; - resolve(response); - }); - }); + } + resolve(response) + }) + }) const getCurrentLoad = () => - new Promise((resolve) => { + new Promise((resolve, reject) => { nodeOsUtils.cpu.usage().then((cpuPercentage) => { - const response = { - cpu: { - usage: cpuPercentage, - }, - }; - resolve(response); - }); - }); + let data = { + run_mode: 'cpu', + gpus_in_use: [], + } + if (process.platform !== 'darwin') { + data = JSON.parse(readFileSync(NVIDIA_INFO_FILE, 'utf-8')) + } + if 
(data.run_mode === 'gpu' && data.gpus_in_use.length > 0) { + const gpuIds = data['gpus_in_use'].join(',') + if (gpuIds !== '' && data['vulkan'] !== true) { + exec( + `nvidia-smi --query-gpu=index,name,temperature.gpu,utilization.gpu,memory.total,memory.free,utilization.memory --format=csv,noheader,nounits --id=${gpuIds}`, + (error, stdout, _) => { + if (error) { + console.error(`exec error: ${error}`) + reject(error) + return + } + const gpuInfo = stdout + .trim() + .split('\n') + .map((line) => { + const [ + id, + name, + temperature, + utilization, + memoryTotal, + memoryFree, + memoryUtilization, + ] = line.split(', ').map((item) => item.replace(/\r/g, '')) + return { + id, + name, + temperature, + utilization, + memoryTotal, + memoryFree, + memoryUtilization, + } + }) + resolve({ + cpu: { usage: cpuPercentage }, + gpu: gpuInfo, + }) + } + ) + } else { + // Handle the case where gpuIds is empty + resolve({ cpu: { usage: cpuPercentage }, gpu: [] }) + } + } else { + // Handle the case where run_mode is not 'gpu' or no GPUs are in use + resolve({ cpu: { usage: cpuPercentage }, gpu: [] }) + } + }) + }) module.exports = { getResourcesInfo, getCurrentLoad, -}; +} diff --git a/extensions/monitoring-extension/webpack.config.js b/extensions/monitoring-extension/webpack.config.js index f54059222f..c8c3a34f79 100644 --- a/extensions/monitoring-extension/webpack.config.js +++ b/extensions/monitoring-extension/webpack.config.js @@ -1,24 +1,24 @@ -const path = require("path"); -const webpack = require("webpack"); -const packageJson = require("./package.json"); +const path = require('path') +const webpack = require('webpack') +const packageJson = require('./package.json') module.exports = { experiments: { outputModule: true }, - entry: "./src/index.ts", // Adjust the entry point to match your project's main file - mode: "production", + entry: './src/index.ts', // Adjust the entry point to match your project's main file + mode: 'production', module: { rules: [ { test: 
/\.tsx?$/, - use: "ts-loader", + use: 'ts-loader', exclude: /node_modules/, }, ], }, output: { - filename: "index.js", // Adjust the output file name as needed - path: path.resolve(__dirname, "dist"), - library: { type: "module" }, // Specify ESM output format + filename: 'index.js', // Adjust the output file name as needed + path: path.resolve(__dirname, 'dist'), + library: { type: 'module' }, // Specify ESM output format }, plugins: [ new webpack.DefinePlugin({ @@ -26,10 +26,10 @@ module.exports = { }), ], resolve: { - extensions: [".ts", ".js"], + extensions: ['.ts', '.js'], }, optimization: { minimize: false, }, // Add loaders and other configuration as needed for your project -}; +} diff --git a/models/dolphin-phi-2/model.json b/models/dolphin-phi-2/model.json new file mode 100644 index 0000000000..c25ff8f694 --- /dev/null +++ b/models/dolphin-phi-2/model.json @@ -0,0 +1,32 @@ +{ + "sources": [ + { + "url": "https://huggingface.co/TheBloke/dolphin-2_6-phi-2-GGUF/resolve/main/dolphin-2_6-phi-2.Q8_0.gguf", + "filename": "dolphin-2_6-phi-2.Q8_0.gguf" + } + ], + "id": "dolphin-phi-2", + "object": "model", + "name": "Dolphin Phi-2 2.7B Q8", + "version": "1.0", + "description": "Dolphin Phi-2 is a 2.7B model, fine-tuned for chat, excelling in common sense and logical reasoning benchmarks.", + "format": "gguf", + "settings": { + "ctx_len": 4096, + "prompt_template": "<|im_start|>system\n{system_message}<|im_end|>\n<|im_start|>user\n{prompt}<|im_end|>\n<|im_start|>assistant", + "llama_model_path": "dolphin-2_6-phi-2.Q8_0.gguf" + }, + "parameters": { + "max_tokens": 4096, + "stop": ["<|im_end|>"] + }, + "metadata": { + "author": "Cognitive Computations, Microsoft", + "tags": [ + "3B", + "Finetuned" + ], + "size": 2960000000 + }, + "engine": "nitro" + } diff --git a/models/llamacorn-1.1b/model.json b/models/llamacorn-1.1b/model.json new file mode 100644 index 0000000000..056fb90504 --- /dev/null +++ b/models/llamacorn-1.1b/model.json @@ -0,0 +1,37 @@ +{ + "sources": [ + 
{ + "url":"https://huggingface.co/janhq/llamacorn-1.1b-chat-GGUF/resolve/main/llamacorn-1.1b-chat.Q8_0.gguf", + "filename": "llamacorn-1.1b-chat.Q8_0.gguf" + } + ], + "id": "llamacorn-1.1b", + "object": "model", + "name": "LlamaCorn 1.1B Q8", + "version": "1.0", + "description": "LlamaCorn is designed to improve chat functionality from TinyLlama.", + "format": "gguf", + "settings": { + "ctx_len": 2048, + "prompt_template": "<|im_start|>system\n{system_message}<|im_end|>\n<|im_start|>user\n{prompt}<|im_end|>\n<|im_start|>assistant", + "llama_model_path": "llamacorn-1.1b-chat.Q8_0.gguf" + }, + "parameters": { + "temperature": 0.7, + "top_p": 0.95, + "stream": true, + "max_tokens": 2048, + "stop": [], + "frequency_penalty": 0, + "presence_penalty": 0 + }, + "metadata": { + "author": "Jan", + "tags": [ + "Tiny", + "Finetuned" + ], + "size": 1170000000 + }, + "engine": "nitro" + } \ No newline at end of file diff --git a/models/mistral-ins-7b-q4/cover.png b/models/mistral-ins-7b-q4/cover.png index 000445ecba..73b82e5996 100644 Binary files a/models/mistral-ins-7b-q4/cover.png and b/models/mistral-ins-7b-q4/cover.png differ diff --git a/models/mistral-ins-7b-q4/model.json b/models/mistral-ins-7b-q4/model.json index bfdaffa907..75e0cbf9f0 100644 --- a/models/mistral-ins-7b-q4/model.json +++ b/models/mistral-ins-7b-q4/model.json @@ -29,7 +29,7 @@ "author": "MistralAI, The Bloke", "tags": ["Featured", "7B", "Foundational Model"], "size": 4370000000, - "cover": "https://raw.githubusercontent.com/janhq/jan/main/models/mistral-ins-7b-q4/cover.png" + "cover": "https://raw.githubusercontent.com/janhq/jan/dev/models/mistral-ins-7b-q4/cover.png" }, "engine": "nitro" } diff --git a/models/openchat-3.5-7b/model.json b/models/openchat-3.5-7b/model.json index 294f7d2694..18db33f8e6 100644 --- a/models/openchat-3.5-7b/model.json +++ b/models/openchat-3.5-7b/model.json @@ -1,8 +1,8 @@ { "sources": [ { - "filename": "openchat-3.5-1210.Q4_K_M.gguf", - "url": 
"https://huggingface.co/TheBloke/openchat-3.5-1210-GGUF/resolve/main/openchat-3.5-1210.Q4_K_M.gguf" + "filename": "openchat-3.5-0106.Q4_K_M.gguf", + "url": "https://huggingface.co/TheBloke/openchat-3.5-0106-GGUF/resolve/main/openchat-3.5-0106.Q4_K_M.gguf" } ], "id": "openchat-3.5-7b", @@ -14,7 +14,7 @@ "settings": { "ctx_len": 4096, "prompt_template": "GPT4 Correct User: {prompt}<|end_of_turn|>GPT4 Correct Assistant:", - "llama_model_path": "openchat-3.5-1210.Q4_K_M.gguf" + "llama_model_path": "openchat-3.5-0106.Q4_K_M.gguf" }, "parameters": { "temperature": 0.7, diff --git a/models/openhermes-neural-7b/cover.png b/models/openhermes-neural-7b/cover.png index 5b9da0aefe..8976d84490 100644 Binary files a/models/openhermes-neural-7b/cover.png and b/models/openhermes-neural-7b/cover.png differ diff --git a/models/openhermes-neural-7b/model.json b/models/openhermes-neural-7b/model.json index 87e1df143a..a13a0f2b85 100644 --- a/models/openhermes-neural-7b/model.json +++ b/models/openhermes-neural-7b/model.json @@ -28,7 +28,7 @@ "author": "Intel, Jan", "tags": ["7B", "Merged", "Featured"], "size": 4370000000, - "cover": "https://raw.githubusercontent.com/janhq/jan/main/models/openhermes-neural-7b/cover.png" + "cover": "https://raw.githubusercontent.com/janhq/jan/dev/models/openhermes-neural-7b/cover.png" }, "engine": "nitro" } diff --git a/models/stable-zephyr-3b/model.json b/models/stable-zephyr-3b/model.json new file mode 100644 index 0000000000..724299ea5e --- /dev/null +++ b/models/stable-zephyr-3b/model.json @@ -0,0 +1,34 @@ +{ + "sources": [ + { + "url": "https://huggingface.co/TheBloke/stablelm-zephyr-3b-GGUF/resolve/main/stablelm-zephyr-3b.Q8_0.gguf", + "filename": "stablelm-zephyr-3b.Q8_0.gguf" + } + ], + "id": "stable-zephyr-3b", + "object": "model", + "name": "Stable Zephyr 3B Q8", + "version": "1.0", + "description": "StableLM Zephyr 3B is trained for safe and reliable chatting.", + "format": "gguf", + "settings": { + "ctx_len": 4096, + "prompt_template": 
"<|user|>\n{prompt}<|endoftext|>\n<|assistant|>", + "llama_model_path": "stablelm-zephyr-3b.Q8_0.gguf" + }, + "parameters": { + "temperature": 0.7, + "top_p": 0.95, + "stream": true, + "max_tokens": 4096, + "stop": ["<|endoftext|>"], + "frequency_penalty": 0, + "presence_penalty": 0 + }, + "metadata": { + "author": "StabilityAI", + "tags": ["3B", "Finetuned"], + "size": 2970000000 + }, + "engine": "nitro" + } \ No newline at end of file diff --git a/models/trinity-v1.2-7b/cover.png b/models/trinity-v1.2-7b/cover.png index a548e3c173..fbef0bb560 100644 Binary files a/models/trinity-v1.2-7b/cover.png and b/models/trinity-v1.2-7b/cover.png differ diff --git a/models/trinity-v1.2-7b/model.json b/models/trinity-v1.2-7b/model.json index 2dda120e65..9476296421 100644 --- a/models/trinity-v1.2-7b/model.json +++ b/models/trinity-v1.2-7b/model.json @@ -28,7 +28,7 @@ "author": "Jan", "tags": ["7B", "Merged", "Featured"], "size": 4370000000, - "cover": "https://raw.githubusercontent.com/janhq/jan/main/models/trinity-v1.2-7b/cover.png" + "cover": "https://raw.githubusercontent.com/janhq/jan/dev/models/trinity-v1.2-7b/cover.png" }, "engine": "nitro" } diff --git a/models/yarn-mistral-7b/model.json b/models/yarn-mistral-7b/model.json deleted file mode 100644 index ee6de13198..0000000000 --- a/models/yarn-mistral-7b/model.json +++ /dev/null @@ -1,31 +0,0 @@ -{ - "sources": [ - { - "url": "https://huggingface.co/TheBloke/Yarn-Mistral-7B-128k-GGUF/resolve/main/yarn-mistral-7b-128k.Q4_K_M.gguf" - } - ], - "id": "yarn-mistral-7b", - "object": "model", - "name": "Yarn Mistral 7B Q4", - "version": "1.0", - "description": "Yarn Mistral 7B is a language model for long context and supports a 128k token context window.", - "format": "gguf", - "settings": { - "ctx_len": 4096, - "prompt_template": "{prompt}" - }, - "parameters": { - "temperature": 0.7, - "top_p": 0.95, - "stream": true, - "max_tokens": 4096, - "frequency_penalty": 0, - "presence_penalty": 0 - }, - "metadata": { - "author": 
"NousResearch, The Bloke", - "tags": ["7B", "Finetuned"], - "size": 4370000000 - }, - "engine": "nitro" -} diff --git a/package.json b/package.json index 4b8bc4af08..957934fdaa 100644 --- a/package.json +++ b/package.json @@ -21,22 +21,23 @@ "lint": "yarn workspace jan lint && yarn workspace jan-web lint", "test:unit": "yarn workspace @janhq/core test", "test": "yarn workspace jan test:e2e", - "copy:assets": "cpx \"models/**\" \"electron/models/\" && cpx \"docs/openapi/**\" \"electron/docs/openapi\"", + "copy:assets": "cpx \"models/**\" \"electron/models/\" && cpx \"pre-install/*.tgz\" \"electron/pre-install/\" && cpx \"docs/openapi/**\" \"electron/docs/openapi\"", "dev:electron": "yarn copy:assets && yarn workspace jan dev", "dev:web": "yarn workspace jan-web dev", - "dev:server": "yarn workspace @janhq/server dev", + "dev:server": "yarn copy:assets && yarn workspace @janhq/server dev", "dev": "concurrently --kill-others \"yarn dev:web\" \"wait-on http://localhost:3000 && yarn dev:electron\"", "test-local": "yarn lint && yarn build:test && yarn test", "dev:uikit": "yarn workspace @janhq/uikit install && yarn workspace @janhq/uikit dev", "build:uikit": "yarn workspace @janhq/uikit install && yarn workspace @janhq/uikit build", - "build:server": "cd server && yarn install && yarn run build", + "build:server": "yarn copy:assets && cd server && yarn install && yarn run build", "build:core": "cd core && yarn install && yarn run build", "build:web": "yarn workspace jan-web build && cpx \"web/out/**\" \"electron/renderer/\"", "build:electron": "yarn copy:assets && yarn workspace jan build", "build:electron:test": "yarn workspace jan build:test", - "build:extensions:windows": "rimraf ./electron/pre-install/*.tgz && powershell -command \"$jobs = Get-ChildItem -Path './extensions' -Directory | ForEach-Object { Start-Job -Name ($_.Name) -ScriptBlock { param($_dir); try { Set-Location $_dir; npm install; npm run build:publish; Write-Output 'Build successful in ' + $_dir } 
catch { Write-Error 'Error in ' + $_dir; throw } } -ArgumentList $_.FullName }; $jobs | Wait-Job; $jobs | ForEach-Object { Receive-Job -Job $_ -Keep } | ForEach-Object { Write-Host $_ }; $failed = $jobs | Where-Object { $_.State -ne 'Completed' -or $_.ChildJobs[0].JobStateInfo.State -ne 'Completed' }; if ($failed) { Exit 1 }\"", - "build:extensions:linux": "rimraf ./electron/pre-install/*.tgz && find ./extensions -mindepth 1 -maxdepth 1 -type d -print0 | xargs -0 -n 1 -P 4 -I {} sh -c 'cd {} && npm install && npm run build:publish'", - "build:extensions:darwin": "rimraf ./electron/pre-install/*.tgz && find ./extensions -mindepth 1 -maxdepth 1 -type d -print0 | xargs -0 -n 1 -P 4 -I {} sh -c 'cd {} && npm install && npm run build:publish'", + "build:extensions:windows": "rimraf ./pre-install/*.tgz && powershell -command \"$jobs = Get-ChildItem -Path './extensions' -Directory | ForEach-Object { Start-Job -Name ($_.Name) -ScriptBlock { param($_dir); try { Set-Location $_dir; npm install; npm run build:publish; Write-Output 'Build successful in ' + $_dir } catch { Write-Error 'Error in ' + $_dir; throw } } -ArgumentList $_.FullName }; $jobs | Wait-Job; $jobs | ForEach-Object { Receive-Job -Job $_ -Keep } | ForEach-Object { Write-Host $_ }; $failed = $jobs | Where-Object { $_.State -ne 'Completed' -or $_.ChildJobs[0].JobStateInfo.State -ne 'Completed' }; if ($failed) { Exit 1 }\"", + "build:extensions:linux": "rimraf ./pre-install/*.tgz && find ./extensions -mindepth 1 -maxdepth 1 -type d -print0 | xargs -0 -n 1 -P 4 -I {} sh -c 'cd {} && npm install && npm run build:publish'", + "build:extensions:darwin": "rimraf ./pre-install/*.tgz && find ./extensions -mindepth 1 -maxdepth 1 -type d -print0 | xargs -0 -n 1 -P 4 -I {} sh -c 'cd {} && npm install && npm run build:publish'", + "build:extensions:server": "yarn workspace build:extensions ", "build:extensions": "run-script-os", "build:test": "yarn copy:assets && yarn build:web && yarn workspace jan build:test", "build": 
"yarn build:web && yarn build:electron", diff --git a/pre-install/.gitkeep b/pre-install/.gitkeep new file mode 100644 index 0000000000..e69de29bb2 diff --git a/server/helpers/setup.ts b/server/helpers/setup.ts new file mode 100644 index 0000000000..7d8f8914a1 --- /dev/null +++ b/server/helpers/setup.ts @@ -0,0 +1,73 @@ +import { join, extname } from 'path' +import { existsSync, readdirSync, writeFileSync, mkdirSync } from 'fs' +import { init, installExtensions } from '@janhq/core/node' + +export async function setup() { + /** + * Setup Jan Data Directory + */ + const appDir = process.env.JAN_DATA_DIRECTORY ?? join(__dirname, '..', 'jan') + + console.debug(`Create app data directory at ${appDir}...`) + if (!existsSync(appDir)) mkdirSync(appDir) + //@ts-ignore + global.core = { + // Define appPath function for app to retrieve app path globaly + appPath: () => appDir, + } + init({ + extensionsPath: join(appDir, 'extensions'), + }) + + /** + * Write app configurations. See #1619 + */ + console.debug('Writing config file...') + writeFileSync( + join(appDir, 'settings.json'), + JSON.stringify({ + data_folder: appDir, + }), + 'utf-8' + ) + + if (!existsSync(join(appDir, 'settings'))) { + console.debug('Writing nvidia config file...') + mkdirSync(join(appDir, 'settings')) + writeFileSync( + join(appDir, 'settings', 'settings.json'), + JSON.stringify( + { + notify: true, + run_mode: 'cpu', + nvidia_driver: { + exist: false, + version: '', + }, + cuda: { + exist: false, + version: '', + }, + gpus: [], + gpu_highest_vram: '', + gpus_in_use: [], + is_initial: true, + }), + 'utf-8' + ) + } + + /** + * Install extensions + */ + + console.debug('Installing extensions...') + + const baseExtensionPath = join(__dirname, '../../..', 'pre-install') + const extensions = readdirSync(baseExtensionPath) + .filter((file) => extname(file) === '.tgz') + .map((file) => join(baseExtensionPath, file)) + + await installExtensions(extensions) + console.debug('Extensions installed') +} diff --git 
a/server/index.ts b/server/index.ts index 05bfdca961..98cc8385d1 100644 --- a/server/index.ts +++ b/server/index.ts @@ -1,26 +1,27 @@ -import fastify from "fastify"; -import dotenv from "dotenv"; +import fastify from 'fastify' +import dotenv from 'dotenv' import { getServerLogPath, v1Router, logServer, getJanExtensionsPath, -} from "@janhq/core/node"; -import { join } from "path"; +} from '@janhq/core/node' +import { join } from 'path' +import tcpPortUsed from 'tcp-port-used' // Load environment variables -dotenv.config(); +dotenv.config() // Define default settings -const JAN_API_HOST = process.env.JAN_API_HOST || "127.0.0.1"; -const JAN_API_PORT = Number.parseInt(process.env.JAN_API_PORT || "1337"); +const JAN_API_HOST = process.env.JAN_API_HOST || '127.0.0.1' +const JAN_API_PORT = Number.parseInt(process.env.JAN_API_PORT || '1337') // Initialize server settings -let server: any | undefined = undefined; -let hostSetting: string = JAN_API_HOST; -let portSetting: number = JAN_API_PORT; -let corsEnabled: boolean = true; -let isVerbose: boolean = true; +let server: any | undefined = undefined +let hostSetting: string = JAN_API_HOST +let portSetting: number = JAN_API_PORT +let corsEnabled: boolean = true +let isVerbose: boolean = true /** * Server configurations @@ -32,80 +33,93 @@ let isVerbose: boolean = true; * @param baseDir - Base directory for the OpenAPI schema file */ export interface ServerConfig { - host?: string; - port?: number; - isCorsEnabled?: boolean; - isVerboseEnabled?: boolean; - schemaPath?: string; - baseDir?: string; + host?: string + port?: number + isCorsEnabled?: boolean + isVerboseEnabled?: boolean + schemaPath?: string + baseDir?: string + storageAdataper?: any } /** * Function to start the server * @param configs - Server configurations */ -export const startServer = async (configs?: ServerConfig) => { +export const startServer = async (configs?: ServerConfig): Promise => { + if (configs?.port && configs?.host) { + const inUse = await 
tcpPortUsed.check(Number(configs.port), configs.host) + if (inUse) { + const errorMessage = `Port ${configs.port} is already in use.` + logServer(errorMessage) + throw new Error(errorMessage) + } + } + // Update server settings - isVerbose = configs?.isVerboseEnabled ?? true; - hostSetting = configs?.host ?? JAN_API_HOST; - portSetting = configs?.port ?? JAN_API_PORT; - corsEnabled = configs?.isCorsEnabled ?? true; - const serverLogPath = getServerLogPath(); + isVerbose = configs?.isVerboseEnabled ?? true + hostSetting = configs?.host ?? JAN_API_HOST + portSetting = configs?.port ?? JAN_API_PORT + corsEnabled = configs?.isCorsEnabled ?? true + const serverLogPath = getServerLogPath() // Start the server try { // Log server start - if (isVerbose) logServer(`Debug: Starting JAN API server...`); + if (isVerbose) logServer(`Debug: Starting JAN API server...`) // Initialize Fastify server with logging server = fastify({ logger: { - level: "info", + level: 'info', file: serverLogPath, }, - }); + }) // Register CORS if enabled - if (corsEnabled) await server.register(require("@fastify/cors"), {}); + if (corsEnabled) await server.register(require('@fastify/cors'), {}) // Register Swagger for API documentation - await server.register(require("@fastify/swagger"), { - mode: "static", + await server.register(require('@fastify/swagger'), { + mode: 'static', specification: { - path: configs?.schemaPath ?? "./../docs/openapi/jan.yaml", - baseDir: configs?.baseDir ?? "./../docs/openapi", + path: configs?.schemaPath ?? './../docs/openapi/jan.yaml', + baseDir: configs?.baseDir ?? './../docs/openapi', }, - }); + }) // Register Swagger UI - await server.register(require("@fastify/swagger-ui"), { - routePrefix: "/", - baseDir: configs?.baseDir ?? join(__dirname, "../..", "./docs/openapi"), + await server.register(require('@fastify/swagger-ui'), { + routePrefix: '/', + baseDir: configs?.baseDir ?? 
join(__dirname, '../..', './docs/openapi'), uiConfig: { - docExpansion: "full", + docExpansion: 'full', deepLinking: false, }, staticCSP: false, transformSpecificationClone: true, - }); + }) // Register static file serving for extensions // TODO: Watch extension files changes and reload await server.register( (childContext: any, _: any, done: any) => { - childContext.register(require("@fastify/static"), { + childContext.register(require('@fastify/static'), { root: getJanExtensionsPath(), wildcard: false, - }); + }) - done(); + done() }, - { prefix: "extensions" } - ); + { prefix: 'extensions' } + ) - // Register API routes - await server.register(v1Router, { prefix: "/v1" }); + // Register proxy middleware + if (configs?.storageAdataper) + server.addHook('preHandler', configs.storageAdataper) + // Register API routes + await server.register(v1Router, { prefix: '/v1' }) // Start listening for requests await server .listen({ @@ -117,13 +131,15 @@ export const startServer = async (configs?: ServerConfig) => { if (isVerbose) logServer( `Debug: JAN API listening at: http://${hostSetting}:${portSetting}` - ); - }); + ) + }) + return true } catch (e) { // Log any errors - if (isVerbose) logServer(`Error: ${e}`); + if (isVerbose) logServer(`Error: ${e}`) } -}; + return false +} /** * Function to stop the server @@ -131,11 +147,11 @@ export const startServer = async (configs?: ServerConfig) => { export const stopServer = async () => { try { // Log server stop - if (isVerbose) logServer(`Debug: Server stopped`); + if (isVerbose) logServer(`Debug: Server stopped`) // Stop the server - await server.close(); + await server.close() } catch (e) { // Log any errors - if (isVerbose) logServer(`Error: ${e}`); + if (isVerbose) logServer(`Error: ${e}`) } -}; +} diff --git a/server/main.ts b/server/main.ts index c3eb691356..71fb111062 100644 --- a/server/main.ts +++ b/server/main.ts @@ -1,3 +1,7 @@ -import { startServer } from "./index"; - -startServer(); +import { s3 } from 
'./middleware/s3' +import { setup } from './helpers/setup' +import { startServer as start } from './index' +/** + * Setup extensions and start the server + */ +setup().then(() => start({ storageAdataper: s3 })) diff --git a/server/middleware/s3.ts b/server/middleware/s3.ts new file mode 100644 index 0000000000..28971a42b4 --- /dev/null +++ b/server/middleware/s3.ts @@ -0,0 +1,70 @@ +import { join } from 'path' + +// Middleware to intercept requests and proxy if certain conditions are met +const config = { + endpoint: process.env.AWS_ENDPOINT, + region: process.env.AWS_REGION, + credentials: { + accessKeyId: process.env.AWS_ACCESS_KEY_ID, + secretAccessKey: process.env.AWS_SECRET_ACCESS_KEY, + }, +} + +const S3_BUCKET_NAME = process.env.S3_BUCKET_NAME + +const fs = require('@cyclic.sh/s3fs')(S3_BUCKET_NAME, config) +const PROXY_PREFIX = '/v1/fs' +const PROXY_ROUTES = ['/threads', '/messages'] + +export const s3 = (req: any, reply: any, done: any) => { + // Proxy FS requests to S3 using S3FS + if (req.url.startsWith(PROXY_PREFIX)) { + const route = req.url.split('/').pop() + const args = parseRequestArgs(req) + + // Proxy matched requests to the s3fs module + if (args.length && PROXY_ROUTES.some((route) => args[0].includes(route))) { + try { + // Handle customized route + // S3FS does not handle appendFileSync + if (route === 'appendFileSync') { + let result = handAppendFileSync(args) + + reply.status(200).send(result) + return + } + // Reroute the other requests to the s3fs module + const result = fs[route](...args) + reply.status(200).send(result) + return + } catch (ex) { + console.log(ex) + } + } + } + // Let other requests go through + done() +} + +const parseRequestArgs = (req: Request) => { + const { + getJanDataFolderPath, + normalizeFilePath, + } = require('@janhq/core/node') + + return JSON.parse(req.body as any).map((arg: any) => + typeof arg === 'string' && + (arg.startsWith(`file:/`) || arg.startsWith(`file:\\`)) + ? 
join(getJanDataFolderPath(), normalizeFilePath(arg)) + : arg + ) +} + +const handAppendFileSync = (args: any[]) => { + if (fs.existsSync(args[0])) { + const data = fs.readFileSync(args[0], 'utf-8') + return fs.writeFileSync(args[0], data + args[1]) + } else { + return fs.writeFileSync(args[0], args[1]) + } +} diff --git a/server/nodemon.json b/server/nodemon.json deleted file mode 100644 index 0ea41ca96b..0000000000 --- a/server/nodemon.json +++ /dev/null @@ -1,5 +0,0 @@ -{ - "watch": ["main.ts", "v1"], - "ext": "ts, json", - "exec": "tsc && node ./build/main.js" -} \ No newline at end of file diff --git a/server/package.json b/server/package.json index f61730da4a..d9a2bbc9ab 100644 --- a/server/package.json +++ b/server/package.json @@ -18,26 +18,29 @@ }, "dependencies": { "@alumna/reflect": "^1.1.3", + "@cyclic.sh/s3fs": "^1.2.9", "@fastify/cors": "^8.4.2", "@fastify/static": "^6.12.0", "@fastify/swagger": "^8.13.0", "@fastify/swagger-ui": "2.0.1", "@janhq/core": "link:./core", + "@npmcli/arborist": "^7.3.1", "dotenv": "^16.3.1", "fastify": "^4.24.3", - "request": "^2.88.2", "fetch-retry": "^5.0.6", - "tcp-port-used": "^1.0.2", - "request-progress": "^3.0.0" + "node-fetch": "2", + "request": "^2.88.2", + "request-progress": "^3.0.0", + "tcp-port-used": "^1.0.2" }, "devDependencies": { "@types/body-parser": "^1.19.5", "@types/npmcli__arborist": "^5.6.4", + "@types/tcp-port-used": "^1.0.4", "@typescript-eslint/eslint-plugin": "^6.7.3", "@typescript-eslint/parser": "^6.7.3", "eslint-plugin-react": "^7.33.2", "run-script-os": "^1.1.6", - "@types/tcp-port-used": "^1.0.4", "typescript": "^5.2.2" } } diff --git a/server/tsconfig.json b/server/tsconfig.json index 2c4fc4a64e..dd27b89323 100644 --- a/server/tsconfig.json +++ b/server/tsconfig.json @@ -20,5 +20,5 @@ // "sourceMap": true, "include": ["./**/*.ts"], - "exclude": ["core", "build", "dist", "tests", "node_modules"] + "exclude": ["core", "build", "dist", "tests", "node_modules", "extensions"] } diff --git 
a/uikit/src/input/styles.scss b/uikit/src/input/styles.scss index 9990da8b4c..e649f494da 100644 --- a/uikit/src/input/styles.scss +++ b/uikit/src/input/styles.scss @@ -1,6 +1,6 @@ .input { @apply border-border placeholder:text-muted-foreground flex h-9 w-full rounded-lg border bg-transparent px-3 py-1 transition-colors; - @apply disabled:cursor-not-allowed disabled:bg-zinc-100 disabled:dark:bg-zinc-800 disabled:dark:text-zinc-600; + @apply disabled:text-muted-foreground disabled:cursor-not-allowed disabled:bg-zinc-100 disabled:dark:bg-zinc-800 disabled:dark:text-zinc-600; @apply focus-within:outline-none focus-visible:outline-0 focus-visible:ring-2 focus-visible:ring-blue-500 focus-visible:ring-offset-1; @apply file:border-0 file:bg-transparent file:font-medium; } diff --git a/uikit/src/select/styles.scss b/uikit/src/select/styles.scss index bc5b6c0cc2..90485723ab 100644 --- a/uikit/src/select/styles.scss +++ b/uikit/src/select/styles.scss @@ -1,6 +1,6 @@ .select { @apply placeholder:text-muted-foreground border-border flex h-9 w-full items-center justify-between whitespace-nowrap rounded-md border bg-transparent px-3 py-2 text-sm shadow-sm disabled:cursor-not-allowed [&>span]:line-clamp-1; - @apply disabled:cursor-not-allowed disabled:bg-zinc-100 disabled:dark:bg-zinc-800 disabled:dark:text-zinc-600; + @apply disabled:text-muted-foreground disabled:cursor-not-allowed disabled:bg-zinc-100 disabled:dark:bg-zinc-800 disabled:dark:text-zinc-600; @apply focus-within:outline-none focus-visible:outline-0 focus-visible:ring-2 focus-visible:ring-blue-500 focus-visible:ring-offset-1; &-caret { @@ -21,6 +21,7 @@ &-item { @apply hover:bg-secondary relative my-1 block w-full cursor-pointer select-none items-center rounded-sm px-4 py-2 text-sm data-[disabled]:pointer-events-none data-[disabled]:opacity-50; + @apply focus:outline-none focus-visible:outline-0; } &-trigger-viewport { diff --git a/uikit/types/declaration.d.ts b/uikit/types/declaration.d.ts index 
85b1a7136f..f8e975fa54 100644 --- a/uikit/types/declaration.d.ts +++ b/uikit/types/declaration.d.ts @@ -1,4 +1,4 @@ declare module '*.scss' { - const content: Record; - export default content; -} \ No newline at end of file + const content: Record + export default content +} diff --git a/web/.prettierignore b/web/.prettierignore deleted file mode 100644 index 02d9145c14..0000000000 --- a/web/.prettierignore +++ /dev/null @@ -1,5 +0,0 @@ -.next/ -node_modules/ -dist/ -*.hbs -*.mdx \ No newline at end of file diff --git a/web/.prettierrc b/web/.prettierrc deleted file mode 100644 index 46f1abcb02..0000000000 --- a/web/.prettierrc +++ /dev/null @@ -1,8 +0,0 @@ -{ - "semi": false, - "singleQuote": true, - "quoteProps": "consistent", - "trailingComma": "es5", - "endOfLine": "auto", - "plugins": ["prettier-plugin-tailwindcss"] -} diff --git a/web/app/error.tsx b/web/app/error.tsx new file mode 100644 index 0000000000..25b24b9ef5 --- /dev/null +++ b/web/app/error.tsx @@ -0,0 +1,89 @@ +'use client' // Error components must be Client Components + +import { useEffect, useState } from 'react' + +export default function Error({ + error, +}: { + error: Error & { digest?: string } + reset: () => void +}) { + const [showFull, setShowFull] = useState(false) + useEffect(() => { + // Log the error to an error reporting service + console.error(error) + }, [error]) + + return ( + <> +
+
+
+
+ + + + +
+
+

+ Oops! Unexpected error occurred. +

+

+ Something went wrong. Try to{' '} + {' '} + or
feel free to{' '} + + contact us + {' '} + if the problem presists. +

+
+ Error: + {error.message} +
+
+                {showFull ? error.stack : error.stack?.slice(0, 200)}
+              
+ +
+
+
+
+ + ) +} diff --git a/web/containers/CardSidebar/index.tsx b/web/containers/CardSidebar/index.tsx index 38a8678d9e..89ff60e664 100644 --- a/web/containers/CardSidebar/index.tsx +++ b/web/containers/CardSidebar/index.tsx @@ -22,6 +22,7 @@ interface Props { rightAction?: ReactNode title: string asChild?: boolean + isShow?: boolean hideMoreVerticalAction?: boolean } export default function CardSidebar({ @@ -30,8 +31,9 @@ export default function CardSidebar({ asChild, rightAction, hideMoreVerticalAction, + isShow, }: Props) { - const [show, setShow] = useState(true) + const [show, setShow] = useState(isShow ?? false) const [more, setMore] = useState(false) const [menu, setMenu] = useState(null) const [toggle, setToggle] = useState(null) @@ -67,8 +69,8 @@ export default function CardSidebar({ show && 'rotate-180' )} /> + {title} - {title}
{rightAction && rightAction} @@ -156,7 +158,10 @@ export default function CardSidebar({ ) : ( <> - Opens {title}.json. + Opens{' '} + + {title === 'Tools' ? 'assistant' : title}.json. +  Changes affect all new threads. )} diff --git a/web/containers/DropdownListSidebar/index.tsx b/web/containers/DropdownListSidebar/index.tsx index 140a1aba15..191c7bcbe8 100644 --- a/web/containers/DropdownListSidebar/index.tsx +++ b/web/containers/DropdownListSidebar/index.tsx @@ -14,7 +14,14 @@ import { import { atom, useAtom, useAtomValue, useSetAtom } from 'jotai' -import { MonitorIcon } from 'lucide-react' +import { + MonitorIcon, + LayoutGridIcon, + FoldersIcon, + GlobeIcon, + CheckIcon, + CopyIcon, +} from 'lucide-react' import { twMerge } from 'tailwind-merge' @@ -22,6 +29,7 @@ import { MainViewState } from '@/constants/screens' import { useActiveModel } from '@/hooks/useActiveModel' +import { useClipboard } from '@/hooks/useClipboard' import { useMainViewState } from '@/hooks/useMainViewState' import useRecommendedModel from '@/hooks/useRecommendedModel' @@ -42,6 +50,8 @@ import { export const selectedModelAtom = atom(undefined) +const engineOptions = ['Local', 'Remote'] + // TODO: Move all of the unscoped logics outside of the component const DropdownListSidebar = ({ strictedThread = true, @@ -51,13 +61,24 @@ const DropdownListSidebar = ({ const activeThread = useAtomValue(activeThreadAtom) const [selectedModel, setSelectedModel] = useAtom(selectedModelAtom) const setThreadModelParams = useSetAtom(setThreadModelParamsAtom) - + const [isTabActive, setIsTabActive] = useState(0) const { stateModel } = useActiveModel() const [serverEnabled, setServerEnabled] = useAtom(serverEnabledAtom) const { setMainViewState } = useMainViewState() const [loader, setLoader] = useState(0) const { recommendedModel, downloadedModels } = useRecommendedModel() const { updateModelParameter } = useUpdateModelParameters() + const clipboard = useClipboard({ timeout: 1000 }) + const [copyId, 
setCopyId] = useState('') + + const localModel = downloadedModels.filter( + (model) => model.engine === InferenceEngine.nitro + ) + const remoteModel = downloadedModels.filter( + (model) => model.engine === InferenceEngine.openai + ) + + const modelOptions = isTabActive === 0 ? localModel : remoteModel useEffect(() => { if (!activeThread) return @@ -73,7 +94,7 @@ const DropdownListSidebar = ({ // This is fake loader please fix this when we have realtime percentage when load model useEffect(() => { - if (stateModel.loading) { + if (stateModel.model === selectedModel?.id && stateModel.loading) { if (loader === 24) { setTimeout(() => { setLoader(loader + 1) @@ -94,7 +115,7 @@ const DropdownListSidebar = ({ } else { setLoader(0) } - }, [stateModel.loading, loader]) + }, [stateModel.loading, loader, selectedModel, stateModel.model]) const onValueSelected = useCallback( async (modelId: string) => { @@ -138,12 +159,16 @@ const DropdownListSidebar = ({ return null } + const selectedModelLoading = + stateModel.model === selectedModel?.id && stateModel.loading + return ( <>