fix: #572 failed to load model sometime

2023-11-14 11:59:35 +07:00 · 2023-11-14 11:59:35 +07:00 · 86e1eea169
commit 86e1eea169
parent df6e9802f6
2 changed files with 167 additions and 87 deletions
--- a/plugins/inference-plugin/nitro/version.txt
+++ b/plugins/inference-plugin/nitro/version.txt
@ -1 +1 @@
-0.1.6
+0.1.7
--- a/plugins/inference-plugin/src/module.ts
+++ b/plugins/inference-plugin/src/module.ts
@ -1,119 +1,199 @@
+const fs = require("fs");
+const kill = require("kill-port");
 const path = require("path");
 const { app } = require("electron");
 const { spawn } = require("child_process");
-const fs = require("fs");
 const tcpPortUsed = require("tcp-port-used");
-const kill = require("kill-port");

+// The PORT to use for the Nitro subprocess
 const PORT = 3928;
+const LOCAL_HOST = "127.0.0.1";
+const NITRO_HTTP_SERVER_URL = `http://${LOCAL_HOST}:${PORT}`;
+const NITRO_HTTP_LOAD_MODEL_URL = `${NITRO_HTTP_SERVER_URL}/inferences/llamacpp/loadmodel`;
+const NITRO_HTTP_UNLOAD_MODEL_URL = `${NITRO_HTTP_SERVER_URL}/inferences/llamacpp/unloadModel`;
+
+// The subprocess instance for Nitro
 let subprocess = null;

-const initModel = (fileName) => {
+/**
+ * The response from the initModel function.
+ * @property error - An error message if the model fails to load.
+ */
+interface InitModelResponse {
+  error?: any;
+}
+
+/**
+ * Initializes a Nitro subprocess to load a machine learning model.
+ * @param fileName - The name of the machine learning model file.
+ * @returns A Promise that resolves when the model is loaded successfully, or rejects with an error message if the model is not found or fails to load.
+ * TODO: Should pass absolute of the model file instead of just the name - So we can modurize the module.ts to npm package
+ */
+function initModel(fileName: string): Promise<InitModelResponse> {
+  // 1. Check if the model file exists
  return (
-    new Promise<void>(async (resolve, reject) => {
-      if (!fileName) {
-        reject("Model not found, please download again.");
-      }
-      resolve(fileName);
-    })
-      // Spawn Nitro subprocess to load model
-      .then(() => {
-        return tcpPortUsed.check(PORT, "127.0.0.1").then((inUse) => {
-          if (!inUse) {
-            let binaryFolder = path.join(__dirname, "nitro"); // Current directory by default
-            let binaryName;
-
-        if (process.platform === "win32") {
-          // Todo: Need to check for CUDA support to switch between CUDA and non-CUDA binaries
-          binaryName = "win-start.bat";
-        } else if (process.platform === "darwin") {
-          // Mac OS platform
-          if (process.arch === "arm64") {
-            binaryFolder = path.join(binaryFolder, "mac-arm64")
-          } else {
-            binaryFolder = path.join(binaryFolder, "mac-x64")
-          }
-          binaryName = "nitro"
-        } else {
-          // Linux
-          // Todo: Need to check for CUDA support to switch between CUDA and non-CUDA binaries
-          binaryName = "linux-start.sh"; // For other platforms
-        }
-
-            const binaryPath = path.join(binaryFolder, binaryName);
-
-        // Execute the binary
-        subprocess = spawn(binaryPath,["0.0.0.0", PORT], { cwd: binaryFolder });
-
-            // Handle subprocess output
-            subprocess.stdout.on("data", (data) => {
-              console.log(`stdout: ${data}`);
-            });
-
-            subprocess.stderr.on("data", (data) => {
-              console.error(`stderr: ${data}`);
-            });
-
-            subprocess.on("close", (code) => {
-              console.log(`child process exited with code ${code}`);
-              subprocess = null;
-            });
-          }
-        });
-      })
+    checkModelFileExist(fileName)
+      // 2. Check if the port is used, if used, attempt to unload model / kill nitro process
+      .then(checkAndUnloadNitro)
+      // 3. Spawn the Nitro subprocess
+      .then(spawnNitroProcess)
+      // 4. Wait until the port is used (Nitro http server is up)
      .then(() => tcpPortUsed.waitUntilUsed(PORT, 300, 30000))
-      .then(() => {
-        const llama_model_path = path.join(appPath(), fileName);
-
-        const config = {
-          llama_model_path,
-          ctx_len: 2048,
-          ngl: 100,
-          embedding: true, // Always enable embedding mode on
-        };
-
-        // Load model config
-        return fetch(`http://127.0.0.1:${PORT}/inferences/llamacpp/loadmodel`, {
-          method: "POST",
-          headers: {
-            "Content-Type": "application/json",
-          },
-          body: JSON.stringify(config),
-        });
-      })
-      .then((res) => {
+      // 5. Load the model into the Nitro subprocess (HTTP POST request)
+      .then(() => loadLLMModel(fileName))
+      // 6. Check if the model is loaded successfully
+      .then(async (res) => {
        if (res.ok) {
          return {};
        }
-        throw new Error("Nitro: Model failed to load.");
+        const json = await res.json();
+        throw new Error(`Nitro: Model failed to load. ${json}`);
      })
      .catch((err) => {
        return { error: err };
      })
  );
-};
-
-function dispose() {
-  killSubprocess();
-  // clean other registered resources here
 }

-function killSubprocess() {
+/**
+ * Loads a LLM model into the Nitro subprocess by sending a HTTP POST request.
+ * @param fileName - The name of the model file.
+ * @returns A Promise that resolves when the model is loaded successfully, or rejects with an error message if the model is not found or fails to load.
+ */
+function loadLLMModel(fileName: string): Promise<Response> {
+  const llama_model_path = path.join(appPath(), fileName);
+
+  const config = {
+    llama_model_path,
+    ctx_len: 2048,
+    ngl: 100,
+    embedding: false, // Always enable embedding mode on
+  };
+
+  // Load model config
+  return fetch(NITRO_HTTP_LOAD_MODEL_URL, {
+    method: "POST",
+    headers: {
+      "Content-Type": "application/json",
+    },
+    body: JSON.stringify(config),
+  });
+}
+
+/**
+ * Checks if the model file exists.
+ * @param fileName - The name of the model file.
+ * @returns A Promise that resolves when the model file exists, or rejects with an error message if the model file does not exist.
+ */
+function checkModelFileExist(fileName: string): Promise<string> {
+  return new Promise<string>(async (resolve, reject) => {
+    if (!fileName) {
+      reject("Model not found, please download again.");
+    }
+    resolve(fileName);
+  });
+}
+
+/**
+ * Terminates the Nitro subprocess.
+ * @returns A Promise that resolves when the subprocess is terminated successfully, or rejects with an error message if the subprocess fails to terminate.
+ */
+function killSubprocess(): Promise<void> {
  if (subprocess) {
    subprocess.kill();
    subprocess = null;
    console.log("Subprocess terminated.");
  } else {
-    kill(PORT, "tcp").then(console.log).catch(console.log);
-    console.error("No subprocess is currently running.");
+    return kill(PORT, "tcp").then(console.log).catch(console.log);
  }
 }

+/**
+ * Returns the path to the user data directory.
+ * @returns The path to the user data directory.
+ */
 function appPath() {
-  if (app) {
-    return app.getPath("userData");
+  return app.getPath("userData");
+}
+
+/**
+ * Check port is used or not, if used, attempt to unload model
+ * If unload failed, kill the port
+ */
+function checkAndUnloadNitro() {
+  return tcpPortUsed.check(PORT, LOCAL_HOST).then((inUse) => {
+    // If inUse - try unload or kill process, otherwise do nothing
+    if (inUse) {
+      // Attempt to unload model
+      return fetch(NITRO_HTTP_UNLOAD_MODEL_URL, {
+        method: "GET",
+        headers: {
+          "Content-Type": "application/json",
+        },
+      }).catch((err) => {
+        console.log(err);
+        // Fallback to kill the port
+        return killSubprocess();
+      });
+    }
+  });
+}
+
+/**
+ * Look for the Nitro binary and execute it
+ * Using child-process to spawn the process
+ * Should run exactly platform specified Nitro binary version
+ */
+function spawnNitroProcess() {
+  let binaryFolder = path.join(__dirname, "nitro"); // Current directory by default
+  let binaryName;
+
+  if (process.platform === "win32") {
+    // Todo: Need to check for CUDA support to switch between CUDA and non-CUDA binaries
+    binaryName = "win-start.bat";
+  } else if (process.platform === "darwin") {
+    // Mac OS platform
+    if (process.arch === "arm64") {
+      binaryFolder = path.join(binaryFolder, "mac-arm64");
+    } else {
+      binaryFolder = path.join(binaryFolder, "mac-x64");
+    }
+    binaryName = "nitro";
+  } else {
+    // Linux
+    // Todo: Need to check for CUDA support to switch between CUDA and non-CUDA binaries
+    binaryName = "linux-start.sh"; // For other platforms
  }
-  return process.env.APPDATA || (process.platform == 'darwin' ? process.env.HOME + '/Library/Preferences' : process.env.HOME + "/.local/share");
+
+  const binaryPath = path.join(binaryFolder, binaryName);
+
+  // Execute the binary
+  subprocess = spawn(binaryPath, [1, "0.0.0.0", PORT], {
+    cwd: binaryFolder,
+  });
+
+  // Handle subprocess output
+  subprocess.stdout.on("data", (data) => {
+    console.log(`stdout: ${data}`);
+  });
+
+  subprocess.stderr.on("data", (data) => {
+    console.error(`stderr: ${data}`);
+  });
+
+  subprocess.on("close", (code) => {
+    console.log(`child process exited with code ${code}`);
+    subprocess = null;
+  });
+}
+
+/**
+ * Cleans up any registered resources.
+ * Its module specific function, should be called when application is closed
+ */
+function dispose() {
+  // clean other registered resources here
+  killSubprocess();
 }

 module.exports = {
 @ -1 +1 @@
 .1.6
 .1.7