feat: inference-llamacpp-extension: backend implementation
parent c288e75407
commit 9016fbff68
@@ -0,0 +1 @@
pub mod server;
@@ -0,0 +1,127 @@
use std::path::PathBuf;
use std::sync::Arc;
use tauri::{AppHandle, Manager, State}; // Import Manager trait
use tokio::process::{Child, Command};
use tokio::sync::Mutex;

use super::state::AppState;

// Error type for server commands
#[derive(Debug, thiserror::Error)]
pub enum ServerError {
    #[error("Server is already running")]
    AlreadyRunning,
    #[error("Server is not running")]
    NotRunning,
    #[error("Failed to locate server binary: {0}")]
    BinaryNotFound(String),
    #[error("Failed to determine resource path: {0}")]
    ResourcePathError(String),
    #[error("IO error: {0}")]
    Io(#[from] std::io::Error),
    #[error("Jan API error: {0}")]
    Tauri(#[from] tauri::Error),
}
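
// [Illustrative sketch, not part of this diff] tauri::command results cross the
// IPC boundary, so the error type must implement serde::Serialize. If the commit
// does not provide this elsewhere, the conventional pattern is to serialize the
// Display string that thiserror already derives:
impl serde::Serialize for ServerError {
    fn serialize<S: serde::Serializer>(&self, serializer: S) -> Result<S::Ok, S::Error> {
        serializer.serialize_str(&self.to_string())
    }
}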

type ServerResult<T> = Result<T, ServerError>;

// --- Helper function to find the server binary ---
// -- TODO: Adjust extension engine paths
// engine: static llama-server build (CUDA, VULKAN, SYCL, etc)
fn get_server_path(app_handle: &AppHandle) -> ServerResult<PathBuf> {
    let binary_name = if cfg!(windows) {
        "llama-server.exe"
    } else {
        "llama-server"
    };
    let relative_path = PathBuf::from("engines").join(binary_name); // TODO: ADJUST THIS PATH

    app_handle
        .path()
        .resolve_resource(relative_path)
        .map_err(|e| ServerError::ResourcePathError(e.to_string()))?
        .ok_or_else(|| {
            ServerError::BinaryNotFound(format!(
                "Could not resolve resource path for '{}'",
                if cfg!(windows) {
                    "engines/llama-server.exe"
                } else {
                    "engines/llama-server"
                } // TODO: ADJUST THIS PATH
            ))
        })
}
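
// [Illustrative note, not part of this diff] resolve_resource() can only succeed
// if the binary is actually shipped with the app, i.e. listed under
// `bundle > resources` in tauri.conf.json (for example an "engines/..." entry;
// the exact glob is an assumption). The resolved path then points into the
// platform resource directory (e.g. Contents/Resources inside the .app bundle
// on macOS, next to the executable on Windows).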

// --- Load Command ---
#[tauri::command]
pub async fn load(
    app_handle: AppHandle,      // Get the AppHandle
    state: State<'_, AppState>, // Access the shared state
    args: Vec<String>,          // Arguments from the frontend
) -> ServerResult<()> {
    let mut process_lock = state.llama_server_process.lock().await;

    if process_lock.is_some() {
        log::warn!("Attempted to load server, but it's already running.");
        return Err(ServerError::AlreadyRunning);
    }

    let server_path = get_server_path(&app_handle)?;
    log::info!("Attempting to launch server at path: {:?}", server_path);
    log::info!("Using arguments: {:?}", args);

    if !server_path.exists() {
        log::error!("Server binary not found at expected path: {:?}", server_path);
        return Err(ServerError::BinaryNotFound(format!("Binary not found at {:?}", server_path)));
    }

    // Configure the command to run the server
    let mut command = Command::new(server_path);
    command.args(args);

    // Optional: Redirect stdio if needed (e.g., for logging within Jan)
    // command.stdout(Stdio::piped());
    // command.stderr(Stdio::piped());

    // Spawn the child process
    let child = command.spawn().map_err(ServerError::Io)?;

    log::info!("Server process started with PID: {:?}", child.id());

    // Store the child process handle in the state
    *process_lock = Some(child);

    Ok(())
}
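
// [Illustrative, not part of this diff] `args` is forwarded verbatim to
// llama-server, so a caller supplies ordinary llama.cpp server flags, e.g.:
//   load(vec!["-m".into(), "/path/to/model.gguf".into(),
//             "--port".into(), "8080".into()])
// The exact flag set and model path are assumptions; they depend on the build
// shipped under engines/.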

// --- Unload Command ---
#[tauri::command]
pub async fn unload(state: State<'_, AppState>) -> ServerResult<()> {
    let mut process_lock = state.llama_server_process.lock().await;

    // Take the child process out of the Option, leaving None in its place
    if let Some(mut child) = process_lock.take() {
        log::info!(
            "Attempting to terminate server process with PID: {:?}",
            child.id()
        );
        // Kill the process
        // `start_kill` is preferred in async contexts
        match child.start_kill() {
            Ok(_) => {
                log::info!("Server process termination signal sent.");
                Ok(())
            }
            Err(e) => {
                // For simplicity, log and return the error.
                log::error!("Failed to kill server process: {}", e);
                // Putting the child back is probably not useful if the kill failed.
                // *process_lock = Some(child);
                Err(ServerError::Io(e))
            }
        }
    } else {
        log::warn!("Attempted to unload server, but it was not running.");
        Ok(())
    }
}
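
The commands above use the shared AppState from super::state, which is not part of this diff. A minimal sketch of the assumed shape, inferred from the lock().await / take() usage here and from the .manage(AppState { ... }) call further down (field types are assumptions):

pub struct AppState {
    // Token handed to the frontend; Option<String> is an assumption.
    pub app_token: Option<String>,
    // Slot for the spawned llama-server child; a tokio Mutex so the guard can
    // be held across .await points.
    pub llama_server_process: tokio::sync::Mutex<Option<tokio::process::Child>>,
}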

src-tauri/src/core/utils/extensions/mod.rs (new file, +1)
@@ -0,0 +1 @@
pub mod inference_llamacpp_extension;

@@ -76,3 +76,4 @@ pub fn normalize_path(path: &Path) -> PathBuf {
    }
    ret
}
pub mod extensions;

@@ -87,6 +87,9 @@ pub fn run() {
            // hardware
            core::hardware::get_system_info,
            core::hardware::get_system_usage,
            // llama-cpp extension
            core::utils::extensions::inference_llamacpp_extension::load,
            core::utils::extensions::inference_llamacpp_extension::unload
        ])
        .manage(AppState {
            app_token: Some(generate_app_token()),
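
The hunk above is truncated. Presumably the AppState initializer continues by seeding the new process slot, along the lines of this sketch (the initial value is an assumption):

            llama_server_process: tokio::sync::Mutex::new(None),
        })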