refactor unload and implement a destructor to clean up sessions

2025-05-26 11:42:18 +05:30 · 2025-05-26 11:42:18 +05:30 · c5a0ee7f6e
commit c5a0ee7f6e
parent cd36b423b6
2 changed files with 23 additions and 37 deletions
--- a/extensions/llamacpp-extension/src/index.ts
+++ b/extensions/llamacpp-extension/src/index.ts
@ -76,7 +76,7 @@ export default class llamacpp_extension extends AIEngine {
  private downloadManager
  private activeSessions: Map<string, sessionInfo> = new Map()
  private modelsBasePath!: string
-  private activeRequests: Map<string, AbortController> = new Map()
+  private enginesPath!: string

  override async onLoad(): Promise<void> {
    super.onLoad() // Calls registerEngine() from AIEngine
@ -89,8 +89,24 @@ export default class llamacpp_extension extends AIEngine {
      await getJanDataFolderPath(),
      'models',
    ])
+
+    this.enginesPath = await joinPath([await getJanDataFolderPath(), 'llamacpp', 'engines'])
  }

+  override async onUnload(): Promise<void> {
+    // Terminate all active sessions
+    for (const [sessionId, _] of this.activeSessions) {
+      try {
+        await this.unload(sessionId);
+      } catch (error) {
+        console.error(`Failed to unload session ${sessionId}:`, error);
+      }
+  }
+  
+  // Clear the sessions map
+  this.activeSessions.clear();
+}
+
  // Implement the required LocalProvider interface methods
  override async list(): Promise<modelInfo[]> {
    const modelsDir = await joinPath([this.modelsBasePath, this.provider])
@ -335,6 +351,7 @@ export default class llamacpp_extension extends AIEngine {

    try {
      const sInfo = await invoke<sessionInfo>('load_llama_model', {
+        server_path: this.enginesPath,
        args: args,
      })

@ -348,17 +365,17 @@ export default class llamacpp_extension extends AIEngine {
    }
  }

-  override async unload(opts: unloadOptions): Promise<unloadResult> {
+  override async unload(sessionId: string): Promise<unloadResult> {
    try {
      // Pass the PID as the session_id
      const result = await invoke<unloadResult>('unload_llama_model', {
-        session_id: opts.sessionId, // Using PID as session ID
+        session_id: sessionId, // Using PID as session ID
      })

      // If successful, remove from active sessions
      if (result.success) {
-        this.activeSessions.delete(opts.sessionId)
-        console.log(`Successfully unloaded model with PID ${opts.sessionId}`)
+        this.activeSessions.delete(sessionId)
+        console.log(`Successfully unloaded model with PID ${sessionId}`)
      } else {
        console.warn(`Failed to unload model: ${result.error}`)
      }
@ -496,8 +513,4 @@ export default class llamacpp_extension extends AIEngine {
  override getChatClient(sessionId: string): any {
    throw new Error('method not implemented yet')
  }
-
-  onUnload(): void {
-    throw new Error('Method not implemented.')
-  }
 }
--- a/src-tauri/src/core/utils/extensions/inference_llamacpp_extension/server.rs
+++ b/src-tauri/src/core/utils/extensions/inference_llamacpp_extension/server.rs
@ -37,33 +37,6 @@ impl serde::Serialize for ServerError {

 type ServerResult<T> = Result<T, ServerError>;

-// --- Helper function to find the server binary ---
-// -- TODO: Adjust extension engine paths
-// engine: static llama-server build (CUDA, VULKAN, SYCL, etc)
-fn get_server_path(app_handle: &AppHandle) -> ServerResult<PathBuf> {
-    let binary_name = if cfg!(windows) {
-        "llama-server.exe"
-    } else {
-        "llama-server"
-    };
-    let relative_path = PathBuf::from("engines").join(binary_name); // TODO: ADJUST THIS PATH
-
-    app_handle
-        .path()
-        .resolve(relative_path, BaseDirectory::Resource)
-        .map_err(|e| ServerError::ResourcePathError(e.to_string()))
-    // .ok_or_else(|| {
-    //     ServerError::BinaryNotFound(format!(
-    //         "Could not resolve resource path for '{}'",
-    //         if cfg!(windows) {
-    //             "engines/llama-server.exe"
-    //         } else {
-    //             "engines/llama-server"
-    //         } // TODO: ADJUST THIS PATH
-    //     ))
-    // })
-}
-
 #[derive(Debug, Serialize, Deserialize)]
 pub struct SessionInfo {
    pub session_id: String,       // opaque handle for unload/chat
@ -82,6 +55,7 @@ pub struct UnloadResult {
 pub async fn load_llama_model(
    app_handle: AppHandle,      // Get the AppHandle
    state: State<'_, AppState>, // Access the shared state
+    server_path: String,
    args: Vec<String>,          // Arguments from the frontend
 ) -> ServerResult<SessionInfo> {
    let mut process_lock = state.llama_server_process.lock().await;
@ -91,7 +65,6 @@ pub async fn load_llama_model(
        return Err(ServerError::AlreadyRunning);
    }

-    let server_path = get_server_path(&app_handle)?;
    log::info!("Attempting to launch server at path: {:?}", server_path);
    log::info!("Using arguments: {:?}", args);