feat: add model load wait to ensure model is ready before use

2025-06-11 12:31:25 +05:30 · 2025-06-11 12:31:25 +05:30 · f463008362
commit f463008362
parent 9d4e7cb2b8
1 changed files with 21 additions and 1 deletions
--- a/extensions/llamacpp-extension/src/index.ts
+++ b/extensions/llamacpp-extension/src/index.ts
@ -369,6 +369,24 @@ export default class llamacpp_extension extends AIEngine {
    return port
  }

+  private async sleep(ms: number): Promise<void> {
+      return new Promise(resolve => setTimeout(resolve, ms))
+  }
+
+  private async waitForModelLoad(port: number, timeoutMs = 30_000): Promise<void> {
+      const start = Date.now()
+      while (Date.now() - start < timeoutMs) {
+          try {
+              const res = await fetch(`http://localhost:${port}/health`)
+              if(res.ok) {
+                  return
+              }
+          } catch (e) {}
+          await this.sleep(500) // 500 sec interval during rechecks
+      }
+      throw new Error(`Timed out loading model after ${timeoutMs}`)
+  }
+
  override async load(modelId: string): Promise<SessionInfo> {
    const sInfo = this.findSessionByModel(modelId)
    if (sInfo) {
@ -464,6 +482,8 @@ export default class llamacpp_extension extends AIEngine {
        args
      })

+      await this.waitForModelLoad(sInfo.port)
+
      // Store the session info for later use
      this.activeSessions.set(sInfo.pid, sInfo)

@ -586,7 +606,7 @@ export default class llamacpp_extension extends AIEngine {
    const url = `${baseUrl}/chat/completions`
    const headers = {
      'Content-Type': 'application/json',
-      'Authorization': `Bearer ${sessionInfo.apiKey}`,
+      'Authorization': `Bearer ${sessionInfo.api_key}`,
    }

    const body = JSON.stringify(opts)