🐛fix: llama.cpp default NGL setting does not offload all layers to GPU (#5310)

* 🐛fix: llama.cpp default NGL setting does not offload all layers to GPU

* chore: cover more cases

* chore: clean up

* fix: should not show GPU section on Mac
This commit is contained in:
Louis 2025-06-17 15:30:07 +07:00 committed by GitHub
parent 50c25b65b6
commit 2899d58ad7
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194
3 changed files with 33 additions and 25 deletions

View File

@@ -17,7 +17,7 @@ export const validationRules: { [key: string]: (value: any) => boolean } = {
   presence_penalty: (value: any) => typeof value === 'number' && value >= 0 && value <= 1,
   ctx_len: (value: any) => Number.isInteger(value) && value >= 0,
-  ngl: (value: any) => Number.isInteger(value) && value >= 0,
+  ngl: (value: any) => Number.isInteger(value),
   embedding: (value: any) => typeof value === 'boolean',
   n_parallel: (value: any) => Number.isInteger(value) && value >= 0,
   cpu_threads: (value: any) => Number.isInteger(value) && value >= 0,

View File

@@ -253,11 +253,12 @@ export default class JanInferenceCortexExtension extends LocalOAIEngine {
         }
       }
     }
+    const modelSettings = extractModelLoadParams(model.settings)
     return await this.apiInstance().then((api) =>
       api
         .post('v1/models/start', {
           json: {
-            ...extractModelLoadParams(model.settings),
+            ...modelSettings,
             model: model.id,
             engine:
               model.engine === 'nitro' // Legacy model cache
@@ -282,6 +283,9 @@ export default class JanInferenceCortexExtension extends LocalOAIEngine {
             ...(this.context_shift === false
               ? { 'no-context-shift': true }
               : {}),
+            ...(modelSettings.ngl === -1 || modelSettings.ngl === undefined
+              ? { ngl: 100 }
+              : {}),
           },
           timeout: false,
           signal,

View File

@@ -371,30 +371,34 @@ function Hardware() {
         )}
         {/* GPU Information */}
-        <Card title="GPUs">
-          {hardwareData.gpus.length > 0 ? (
-            <DndContext
-              sensors={sensors}
-              collisionDetection={closestCenter}
-              onDragEnd={handleDragEnd}
-            >
-              <SortableContext
-                items={hardwareData.gpus.map((gpu) => gpu.id)}
-                strategy={verticalListSortingStrategy}
-              >
-                {hardwareData.gpus.map((gpu, index) => (
-                  <SortableGPUItem
-                    key={gpu.id || index}
-                    gpu={gpu}
-                    index={index}
-                  />
-                ))}
-              </SortableContext>
-            </DndContext>
-          ) : (
-            <CardItem title="No GPUs detected" actions={<></>} />
-          )}
-        </Card>
+        {!IS_MACOS ? (
+          <Card title="GPUs">
+            {hardwareData.gpus.length > 0 ? (
+              <DndContext
+                sensors={sensors}
+                collisionDetection={closestCenter}
+                onDragEnd={handleDragEnd}
+              >
+                <SortableContext
+                  items={hardwareData.gpus.map((gpu) => gpu.id)}
+                  strategy={verticalListSortingStrategy}
+                >
+                  {hardwareData.gpus.map((gpu, index) => (
+                    <SortableGPUItem
+                      key={gpu.id || index}
+                      gpu={gpu}
+                      index={index}
+                    />
+                  ))}
+                </SortableContext>
+              </DndContext>
+            ) : (
+              <CardItem title="No GPUs detected" actions={<></>} />
+            )}
+          </Card>
+        ) : (
+          <></>
+        )}
       </div>
     </div>
   </div>