* fix: move tensorrt executable to engine (#2400) * fix: move tensorrt executable to engine Signed-off-by: James <james@jan.ai> * some update Signed-off-by: hiro <hiro@jan.ai> * chore: bump tensorrt version * fix: wrong destroy path * fix: install extensions in parallel * chore: update path for tensorrt engine (#2404) Signed-off-by: James <james@jan.ai> Co-authored-by: James <james@jan.ai> --------- Signed-off-by: James <james@jan.ai> Signed-off-by: hiro <hiro@jan.ai> Co-authored-by: James <james@jan.ai> Co-authored-by: hiro <hiro@jan.ai> Co-authored-by: Louis <louis@jan.ai> * Release/v0.4.9 (#2421) * fix: turn off experimental settings should also turn off quick ask (#2411) * fix: app glitches 1s generating response before starting model (#2412) * fix: disable experimental feature should also disable vulkan (#2414) * fix: model load stuck on windows when can't get CPU core count (#2413) Signed-off-by: James <james@jan.ai> Co-authored-by: James <james@jan.ai> * feat: TensorRT-LLM engine update support (#2415) * fix: engine update * chore: add remove prepopulated models Signed-off-by: James <james@jan.ai> * update tinyjensen url Signed-off-by: James <james@jan.ai> * update llamacorn Signed-off-by: James <james@jan.ai> * update Mistral 7B Instruct v0.1 int4 Signed-off-by: James <james@jan.ai> * update tensorrt Signed-off-by: James <james@jan.ai> * update Signed-off-by: hiro <hiro@jan.ai> * update Signed-off-by: James <james@jan.ai> * prettier Signed-off-by: James <james@jan.ai> * update mistral config Signed-off-by: James <james@jan.ai> * fix some lint Signed-off-by: James <james@jan.ai> --------- Signed-off-by: James <james@jan.ai> Signed-off-by: hiro <hiro@jan.ai> Co-authored-by: James <james@jan.ai> Co-authored-by: hiro <hiro@jan.ai> * Tensorrt LLM disable turing support (#2418) Co-authored-by: Hien To <tominhhien97@gmail.com> * chore: add prompt template tensorrtllm (#2375) * chore: add prompt template tensorrtllm * Add Prompt template for mistral and correct 
model metadata --------- Co-authored-by: Hien To <tominhhien97@gmail.com> * fix: correct tensorrt mistral model.json (#2419) --------- Signed-off-by: James <james@jan.ai> Signed-off-by: hiro <hiro@jan.ai> Co-authored-by: Louis <louis@jan.ai> Co-authored-by: James <james@jan.ai> Co-authored-by: hiro <hiro@jan.ai> Co-authored-by: hiento09 <136591877+hiento09@users.noreply.github.com> Co-authored-by: Hien To <tominhhien97@gmail.com> --------- Signed-off-by: James <james@jan.ai> Signed-off-by: hiro <hiro@jan.ai> Co-authored-by: NamH <NamNh0122@gmail.com> Co-authored-by: James <james@jan.ai> Co-authored-by: hiro <hiro@jan.ai> Co-authored-by: hiento09 <136591877+hiento09@users.noreply.github.com> Co-authored-by: Hien To <tominhhien97@gmail.com>
77 lines
2.2 KiB
JSON
77 lines
2.2 KiB
JSON
{
  "name": "@janhq/tensorrt-llm-extension",
  "version": "0.0.3",
  "description": "This extension enables Nvidia's TensorRT-LLM for the fastest GPU acceleration. See the [setup guide](https://jan.ai/guides/providers/tensorrt-llm/) for next steps.",
  "main": "dist/index.js",
  "node": "dist/node/index.cjs.js",
  "author": "Jan <service@jan.ai>",
  "license": "AGPL-3.0",
  "config": {
    "host": "127.0.0.1",
    "port": "3929"
  },
  "compatibility": {
    "platform": [
      "win32"
    ],
    "app": [
      "0.1.0"
    ]
  },
  "tensorrtVersion": "0.1.8",
  "provider": "nitro-tensorrt-llm",
  "scripts": {
    "build": "tsc --module commonjs && rollup -c rollup.config.ts",
    "build:publish:win32": "rimraf *.tgz --glob && npm run build && cpx \"bin/**\" \"dist/bin\" && npm pack && cpx *.tgz ../../pre-install",
    "build:publish:linux": "rimraf *.tgz --glob && npm run build && cpx \"bin/**\" \"dist/bin\" && npm pack && cpx *.tgz ../../pre-install",
    "build:publish:darwin": "rimraf *.tgz --glob && npm run build && cpx \"bin/**\" \"dist/bin\" && npm pack && cpx *.tgz ../../pre-install",
    "build:publish": "run-script-os"
  },
  "exports": {
    ".": "./dist/index.js",
    "./main": "./dist/node/index.cjs.js"
  },
  "devDependencies": {
    "@rollup/plugin-commonjs": "^25.0.7",
    "@rollup/plugin-json": "^6.1.0",
    "@rollup/plugin-node-resolve": "^15.2.3",
    "@rollup/plugin-replace": "^5.0.5",
    "@types/node": "^20.11.4",
    "@types/os-utils": "^0.0.4",
    "@types/tcp-port-used": "^1.0.4",
    "@types/decompress": "4.2.7",
    "cpx": "^1.5.0",
    "download-cli": "^1.1.1",
    "rimraf": "^3.0.2",
    "rollup": "^2.38.5",
    "rollup-plugin-define": "^1.0.1",
    "rollup-plugin-sourcemaps": "^0.6.3",
    "rollup-plugin-typescript2": "^0.36.0",
    "run-script-os": "^1.1.6",
    "typescript": "^5.2.2"
  },
  "dependencies": {
    "@janhq/core": "file:../../core",
    "decompress": "^4.2.1",
    "fetch-retry": "^5.0.6",
    "path-browserify": "^1.0.1",
    "rxjs": "^7.8.1",
    "tcp-port-used": "^1.0.2",
    "ulid": "^2.3.0"
  },
  "engines": {
    "node": ">=18.0.0"
  },
  "files": [
    "dist/*",
    "package.json",
    "README.md"
  ],
  "bundleDependencies": [
    "tcp-port-used",
    "fetch-retry",
    "decompress",
    "@janhq/core"
  ]
}