Chore: Add phi-3 (#2794)
* add: phi-3 * chore: bump version * fix: correct model id
This commit is contained in:
parent
f288a86647
commit
3c294d6a48
@ -1,7 +1,7 @@
|
|||||||
{
|
{
|
||||||
"name": "@janhq/inference-nitro-extension",
|
"name": "@janhq/inference-nitro-extension",
|
||||||
"productName": "Nitro Inference Engine",
|
"productName": "Nitro Inference Engine",
|
||||||
"version": "1.0.2",
|
"version": "1.0.3",
|
||||||
"description": "This extension embeds Nitro, a lightweight (3mb) inference engine written in C++. See https://nitro.jan.ai.\nAdditional dependencies could be installed to run without Cuda Toolkit installation.",
|
"description": "This extension embeds Nitro, a lightweight (3mb) inference engine written in C++. See https://nitro.jan.ai.\nAdditional dependencies could be installed to run without Cuda Toolkit installation.",
|
||||||
"main": "dist/index.js",
|
"main": "dist/index.js",
|
||||||
"node": "dist/node/index.cjs.js",
|
"node": "dist/node/index.cjs.js",
|
||||||
|
|||||||
@ -0,0 +1,32 @@
|
|||||||
|
{
|
||||||
|
"sources": [
|
||||||
|
{
|
||||||
|
"url": "https://huggingface.co/microsoft/Phi-3-mini-4k-instruct-gguf/resolve/main/Phi-3-mini-4k-instruct-q4.gguf",
|
||||||
|
"filename": "Phi-3-mini-4k-instruct-q4.gguf"
|
||||||
|
}
|
||||||
|
],
|
||||||
|
"id": "phi3-3.8b",
|
||||||
|
"object": "model",
|
||||||
|
"name": "Phi-3 Mini",
|
||||||
|
"version": "1.0",
|
||||||
|
"description": "Phi-3 Mini is Microsoft's newest, compact model designed for mobile use.",
|
||||||
|
"format": "gguf",
|
||||||
|
"settings": {
|
||||||
|
"ctx_len": 4096,
|
||||||
|
"prompt_template": "<|system|>\n{system_message}<|end|>\n<|user|>\n{prompt}<|end|>\n<|assistant|>\n",
|
||||||
|
"llama_model_path": "Phi-3-mini-4k-instruct-q4.gguf"
|
||||||
|
},
|
||||||
|
"parameters": {
|
||||||
|
"max_tokens": 4096,
|
||||||
|
"stop": ["<|end|>"]
|
||||||
|
},
|
||||||
|
"metadata": {
|
||||||
|
"author": "Microsoft",
|
||||||
|
"tags": [
|
||||||
|
"3B",
|
||||||
|
"Finetuned"
|
||||||
|
],
|
||||||
|
"size": 2320000000
|
||||||
|
},
|
||||||
|
"engine": "nitro"
|
||||||
|
}
|
||||||
Loading…
x
Reference in New Issue
Block a user