Van Pham 67db45ff3c
chore: add model.json for Llama3 and other outdated model versions (#2773)
* chore: add model.json for Llama3 and other outdated model versions

* fix: consistency format

* fix: correct folder id

* update: bump version

* add: stop words

* fix: model.json

* Update extensions/inference-nitro-extension/resources/models/llama3-8b-instruct/model.json

* Update extensions/inference-nitro-extension/resources/models/llama3-8b-instruct/model.json

Based on suggested change

Co-authored-by: Nikolaus Kühn <nikolaus.kuehn@commercetools.com>

---------

Co-authored-by: Van-QA <van@jan.ai>
Co-authored-by: Hoang Ha <64120343+hahuyhoang411@users.noreply.github.com>
Co-authored-by: Louis <louis@jan.ai>
Co-authored-by: Nikolaus Kühn <nikolaus.kuehn@commercetools.com>
2024-04-22 21:40:22 +07:00

35 lines
1.2 KiB
JSON

{
"sources": [
{
"filename": "Meta-Llama-3-8B-Instruct-Q4_K_M.gguf",
"url": "https://huggingface.co/lmstudio-community/Meta-Llama-3-8B-Instruct-GGUF/resolve/main/Meta-Llama-3-8B-Instruct-Q4_K_M.gguf"
}
],
"id": "llama3-8b-instruct",
"object": "model",
"name": "Llama 3 8B Q4",
"version": "1.0",
"description": "Meta's Llama 3 excels at general usage situations, including chat, general world knowledge, and coding.",
"format": "gguf",
"settings": {
"ctx_len": 8192,
"prompt_template": "<|begin_of_text|><|start_header_id|>system<|end_header_id|>\n\n{system_message}<|eot_id|><|start_header_id|>user<|end_header_id|>\n\n{prompt}<|eot_id|><|start_header_id|>assistant<|end_header_id|>\n\n",
"llama_model_path": "Meta-Llama-3-8B-Instruct-Q4_K_M.gguf"
},
"parameters": {
"temperature": 0.7,
"top_p": 0.95,
"stream": true,
"max_tokens": 4096,
"stop": ["<|end_of_text|>","<|eot_id|>"],
"frequency_penalty": 0,
"presence_penalty": 0
},
"metadata": {
"author": "MetaAI",
"tags": ["8B", "Featured"],
"size": 4920000000
},
"engine": "nitro"
}