diff --git a/models/merlinite-7b/model.json b/models/merlinite-7b/model.json new file mode 100644 index 000000000..a7beaef3a --- /dev/null +++ b/models/merlinite-7b/model.json @@ -0,0 +1,35 @@ +{ + "sources": [ + { + "filename": "merlinite-7b-Q4_K_M.gguf", + "url": "https://huggingface.co/ibm/merlinite-7b-GGUF/resolve/main/merlinite-7b-Q4_K_M.gguf" + } + ], + "id": "merlinite-7b", + "object": "model", + "name": "Merlinite 7B Q4", + "version": "1.0", + "description": "", + "format": "gguf", + "settings": { + "ctx_len": 4096, + "prompt_template": "<|system|>\n{system_prompt}\n<|user|>\n{prompt}\n<|assistant|>\n", + "llama_model_path": "merlinite-7b-Q4_K_M.gguf" + }, + "parameters": { + "temperature": 0.7, + "top_p": 0.95, + "stream": true, + "max_tokens": 4096, + "stop": [], + "frequency_penalty": 0, + "presence_penalty": 0 + }, + "metadata": { + "author": "IBM", + "tags": ["7B", "Finetuned"], + "size": 4370000000 + }, + "engine": "nitro" + } + \ No newline at end of file