jan/models/starling-7b/model.json
Hoang Ha 0dd12950df
fix(magicoder): correct the id and update parameters (#1448)
fix(capybara): change description + parameters

fix(codeninja): update description + add parameters

delete(magicoder): this model is failed to load due to gguf

fix(deepseek-1.3b): update description + add parameters

fix(deepseek-34b): update description + add parameters

fix(dolphin8x7b): update description + parameters

fix(llama2-chat-7b): update description + add parameters

fix(llama2-chat-70b): update description + add parameters

fix(mistral-7b): update description + add parameters

fix(mistral): degrade to v0.1 due to giberish output from v0.2

fix(mixtral): update desciption + parameters

fix(noromaid): update description + parameters

fix(mistral7b): correct the prompt template

update(openchat): add parameters

fix(openhermesneural): update parameter + description

fix(openhermesneural): update max_tokens

delete(pandora): remove pandora

fix(phi2): update parameter

update(phind34b): update description + change to q4 + add parameter

update(solar-slerp): update parameter

fix(starling): update description + parameter

fix(openchat): add to recommended

fix(stealth): add parameters

fix(tinyllama): update description + parameters

fix(trinity): update description + parameters

fix(tulu2): update description + parameters

fix(stealth): change max_tokens to 4096

update(wizardcoder): update parameter + description

update(wizardcoder): update  description

update(wizardcoder): change to q4

fix(yarn-mistral): update parameters

fix(yarn-mistral): change to q4

update(wizardcoder): correct the size of q4 model

fix(model-extension): pump to 1.0.20

fix(tinyllama): change to q8

fix(phi-2): change to q8

fix(deepseek34b): change to q4

fix(mistral7b): update the stop token

fix(starling): remove recommended
2024-01-08 23:00:01 +07:00

28 lines
876 B
JSON

{
"source_url": "https://huggingface.co/TheBloke/Starling-LM-7B-alpha-GGUF/resolve/main/starling-lm-7b-alpha.Q4_K_M.gguf",
"id": "starling-7b",
"object": "model",
"name": "Starling alpha 7B Q4",
"version": "1.0",
"description": "Starling 7B, an upgrade of Openchat 3.5 using RLAIF, is really good at various benchmarks, especially with GPT-4 judging its performance.",
"format": "gguf",
"settings": {
"ctx_len": 4096,
"prompt_template": "GPT4 User: {prompt}<|end_of_turn|>GPT4 Assistant:"
},
"parameters": {
"temperature": 0.7,
"top_p": 0.95,
"stream": true,
"max_tokens": 4096,
"frequency_penalty": 0,
"presence_penalty": 0
},
"metadata": {
"author": "Berkeley-nest, The Bloke",
"tags": ["7B","Finetuned"],
"size": 4370000000
},
"engine": "nitro"
}