diff --git a/models/storytelling-70b/model.json b/models/storytelling-70b/model.json deleted file mode 100644 index 76e6f7922..000000000 --- a/models/storytelling-70b/model.json +++ /dev/null @@ -1,24 +0,0 @@ -{ - "source_url": "https://huggingface.co/TheBloke/GOAT-70B-Storytelling-GGUF/resolve/main/goat-70b-storytelling.Q5_K_M.gguf", - "id": "storytelling-70b", - "object": "model", - "name": "Storytelling 70B", - "version": "1.0", - "description": "The GOAT-70B-Storytelling model is designed for autonomous story-writing, including crafting books and movie scripts. Based on the LLaMA 2 70B architecture, this model excels in generating cohesive and engaging narratives using inputs like plot outlines and character profiles.", - "format": "gguf", - "settings": { - "ctx_len": 4096, - "system_prompt": "", - "user_prompt": "### USER: ", - "ai_prompt": "\n### ASSISTANT: " - }, - "parameters": { - "max_tokens": 4096 - }, - "metadata": { - "author": "GOAT-AI, The Bloke", - "tags": ["General Use", "Writing"], - "size": 48750000000 - } - } - \ No newline at end of file diff --git a/models/xwin-70b/model.json b/models/xwin-70b/model.json deleted file mode 100644 index a5c1647b0..000000000 --- a/models/xwin-70b/model.json +++ /dev/null @@ -1,24 +0,0 @@ -{ - "source_url": "https://huggingface.co/TheBloke/Xwin-LM-70B-V0.1-GGUF/resolve/main/xwin-lm-70b-v0.1.Q5_K_M.gguf", - "id": "xwin-70b", - "object": "model", - "name": "Xwin LM 70B", - "version": "1.0", - "description": "Xwin-LM, based on Llama2 models, emphasizes alignment and exhibits advanced language understanding, text generation, and role-playing abilities.", - "format": "gguf", - "settings": { - "ctx_len": 4096, - "system_prompt": "", - "user_prompt": "USER: ", - "ai_prompt": "ASSISTANT: " - }, - "parameters": { - "max_tokens": 4096 - }, - "metadata": { - "author": "Xwin-LM, The Bloke", - "tags": ["General Use", "Role-playing"], - "size": 48750000000 - } - } - \ No newline at end of file diff --git a/models/yarn-70b/model.json b/models/yarn-70b/model.json deleted file mode 100644 index 67d8d3804..000000000 --- a/models/yarn-70b/model.json +++ /dev/null @@ -1,21 +0,0 @@ -{ - "source_url": "https://huggingface.co/TheBloke/Yarn-Llama-2-70B-32k-GGUF/resolve/main/yarn-llama-2-70b-32k.Q5_K_M.gguf", - "id": "yarn-70b", - "object": "model", - "name": "Yarn 32k 70B", - "version": "1,0", - "description": "Yarn-Llama-2-70b-32k is designed specifically for handling long contexts. It represents an extension of the Llama-2-70b-hf model, now supporting a 32k token context window.", - "format": "gguf", - "settings": { - "ctx_len": 4096 - }, - "parameters": { - "max_tokens": 4096 - }, - "metadata": { - "author": "NousResearch, The Bloke", - "tags": ["General Use", "Big Context Length"], - "size": 48750000000 - } - } - \ No newline at end of file