* add(mixtral): add model.json for mixtral
* archived some models + update the model.json
* add(model): add pandora 10.7b
* fix(model): update description
* fix(model): bump version and change the featured model to trinity
* fix(model): archive neuralchat
* fix(model): deprecate all old models
* fix(trinity): add cover image and change description
* fix(trinity): update cover png
* add(pandora): cover image
* fix(pandora): cover image
* chore: model desc nits
* fix(models): adjust the size for solars and pandoras
* add(mixtral): description

---------

Co-authored-by: 0xSage <n@pragmatic.vc>
model.json · 23 lines · 784 B · JSON
{
  "source_url": "https://huggingface.co/TheBloke/Mixtral-8x7B-Instruct-v0.1-GGUF/resolve/main/mixtral-8x7b-instruct-v0.1.Q4_K_M.gguf",
  "id": "mixtral-8x7b-instruct",
  "object": "model",
  "name": "Mixtral 8x7B Instruct Q4",
  "version": "1.0",
  "description": "The Mixtral-8x7B Large Language Model (LLM) is a pretrained generative Sparse Mixture of Experts. The Mixtral-8x7B outperforms Llama 2 70B on most benchmarks we tested.",
  "format": "gguf",
  "settings": {
    "ctx_len": 2048,
    "prompt_template": "[INST] {prompt} [/INST]"
  },
  "parameters": {
    "max_tokens": 2048
  },
  "metadata": {
    "author": "MistralAI, TheBloke",
    "tags": ["MOE", "Foundational Model"],
    "size": 26440000000
  },
  "engine": "nitro"
}
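For context, the `prompt_template` field carries a `{prompt}` placeholder that the runtime fills with the user's input before inference. Below is a minimal TypeScript sketch of reading this config and rendering the template; the `ModelConfig` interface and `renderPrompt` helper are illustrative assumptions for this example, not actual Jan/Nitro APIs.

```typescript
// Illustrative sketch only: ModelConfig and renderPrompt are hypothetical
// names for this example, not part of the actual Jan/Nitro codebase.
import { readFileSync } from "fs";

interface ModelConfig {
  id: string;
  settings: { ctx_len: number; prompt_template: string };
  parameters: { max_tokens: number };
}

// Substitute the {prompt} placeholder in the template with the user's input.
function renderPrompt(template: string, prompt: string): string {
  return template.replace("{prompt}", prompt);
}

const config: ModelConfig = JSON.parse(readFileSync("model.json", "utf-8"));

console.log(renderPrompt(config.settings.prompt_template, "Why is the sky blue?"));
// => [INST] Why is the sky blue? [/INST]
```

Note that `ctx_len` and `max_tokens` are both 2048 here, so a long rendered prompt leaves correspondingly less room for the completion within the context window.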