From a09a486906931ad477c322aaf7b0cfe09af62d18 Mon Sep 17 00:00:00 2001 From: hahuyhoang411 Date: Fri, 15 Dec 2023 16:36:39 +0700 Subject: [PATCH] fix(tinyllama): adjust ctx+maxtok --- models/tinyllama-1.1b/model.json | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/models/tinyllama-1.1b/model.json b/models/tinyllama-1.1b/model.json index 3dd5bcecf..d924be046 100644 --- a/models/tinyllama-1.1b/model.json +++ b/models/tinyllama-1.1b/model.json @@ -7,11 +7,11 @@ "description": "The TinyLlama project, featuring a 1.1B parameter Llama model, is pretrained on an expansive 3 trillion token dataset. Its design ensures easy integration with various Llama-based open-source projects. Despite its smaller size, it efficiently utilizes lower computational and memory resources, drawing on GPT-4's analytical prowess to enhance its conversational abilities and versatility.", "format": "gguf", "settings": { - "ctx_len": 4096, + "ctx_len": 2048, "prompt_template": "<|system|>\n{system_message}<|user|>\n{prompt}<|assistant|>" }, "parameters": { - "max_tokens": 4096 + "max_tokens": 2048 }, "metadata": { "author": "TinyLlama",