From bcf4361739f5a71c75a651763da222a179f96f66 Mon Sep 17 00:00:00 2001
From: hahuyhoang411
Date: Sun, 5 May 2024 00:16:55 +0700
Subject: [PATCH] fix: correct ctx

---
 .../resources/models/wizardcoder-13b/model.json | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/extensions/inference-nitro-extension/resources/models/wizardcoder-13b/model.json b/extensions/inference-nitro-extension/resources/models/wizardcoder-13b/model.json
index cae96c26b9..b7e84bf88b 100644
--- a/extensions/inference-nitro-extension/resources/models/wizardcoder-13b/model.json
+++ b/extensions/inference-nitro-extension/resources/models/wizardcoder-13b/model.json
@@ -12,7 +12,7 @@
   "description": "WizardCoder 13B is a Python coding model. This model demonstrate high proficiency in specific domains like coding and mathematics.",
   "format": "gguf",
   "settings": {
-    "ctx_len": 4096,
+    "ctx_len": 16384,
     "prompt_template": "### Instruction:\n{prompt}\n### Response:",
     "llama_model_path": "wizardcoder-python-13b-v1.0.Q4_K_M.gguf"
   },
@@ -20,7 +20,7 @@
     "temperature": 0.7,
     "top_p": 0.95,
     "stream": true,
-    "max_tokens": 4096,
+    "max_tokens": 16384,
     "stop": [],
     "frequency_penalty": 0,
     "presence_penalty": 0