From c8a08f11155a64a2789a233f1518a0df041df623 Mon Sep 17 00:00:00 2001
From: Louis
Date: Tue, 17 Sep 2024 09:25:55 +0700
Subject: [PATCH] fix: correct prompt template for Phi3 Medium model (#3670)

---
 extensions/inference-nitro-extension/package.json | 2 +-
 .../resources/models/phi3-medium/model.json       | 4 ++--
 2 files changed, 3 insertions(+), 3 deletions(-)

diff --git a/extensions/inference-nitro-extension/package.json b/extensions/inference-nitro-extension/package.json
index 425e4b49ca..ac3ed180a6 100644
--- a/extensions/inference-nitro-extension/package.json
+++ b/extensions/inference-nitro-extension/package.json
@@ -1,7 +1,7 @@
 {
   "name": "@janhq/inference-cortex-extension",
   "productName": "Cortex Inference Engine",
-  "version": "1.0.16",
+  "version": "1.0.17",
   "description": "This extension embeds cortex.cpp, a lightweight inference engine written in C++. See https://jan.ai.\nAdditional dependencies could be installed to run without Cuda Toolkit installation.",
   "main": "dist/index.js",
   "node": "dist/node/index.cjs.js",
diff --git a/extensions/inference-nitro-extension/resources/models/phi3-medium/model.json b/extensions/inference-nitro-extension/resources/models/phi3-medium/model.json
index 50944b9fe9..7331b2fd81 100644
--- a/extensions/inference-nitro-extension/resources/models/phi3-medium/model.json
+++ b/extensions/inference-nitro-extension/resources/models/phi3-medium/model.json
@@ -8,12 +8,12 @@
   "id": "phi3-medium",
   "object": "model",
   "name": "Phi-3 Medium Instruct Q4",
-  "version": "1.3",
+  "version": "1.4",
   "description": "Phi-3 Medium is Microsoft's latest SOTA model.",
   "format": "gguf",
   "settings": {
     "ctx_len": 128000,
-    "prompt_template": "<|user|> {prompt}<|end|><|assistant|><|end|>",
+    "prompt_template": "<|user|> {prompt}<|end|><|assistant|>",
     "llama_model_path": "Phi-3-medium-128k-instruct-Q4_K_M.gguf",
     "ngl": 33
   },