From ada6138932deea316a5026450e108dfafcf3b957 Mon Sep 17 00:00:00 2001 From: Juan Calderon-Perez <835733+gaby@users.noreply.github.com> Date: Tue, 26 Dec 2023 23:56:27 -0500 Subject: [PATCH 1/3] Fix inefficient model check during chat creation --- api/src/serge/routers/chat.py | 9 ++------- 1 file changed, 2 insertions(+), 7 deletions(-) diff --git a/api/src/serge/routers/chat.py b/api/src/serge/routers/chat.py index 7cd0bd289d1..78fb452e08c 100644 --- a/api/src/serge/routers/chat.py +++ b/api/src/serge/routers/chat.py @@ -30,13 +30,8 @@ async def create_new_chat( init_prompt: str = "Below is an instruction that describes a task. Write a response that appropriately completes the request.", n_threads: int = 4, ): - try: - client = Llama( - model_path=f"/usr/src/app/weights/{model}.bin", - ) - del client - except Exception as exc: - raise ValueError(f"Model can't be found: {exc}") + if not os.path.exists(f"/usr/src/app/weights/{model}.bin"): + raisd ValueError(f"Model can't be found: /usr/src/app/weights/{model}.bin") client = Redis(host="localhost", port=6379, decode_responses=False) From 1303d50006a58bd975887b4923f42663ea20e6e1 Mon Sep 17 00:00:00 2001 From: Juan Calderon-Perez <835733+gaby@users.noreply.github.com> Date: Tue, 26 Dec 2023 23:58:51 -0500 Subject: [PATCH 2/3] Update chat.py --- api/src/serge/routers/chat.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/api/src/serge/routers/chat.py b/api/src/serge/routers/chat.py index 78fb452e08c..963911d1f19 100644 --- a/api/src/serge/routers/chat.py +++ b/api/src/serge/routers/chat.py @@ -31,7 +31,7 @@ async def create_new_chat( n_threads: int = 4, ): if not os.path.exists(f"/usr/src/app/weights/{model}.bin"): - raisd ValueError(f"Model can't be found: /usr/src/app/weights/{model}.bin") + raise ValueError(f"Model can't be found: /usr/src/app/weights/{model}.bin") client = Redis(host="localhost", port=6379, decode_responses=False) From a267bea0bc3c24c6ef70294966e7e532c5b4652a Mon Sep 17 00:00:00 
2001 From: Juan Calderon-Perez <835733+gaby@users.noreply.github.com> Date: Wed, 27 Dec 2023 00:01:10 -0500 Subject: [PATCH 3/3] Update chat.py --- api/src/serge/routers/chat.py | 2 ++ 1 file changed, 2 insertions(+) diff --git a/api/src/serge/routers/chat.py b/api/src/serge/routers/chat.py index 963911d1f19..6de156812f4 100644 --- a/api/src/serge/routers/chat.py +++ b/api/src/serge/routers/chat.py @@ -1,3 +1,5 @@ +import os + from typing import Optional from fastapi import APIRouter, HTTPException from langchain.memory import RedisChatMessageHistory