From db62d1e649f5f9a6f63bbf4f805ad4b6fece1428 Mon Sep 17 00:00:00 2001
From: kingbri
Date: Sat, 23 Mar 2024 20:29:17 -0400
Subject: [PATCH] OAI: Log request errors to console

Previously, some request errors were only sent to the client, but some
clients don't log the full error, so log it to the console as well.

Signed-off-by: kingbri
---
 endpoints/OAI/app.py | 83 ++++++++++++++++++++++++++++++++------------
 1 file changed, 61 insertions(+), 22 deletions(-)

diff --git a/endpoints/OAI/app.py b/endpoints/OAI/app.py
index 84b7bde3..6c523d2b 100644
--- a/endpoints/OAI/app.py
+++ b/endpoints/OAI/app.py
@@ -162,7 +162,12 @@ async def load_model(request: Request, data: ModelLoadRequest):
 
     # Verify request parameters
     if not data.name:
-        raise HTTPException(400, "A model name was not provided.")
+        error_message = handle_request_error(
+            "A model name was not provided for load.",
+            exc_info=False,
+        ).error.message
+
+        raise HTTPException(400, error_message)
 
     model_path = pathlib.Path(unwrap(config.model_config().get("model_dir"), "models"))
     model_path = model_path / data.name
@@ -170,16 +175,24 @@
     draft_model_path = None
     if data.draft:
         if not data.draft.draft_model_name:
-            raise HTTPException(
-                400, "draft_model_name was not found inside the draft object."
-            )
+            error_message = handle_request_error(
+                "Could not find the draft model name for model load.",
+                exc_info=False,
+            ).error.message
+
+            raise HTTPException(400, error_message)
 
         draft_model_path = unwrap(
             config.draft_model_config().get("draft_model_dir"), "models"
         )
 
     if not model_path.exists():
-        raise HTTPException(400, "model_path does not exist. Check model_name?")
+        error_message = handle_request_error(
+            "Could not find the model path for load. Check model name or config.yml?",
+            exc_info=False,
+        ).error.message
+
+        raise HTTPException(400, error_message)
 
     load_callback = partial(stream_model_load, data, model_path, draft_model_path)
 
@@ -220,13 +233,23 @@ async def get_templates():
 async def switch_template(data: TemplateSwitchRequest):
     """Switch the currently loaded template"""
     if not data.name:
-        raise HTTPException(400, "New template name not found.")
+        error_message = handle_request_error(
+            "New template name not found.",
+            exc_info=False,
+        ).error.message
+
+        raise HTTPException(400, error_message)
 
     try:
         template = get_template_from_file(data.name)
         model.container.prompt_template = template
     except FileNotFoundError as e:
-        raise HTTPException(400, "Template does not exist. Check the name?") from e
+        error_message = handle_request_error(
+            f"The template name {data.name} doesn't exist. Check the spelling?",
+            exc_info=False,
+        ).error.message
+
+        raise HTTPException(400, error_message) from e
 
 
 @app.post(
@@ -259,15 +282,22 @@ async def switch_sampler_override(data: SamplerOverrideSwitchRequest):
         try:
             sampling.overrides_from_file(data.preset)
         except FileNotFoundError as e:
-            raise HTTPException(
-                400, "Sampler override preset does not exist. Check the name?"
-            ) from e
+            error_message = handle_request_error(
+                f"Sampler override preset with name {data.preset} does not exist. "
+                + "Check the spelling?",
+                exc_info=False,
+            ).error.message
+
+            raise HTTPException(400, error_message) from e
     elif data.overrides:
         sampling.overrides_from_dict(data.overrides)
     else:
-        raise HTTPException(
-            400, "A sampler override preset or dictionary wasn't provided."
-        )
+        error_message = handle_request_error(
+            "A sampler override preset or dictionary wasn't provided.",
+            exc_info=False,
+        ).error.message
+
+        raise HTTPException(400, error_message)
 
 
 @app.post(
@@ -322,14 +352,21 @@
 
 async def load_lora(data: LoraLoadRequest):
     """Loads a LoRA into the model container."""
     if not data.loras:
-        raise HTTPException(400, "List of loras to load is not found.")
+        error_message = handle_request_error(
+            "List of loras to load is not found.",
+            exc_info=False,
+        ).error.message
+
+        raise HTTPException(400, error_message)
 
     lora_dir = pathlib.Path(unwrap(config.lora_config().get("lora_dir"), "loras"))
     if not lora_dir.exists():
-        raise HTTPException(
-            400,
-            "A parent lora directory does not exist. Check your config.yml?",
-        )
+        error_message = handle_request_error(
+            "A parent lora directory does not exist for load. Check your config.yml?",
+            exc_info=False,
+        ).error.message
+
+        raise HTTPException(400, error_message)
 
     load_callback = partial(model.load_loras, lora_dir, **data.model_dump())
@@ -459,10 +496,12 @@
 
 async def chat_completion_request(request: Request, data: ChatCompletionRequest):
     """Generates a chat completion from a prompt."""
 
     if model.container.prompt_template is None:
-        raise HTTPException(
-            422,
-            "This endpoint is disabled because a prompt template is not set.",
-        )
+        error_message = handle_request_error(
+            "Chat completions are disabled because a prompt template is not set.",
+            exc_info=False,
+        ).error.message
+
+        raise HTTPException(422, error_message)
 
     model_path = model.container.get_model_path()
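
Note: the diff assumes a handle_request_error helper, defined elsewhere in
the tabbyAPI tree, that writes the message to the console and returns an
object exposing .error.message for the client-facing text. Below is a
minimal sketch of that contract using Python's standard logging module;
the names and shape are illustrative assumptions, not the project's
actual implementation.

    import logging
    from types import SimpleNamespace

    logger = logging.getLogger(__name__)

    def handle_request_error(message: str, exc_info: bool = True):
        """Log a request error to the console and wrap it for the client."""

        # Console logging is the point of this patch: the error stays
        # visible server-side even when a client hides the response detail.
        # exc_info=False skips the traceback for plain validation errors.
        logger.error(message, exc_info=exc_info)

        # Mirror the .error.message access pattern used in the diff
        # (illustrative wrapper, not tabbyAPI's real return type)
        return SimpleNamespace(error=SimpleNamespace(message=message))

Under a shape like this, handle_request_error(msg, exc_info=False).error.message
both logs the text and yields the string handed to HTTPException, which is
why every call site above reads the message back off the return value.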