Spaces:

KiWA001
/

kai-api-gateway

Running

App Files Files Community

KiWA001 committed 3 days ago

Commit

b544391

1 Parent(s): 45ac16b

feat: standard openai error handling

Browse files

Files changed (3) hide show

error_handling.py +51 -0
main.py +20 -0
v1_router.py +21 -8

error_handling.py ADDED Viewed

	@@ -0,0 +1,51 @@

+from fastapi import Request
+from fastapi.responses import JSONResponse
+def openai_error(message: str, code: str, type: str = "invalid_request_error", status_code: int = 400):
+    """
+    Return an OpenAI-formatted error response.
+
+    Args:
+        message: Text placed in ``error.message``.
+        code: Identifier placed in ``error.code``.
+        type: Category placed in ``error.type``; defaults to
+            ``"invalid_request_error"``.
+        status_code: HTTP status of the response; defaults to 400.
+
+    Returns:
+        A ``JSONResponse`` whose body is ``{"error": {...}}`` with the keys
+        ``message``, ``type``, ``param`` and ``code``.
+    """
+    # NOTE(review): the ``type`` parameter shadows the builtin of the same
+    # name inside this function. Renaming it would break keyword callers,
+    # so it is left unchanged here.
+    return JSONResponse(
+        status_code=status_code,
+        content={
+            "error": {
+                "message": message,
+                "type": type,
+                # Always emitted as null; this helper offers no way to set it.
+                "param": None,
+                "code": code
+            }
+        }
+    )
+# Common Errors
+def error_invalid_api_key():
+    """
+    Return the 401 response for a rejected API key.
+
+    The body uses type ``authentication_error`` and code ``invalid_api_key``.
+    """
+    return openai_error(
+        "Incorrect API key provided.",
+        "invalid_api_key",
+        "authentication_error",
+        401
+    )
+def error_quota_exceeded():
+    """
+    Return the 429 response for an exhausted quota.
+
+    Both ``error.type`` and ``error.code`` are set to ``insufficient_quota``.
+    """
+    return openai_error(
+        "You have exceeded your current quota, please check your plan and billing details.",
+        "insufficient_quota",
+        "insufficient_quota",
+        429
+    )
+def error_model_not_found(model_name: str):
+    """
+    Return the 404 response for an unknown model.
+
+    Args:
+        model_name: Name interpolated into the error message.
+
+    The body uses type ``invalid_request_error`` and code ``model_not_found``.
+    """
+    return openai_error(
+        f"The model '{model_name}' does not exist",
+        "model_not_found",
+        "invalid_request_error",
+        404
+    )
+def error_server(message: str):
+    """
+    Return the 500 response for a server-side failure.
+
+    Args:
+        message: Text placed in ``error.message`` unchanged.
+
+    The body uses type ``server_error`` and code ``internal_server_error``.
+    """
+    # NOTE(review): the message is sent to the client verbatim, so a caller
+    # that passes raw exception text exposes it in the response body.
+    return openai_error(
+        message,
+        "internal_server_error",
+        "server_error",
+        500
+    )

main.py CHANGED Viewed

@@ -69,6 +69,26 @@ app = FastAPI(
 # Mount static files (for CSS/JS if needed later)
 app.mount("/static", StaticFiles(directory="static"), name="static")
 # CORS middleware
 app.add_middleware(
     CORSMiddleware,

 # Mount static files (for CSS/JS if needed later)
 app.mount("/static", StaticFiles(directory="static"), name="static")
+# Error Handling (Global)
+from error_handling import openai_error
+@app.exception_handler(HTTPException)
+async def http_exception_handler(request: Request, exc: HTTPException):
+    """
+    Override default 404/401/500 to return OpenAI-style JSON.
+
+    The ``error.code`` is chosen from the exception's status code:
+    401 -> ``invalid_api_key``, 429 -> ``insufficient_quota``,
+    404 -> ``model_not_found``, 500 -> ``internal_server_error``;
+    any other status keeps ``invalid_request_error``.
+
+    Args:
+        request: The incoming request (not used in the body).
+        exc: The raised ``HTTPException``; its ``detail`` becomes the message
+            and its ``status_code`` becomes the HTTP status.
+    """
+    # Fallback code for statuses without a specific mapping below.
+    code = "invalid_request_error"
+    if exc.status_code == 401: code = "invalid_api_key"
+    if exc.status_code == 429: code = "insufficient_quota"
+    # NOTE(review): every 404 is labelled model_not_found, whatever resource
+    # was actually missing -- confirm this is intended.
+    if exc.status_code == 404: code = "model_not_found"
+    if exc.status_code == 500: code = "internal_server_error"
+    # NOTE(review): ``type`` is not passed, so openai_error's default
+    # ("invalid_request_error") is used for every status, including 401/429/500.
+    # NOTE(review): exc.detail is forwarded as-is; presumably a string, but it
+    # is not converted here -- TODO confirm.
+    return openai_error(
+        message=exc.detail,
+        code=code,
+        status_code=exc.status_code
+    )
 # CORS middleware
 app.add_middleware(
     CORSMiddleware,

v1_router.py CHANGED Viewed

@@ -8,6 +8,13 @@ from config import DEMO_API_KEY
 from db import get_supabase
 from services import engine
 from utils import calculate_usage
 # Initialize Router
 router = APIRouter()
@@ -77,7 +84,7 @@ async def verify_api_key(
         token = x_api_key
     if not token:
-        raise HTTPException(status_code=401, detail="Missing API Key")
     # 1. Check Demo Key
     if token == DEMO_API_KEY:
@@ -86,15 +93,14 @@ async def verify_api_key(
     # 2. Check Database
     supabase = get_supabase()
     if not supabase:
-        # Fallback if DB is down but key matches verified format? No, safer to reject.
-        raise HTTPException(status_code=503, detail="Auth service unavailable")
     try:
         # Check if key exists and is active
         res = supabase.table("api_keys").select("*").eq("token", token).execute()
         if not res.data:
-            raise HTTPException(status_code=401, detail="Invalid API Key")
         key_data = res.data[0]
@@ -102,18 +108,19 @@ async def verify_api_key(
             raise HTTPException(status_code=403, detail="API Key is inactive")
         # Check limits
-        # Note: We check limit BEFORE processing, but update usage AFTER (bg task)
         current_usage = key_data.get("usage_tokens", 0)
         limit = key_data.get("limit_tokens", 0)
         if limit > 0 and current_usage >= limit:
-             raise HTTPException(status_code=429, detail="Quota exceeded")
         return key_data
     except Exception as e:
         print(f"Auth Error: {e}")
-        raise HTTPException(status_code=500, detail="Auth Error")
 # --- Background Task for Usage Update ---
@@ -208,5 +215,11 @@ async def chat_completions(
             usage=UsageInfo(**usage)
         )
     except Exception as e:
-        raise HTTPException(status_code=500, detail=str(e))

 from db import get_supabase
 from services import engine
 from utils import calculate_usage
+from error_handling import (
+    openai_error,
+    error_invalid_api_key,
+    error_quota_exceeded,
+    error_model_not_found,
+    error_server
+)
 # Initialize Router
 router = APIRouter()
         token = x_api_key
     if not token:
+        raise HTTPException(status_code=401, detail="Incorrect API Key")
     # 1. Check Demo Key
     if token == DEMO_API_KEY:
     # 2. Check Database
     supabase = get_supabase()
     if not supabase:
+        raise HTTPException(status_code=503, detail="Service unavailable")
     try:
         # Check if key exists and is active
         res = supabase.table("api_keys").select("*").eq("token", token).execute()
         if not res.data:
+             raise HTTPException(status_code=401, detail="Incorrect API key provided")
         key_data = res.data[0]
             raise HTTPException(status_code=403, detail="API Key is inactive")
         # Check limits
         current_usage = key_data.get("usage_tokens", 0)
         limit = key_data.get("limit_tokens", 0)
         if limit > 0 and current_usage >= limit:
+             raise HTTPException(status_code=429, detail="You have exceeded your current quota")
         return key_data
+    except HTTPException:
+        raise
     except Exception as e:
         print(f"Auth Error: {e}")
+        raise HTTPException(status_code=500, detail="Internal server error")
 # --- Background Task for Usage Update ---
             usage=UsageInfo(**usage)
         )
+    except ValueError as e:
+        # Invalid model or params.
+        # The error helpers build a JSONResponse, so it is returned directly
+        # from the endpoint here instead of raising an HTTPException.
+        return error_model_not_found(request.model) if "model" in str(e) else openai_error(str(e), "invalid_request_error")
     except Exception as e:
+        return error_server(str(e))