mega changes

This commit is contained in:
2025-11-20 11:11:18 +01:00
parent e070c95190
commit 841d79f26b
138 changed files with 21499 additions and 8844 deletions

View File

@@ -12,9 +12,13 @@ from sqlalchemy.ext.asyncio import AsyncSession
from app.db.database import get_db
from app.services.api_key_auth import require_api_key
from app.api.v1.llm import (
get_cached_models, ModelsResponse, ModelInfo,
ChatCompletionRequest, EmbeddingRequest, create_chat_completion as llm_chat_completion,
create_embedding as llm_create_embedding
get_cached_models,
ModelsResponse,
ModelInfo,
ChatCompletionRequest,
EmbeddingRequest,
create_chat_completion as llm_chat_completion,
create_embedding as llm_create_embedding,
)
logger = logging.getLogger(__name__)
@@ -22,8 +26,12 @@ logger = logging.getLogger(__name__)
router = APIRouter()
def openai_error_response(message: str, error_type: str = "invalid_request_error",
status_code: int = 400, code: str = None):
def openai_error_response(
message: str,
error_type: str = "invalid_request_error",
status_code: int = 400,
code: str = None,
):
"""Create OpenAI-compatible error response"""
error_data = {
"error": {
@@ -33,52 +41,42 @@ def openai_error_response(message: str, error_type: str = "invalid_request_error
}
if code:
error_data["error"]["code"] = code
return JSONResponse(
status_code=status_code,
content=error_data
)
return JSONResponse(status_code=status_code, content=error_data)
@router.get("/models", response_model=ModelsResponse)
async def list_models(
    context: Dict[str, Any] = Depends(require_api_key),
    db: AsyncSession = Depends(get_db),
):
    """
    List the currently available models with basic information about each one,
    such as the owner and availability.

    Follows the OpenAI API specification: GET /v1/models

    Args:
        context: Auth context injected by ``require_api_key`` (contains the API key).
        db: Async database session dependency.

    Returns:
        ModelsResponse from the underlying LLM endpoint, or a JSONResponse in
        OpenAI error format when the delegated call fails.
    """
    try:
        # Delegate to the existing LLM models endpoint; imported locally to
        # avoid a circular import between this module and app.api.v1.llm.
        from app.api.v1.llm import list_models as llm_list_models

        return await llm_list_models(context, db)
    except HTTPException as e:
        # Convert FastAPI HTTPException into OpenAI-format error bodies so
        # OpenAI client libraries can parse the failure.
        if e.status_code == 401:
            return openai_error_response(
                "Invalid authentication credentials", "authentication_error", 401
            )
        elif e.status_code == 403:
            return openai_error_response(
                "Insufficient permissions", "permission_error", 403
            )
        else:
            return openai_error_response(str(e.detail), "api_error", e.status_code)
    except Exception as e:
        # Catch-all boundary: never leak internals to the client.
        logger.error(f"Error in OpenAI models endpoint: {e}")
        return openai_error_response("Internal server error", "api_error", 500)
@router.post("/chat/completions")
@@ -86,11 +84,11 @@ async def create_chat_completion(
request_body: Request,
chat_request: ChatCompletionRequest,
context: Dict[str, Any] = Depends(require_api_key),
db: AsyncSession = Depends(get_db)
db: AsyncSession = Depends(get_db),
):
"""
Create chat completion - OpenAI compatible endpoint
This endpoint follows the exact OpenAI API specification:
POST /v1/chat/completions
"""
@@ -102,11 +100,11 @@ async def create_chat_completion(
async def create_embedding(
request: EmbeddingRequest,
context: Dict[str, Any] = Depends(require_api_key),
db: AsyncSession = Depends(get_db)
db: AsyncSession = Depends(get_db),
):
"""
Create embedding - OpenAI compatible endpoint
This endpoint follows the exact OpenAI API specification:
POST /v1/embeddings
"""
@@ -118,44 +116,46 @@ async def create_embedding(
async def retrieve_model(
    model_id: str,
    context: Dict[str, Any] = Depends(require_api_key),
    db: AsyncSession = Depends(get_db),
):
    """
    Retrieve information about a single model.

    Follows the OpenAI API specification: GET /v1/models/{model}

    Args:
        model_id: Identifier of the model to look up.
        context: Auth context injected by ``require_api_key``.
        db: Async database session dependency (injected; not read directly here).

    Returns:
        ModelInfo for the requested model.

    Raises:
        HTTPException: 404 when the model is unknown or not permitted for this
            API key; 500 on any unexpected failure.
    """
    try:
        # Get all models, then narrow down to the requested one.
        models = await get_cached_models()

        # Restrict visibility to the models this API key is allowed to use.
        api_key = context.get("api_key")
        if api_key and api_key.allowed_models:
            models = [
                model for model in models if model.get("id") in api_key.allowed_models
            ]

        # Find the specific model among the (possibly filtered) list.
        model = next((m for m in models if m.get("id") == model_id), None)

        if not model:
            # 404 also covers "exists but not allowed" — avoids leaking
            # which models exist to keys that may not use them.
            raise HTTPException(
                status_code=status.HTTP_404_NOT_FOUND,
                detail=f"Model '{model_id}' not found",
            )

        return ModelInfo(
            id=model.get("id", model_id),
            object="model",
            created=model.get("created", 0),
            owned_by=model.get("owned_by", "system"),
        )
    except HTTPException:
        # Re-raise intentional HTTP errors (e.g. the 404 above) unchanged.
        raise
    except Exception as e:
        logger.error(f"Error retrieving model {model_id}: {e}")
        raise HTTPException(
            status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
            detail="Failed to retrieve model information",
        )