2024-03-08 22:33:56 +01:00
|
|
|
from litellm.proxy.proxy_server import ProxyConfig, initialize
|
|
|
|
from litellm.proxy.proxy_server import app
|
|
|
|
|
2024-03-21 03:28:33 +01:00
|
|
|
from fastapi import FastAPI, Request, Depends, status, Response
|
2024-03-08 22:33:56 +01:00
|
|
|
from fastapi.responses import JSONResponse
|
2024-03-21 03:28:33 +01:00
|
|
|
|
|
|
|
from starlette.middleware.base import BaseHTTPMiddleware, RequestResponseEndpoint
|
|
|
|
from starlette.responses import StreamingResponse
|
|
|
|
import json
|
|
|
|
|
2024-03-08 22:33:56 +01:00
|
|
|
from utils.utils import get_http_authorization_cred, get_current_user
|
|
|
|
from config import ENV
|
|
|
|
|
2024-03-21 03:28:33 +01:00
|
|
|
|
|
|
|
from config import (
|
|
|
|
MODEL_FILTER_ENABLED,
|
|
|
|
MODEL_FILTER_LIST,
|
|
|
|
)
|
|
|
|
|
|
|
|
|
2024-03-08 22:33:56 +01:00
|
|
|
# Module-level ProxyConfig instance; config() calls its load_config() with
# the LiteLLM YAML configuration path.
proxy_config = ProxyConfig()
|
|
|
|
|
|
|
|
|
|
|
|
async def config():
    """Load the LiteLLM proxy configuration, then initialize the proxy.

    The YAML file at ``./data/litellm/config.yaml`` is passed first to
    ``proxy_config.load_config`` and then to ``initialize`` with telemetry
    disabled.
    """
    config_path = "./data/litellm/config.yaml"

    # The three returned values are not used in this function; the call is
    # presumably kept for load_config's own effects -- TODO confirm.
    _router, _model_list, _general_settings = await proxy_config.load_config(
        router=None,
        config_file_path=config_path,
    )

    await initialize(config=config_path, telemetry=False)
|
|
|
|
|
|
|
|
|
|
|
|
async def startup():
    """Run the startup sequence by awaiting ``config()``."""
    await config()
|
|
|
|
|
|
|
|
|
|
|
|
@app.on_event("startup")
async def on_startup():
    """Handler registered for the app's ``startup`` event; awaits ``startup()``."""
    await startup()
|
|
|
|
|
|
|
|
|
2024-03-21 03:28:33 +01:00
|
|
|
# Publish the model-filter toggle on app.state; the /models response
# middleware in this module reads it on each request.
app.state.MODEL_FILTER_ENABLED = MODEL_FILTER_ENABLED
|
|
|
|
# Publish the list of permitted model ids on app.state; the /models response
# middleware keeps only entries whose "id" appears in this list.
app.state.MODEL_FILTER_LIST = MODEL_FILTER_LIST
|
|
|
|
|
|
|
|
|
2024-03-08 22:33:56 +01:00
|
|
|
@app.middleware("http")
async def auth_middleware(request: Request, call_next):
    """Authenticate each request from its ``Authorization`` header.

    ``request.state.user`` is always set: to ``None`` initially, and to the
    resolved user once ``get_current_user`` succeeds. On success the request
    is forwarded to ``call_next`` and its response returned unchanged.

    Returns:
        The downstream response, or a 400 ``JSONResponse`` whose ``detail``
        is the exception text when the user cannot be resolved.
    """
    # Function-scope import keeps this block self-contained.
    import logging

    # Set the attribute up front so later readers never hit AttributeError,
    # even when authentication fails below.
    request.state.user = None
    auth_header = request.headers.get("Authorization", "")

    try:
        user = get_current_user(get_http_authorization_cred(auth_header))
    except Exception as e:
        # Boundary handler: any failure while resolving the credentials is
        # reported to the client instead of propagating as a server error.
        return JSONResponse(status_code=400, content={"detail": str(e)})

    # Debug-level logging instead of print(): the user object should not be
    # written to stdout on every request.
    logging.getLogger(__name__).debug("Authenticated user: %s", user)
    request.state.user = user

    return await call_next(request)
|
2024-03-21 03:28:33 +01:00
|
|
|
|
|
|
|
|
|
|
|
class ModifyModelsResponseMiddleware(BaseHTTPMiddleware):
    """Rewrite JSON responses for request paths containing ``/models``.

    When ``app.state.MODEL_FILTER_ENABLED`` is truthy and the requesting user
    has role ``"user"``, the ``data`` list in the payload is reduced to the
    entries whose ``"id"`` is in ``app.state.MODEL_FILTER_LIST``. Every
    rewritten payload also gets ``"modified": True``.
    """

    async def dispatch(
        self, request: Request, call_next: RequestResponseEndpoint
    ) -> Response:
        """Forward the request and post-process ``/models`` responses.

        Args:
            request: Incoming request; ``request.state.user`` is read for the
                role check.
            call_next: Callable that produces the downstream response.

        Returns:
            The downstream response untouched for other paths or non-streaming
            responses; otherwise a ``JSONResponse`` carrying the (possibly
            filtered) payload and the downstream status code.

        Raises:
            Whatever ``json.loads`` / ``bytes.decode`` raise when the
            downstream body is not UTF-8 encoded JSON.
        """
        response = await call_next(request)

        # Guard clause: only streaming responses on /models paths are rewritten.
        if "/models" not in request.url.path or not isinstance(
            response, StreamingResponse
        ):
            return response

        user = request.state.user

        # Drain the stream once; join at the end rather than repeated `+=`.
        chunks = [chunk async for chunk in response.body_iterator]
        data = json.loads(b"".join(chunks).decode("utf-8"))

        should_filter = (
            app.state.MODEL_FILTER_ENABLED and user and user.role == "user"
        )
        # Payloads without a "data" key (e.g. an upstream error body) are
        # passed through instead of raising KeyError.
        if should_filter and isinstance(data, dict) and "data" in data:
            allowed_ids = app.state.MODEL_FILTER_LIST
            data["data"] = [
                model for model in data["data"] if model["id"] in allowed_ids
            ]

        # Modified Flag
        data["modified"] = True

        # Keep the downstream status code so that upstream errors are not
        # turned into 200 responses by the rewrite.
        return JSONResponse(content=data, status_code=response.status_code)
|
|
|
|
|
|
|
|
|
|
|
|
# Register the /models response post-processing middleware on the proxy app.
app.add_middleware(ModifyModelsResponseMiddleware)
|