open-webui/backend/apps/litellm/main.py

import sys

from fastapi import FastAPI, Depends, HTTPException
from fastapi.routing import APIRoute
from fastapi.middleware.cors import CORSMiddleware

import logging
from fastapi import FastAPI, Request, Depends, status, Response
from fastapi.responses import JSONResponse

from starlette.middleware.base import BaseHTTPMiddleware, RequestResponseEndpoint
from starlette.responses import StreamingResponse
import json
import time
import requests

from pydantic import BaseModel, ConfigDict
from typing import Optional, List

from utils.utils import get_verified_user, get_current_user, get_admin_user
from config import SRC_LOG_LEVELS, ENV
from constants import MESSAGES

import os

log = logging.getLogger(__name__)
log.setLevel(SRC_LOG_LEVELS["LITELLM"])


from config import (
    ENABLE_LITELLM,
    ENABLE_MODEL_FILTER,
    MODEL_FILTER_LIST,
    DATA_DIR,
    LITELLM_PROXY_PORT,
    LITELLM_PROXY_HOST,
)

from litellm.utils import get_llm_provider

import asyncio
import subprocess
import yaml

# FastAPI application object that all routes in this module are registered on.
app = FastAPI()

# CORS is left fully open: every origin, method and header is accepted.
origins = ["*"]

app.add_middleware(
    CORSMiddleware,
    allow_origins=origins,
    allow_credentials=True,
    allow_methods=["*"],
    allow_headers=["*"],
)


# NOTE: despite the "_DIR" suffix this is the path of the config *file*.
LITELLM_CONFIG_DIR = f"{DATA_DIR}/litellm/config.yaml"

# The config is loaded once, at import time; a missing file raises right here.
with open(LITELLM_CONFIG_DIR, "r") as file:
    litellm_config = yaml.safe_load(file)


# Runtime state: the feature switch and the in-memory copy of config.yaml.
app.state.ENABLE = ENABLE_LITELLM
app.state.CONFIG = litellm_config

# Global variable to store the subprocess reference
background_process = None

# Environment variables removed from the child's environment when the
# subprocess is launched (see run_background_process).
CONFLICT_ENV_VARS = [
    # Uvicorn uses PORT, so LiteLLM might use it as well
    "PORT",
    # LiteLLM uses DATABASE_URL for Prisma connections
    "DATABASE_URL",
]


async def _log_subprocess_stream(stream, prefix=""):
    """Log each non-blank line read from *stream* until it reaches EOF."""
    async for raw_line in stream:
        # errors="replace": undecodable child output must not kill the logger.
        text = raw_line.decode(errors="replace").strip()
        if text:
            log.info(f"{prefix}{text}")


async def run_background_process(command):
    """Spawn *command* as a subprocess and relay its output to the log.

    The created process is stored in the module-level ``background_process``
    so other coroutines can terminate it. The coroutine only returns once the
    child has exited.

    Args:
        command: Argument vector (program followed by its arguments). It is
            passed to ``asyncio.create_subprocess_exec`` and therefore never
            interpreted by a shell.

    Raises:
        Exception: Any error raised while spawning or monitoring the child is
            logged and re-raised.
    """
    global background_process
    log.info("run_background_process")

    try:
        # Log the command to be executed
        log.info(f"Executing command: {command}")
        # Filter environment variables known to conflict with litellm
        env = {k: v for k, v in os.environ.items() if k not in CONFLICT_ENV_VARS}
        # Execute the command and create a subprocess
        process = await asyncio.create_subprocess_exec(
            *command, stdout=subprocess.PIPE, stderr=subprocess.PIPE, env=env
        )
        background_process = process
        log.info("Subprocess started successfully.")

        # Drain both pipes concurrently. Reading stderr to EOF before touching
        # stdout (the previous behaviour) delayed all stdout logging until the
        # child exited and could stall the child once its stdout pipe filled.
        await asyncio.gather(
            _log_subprocess_stream(process.stderr, "Subprocess STDERR: "),
            _log_subprocess_stream(process.stdout),
        )

        # Wait for the process to finish
        returncode = await process.wait()
        log.info(f"Subprocess exited with return code {returncode}")
    except Exception as e:
        log.error(f"Failed to start subprocess: {e}")
        raise  # Propagate so the awaiting task records the failure


async def start_litellm_background():
    """Assemble the ``litellm`` CLI invocation and run it as the background process.

    The argument vector is built from the configured proxy port, host and
    config-file path, then handed to ``run_background_process``; this coroutine
    therefore completes only when that call returns.
    """
    log.info("start_litellm_background")

    # Flag -> value pairs, in the order they must appear on the command line.
    cli_options = {
        "--port": str(LITELLM_PROXY_PORT),
        "--host": LITELLM_PROXY_HOST,
        "--telemetry": "False",
        "--config": LITELLM_CONFIG_DIR,
    }

    command = ["litellm"]
    for flag, value in cli_options.items():
        command += [flag, value]

    await run_background_process(command)


async def shutdown_litellm_background():
    """Terminate the tracked subprocess, if any, and clear the global reference.

    Safe to call when no subprocess was started or when the child has already
    exited on its own: in both cases the function just leaves
    ``background_process`` set to ``None``.
    """
    global background_process
    log.info("shutdown_litellm_background")

    process = background_process
    if not process:
        return

    try:
        # Only signal a child that is still running; terminate() on a process
        # whose transport is already closed raises ProcessLookupError.
        if process.returncode is None:
            try:
                process.terminate()
            except ProcessLookupError:
                log.info("Subprocess had already exited")
        await process.wait()  # Ensure the process has terminated
        log.info("Subprocess terminated")
    finally:
        # Always drop the reference, otherwise one failed shutdown would make
        # every later restart attempt fail on the same dead process.
        background_process = None


@app.on_event("startup")
async def startup_event():
    """Schedule the litellm launcher as a background task when the app starts.

    The task is not awaited, so startup does not wait for the subprocess.
    """
    log.info("startup_event")
    # TODO: Check config.yaml file and create one
    launcher = start_litellm_background()
    asyncio.create_task(launcher)


# Model-filter settings copied from config onto the app state; get_models()
# reads them to restrict the list returned to accounts whose role is "user".
app.state.ENABLE_MODEL_FILTER = ENABLE_MODEL_FILTER
app.state.MODEL_FILTER_LIST = MODEL_FILTER_LIST


@app.get("/")
async def get_status():
    """Report that this sub-application is up; the payload is constant."""
    return dict(status=True)


async def restart_litellm():
    """
    Stop the running litellm subprocess (if any) and schedule a new one.

    The new subprocess is started through a background task that is not
    awaited, so a successful return means the restart was scheduled, not that
    the proxy is already serving.

    Returns a small status dict on success; any exception raised along the way
    is logged and converted into an HTTP 500 carrying the exception text.
    """
    log.info("Requested restart of litellm service.")
    try:
        # Bring the current process down first (no-op when none is tracked).
        await shutdown_litellm_background()
        log.info("litellm service shutdown complete.")

        # Fire-and-forget launch of the replacement process.
        asyncio.create_task(start_litellm_background())
        log.info("litellm service restart complete.")
    except Exception as err:
        log.info(f"Error restarting litellm service: {err}")
        raise HTTPException(
            status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, detail=str(err)
        )
    else:
        return {
            "status": "success",
            "message": "litellm service restarted successfully.",
        }


@app.get("/restart")
async def restart_litellm_handler(user=Depends(get_admin_user)):
    """Route wrapper around ``restart_litellm``, gated by the ``get_admin_user`` dependency."""
    outcome = await restart_litellm()
    return outcome


@app.get("/config")
async def get_config(user=Depends(get_admin_user)):
    """Return the in-memory LiteLLM config held on the app state.

    Access is gated by the ``get_admin_user`` dependency.
    """
    current_config = app.state.CONFIG
    return current_config


class LiteLLMConfigForm(BaseModel):
    """Request body for ``/config/update``: the top-level config sections.

    Every section is optional; ``update_config`` dumps the form with
    ``exclude_none=True``, so sections left as ``None`` are omitted from the
    stored config.
    """

    general_settings: Optional[dict] = None
    litellm_settings: Optional[dict] = None
    # Each entry is a dict; other handlers in this module read its "model_name" key.
    model_list: Optional[List[dict]] = None
    router_settings: Optional[dict] = None

    # Empty protected namespaces: presumably so the "model_"-prefixed field
    # above does not clash with pydantic's protected namespace -- confirm.
    model_config = ConfigDict(protected_namespaces=())


@app.post("/config/update")
async def update_config(form_data: LiteLLMConfigForm, user=Depends(get_admin_user)):
    """Replace the whole LiteLLM config, persist it, and restart the proxy.

    The submitted form (minus ``None`` sections) becomes the new in-memory
    config, is written to the config file as YAML, and the litellm subprocess
    is restarted. The config held on the app state is returned.
    """
    new_config = form_data.model_dump(exclude_none=True)
    app.state.CONFIG = new_config

    with open(LITELLM_CONFIG_DIR, "w") as config_file:
        yaml.dump(new_config, config_file)

    await restart_litellm()
    return app.state.CONFIG


@app.get("/models")
@app.get("/v1/models")
async def get_models(user=Depends(get_current_user)):
    """Return the model list in OpenAI ``/v1/models`` shape.

    When LiteLLM is disabled an empty list is returned. Otherwise the list is
    fetched from the local LiteLLM proxy; if that request fails for any reason
    the list is synthesised from the ``model_list`` section of the in-memory
    config instead.

    When model filtering is enabled and the caller's role is ``"user"``, only
    models whose id appears in ``MODEL_FILTER_LIST`` are returned. This applies
    to the fallback list as well, so a proxy outage cannot expose filtered
    models.
    """
    if not app.state.ENABLE:
        return {
            "data": [],
            "object": "list",
        }

    # NOTE(review): this wait is unbounded; if the subprocess never starts the
    # request hangs. Left as-is pending a decision on a suitable timeout.
    while not background_process:
        await asyncio.sleep(0.1)

    filter_active = bool(
        app.state.ENABLE_MODEL_FILTER and user and user.role == "user"
    )

    def visible(models):
        """Apply the per-user model filter when it is active."""
        if not filter_active:
            return models
        return [m for m in models if m["id"] in app.state.MODEL_FILTER_LIST]

    url = f"http://localhost:{LITELLM_PROXY_PORT}/v1"
    try:
        # requests is synchronous: run it in the default executor so the
        # event loop keeps serving other requests while we wait.
        loop = asyncio.get_running_loop()
        r = await loop.run_in_executor(
            None, lambda: requests.request(method="GET", url=f"{url}/models")
        )
        r.raise_for_status()

        data = r.json()
        if filter_active:
            data["data"] = visible(data["data"])
        return data
    except Exception as e:
        log.exception(e)

        # Fall back to what the config declares; tolerate an empty config or
        # one that has no "model_list" section.
        config = app.state.CONFIG or {}
        fallback = [
            {
                "id": model["model_name"],
                "object": "model",
                "created": int(time.time()),
                "owned_by": "openai",
            }
            for model in config.get("model_list") or []
        ]
        return {
            "data": visible(fallback),
            "object": "list",
        }


@app.get("/model/info")
async def get_model_list(user=Depends(get_admin_user)):
    """Return the ``model_list`` section of the in-memory LiteLLM config.

    An empty list is returned when the config is empty or has no
    ``model_list`` section (possible after ``/config/update`` stored a config
    without one), instead of failing with a server error.
    """
    config = app.state.CONFIG or {}
    return {"data": config.get("model_list") or []}


class AddLiteLLMModelForm(BaseModel):
    """Request body for ``/model/new``; dumped as-is into the config's ``model_list``."""

    # Name passed to get_llm_provider() for validation by add_model_to_config.
    model_name: str
    # Free-form dict stored alongside the name; not inspected in this module.
    litellm_params: dict

    # Empty protected namespaces: presumably so the "model_"-prefixed field
    # above does not clash with pydantic's protected namespace -- confirm.
    model_config = ConfigDict(protected_namespaces=())


@app.post("/model/new")
async def add_model_to_config(
    form_data: AddLiteLLMModelForm, user=Depends(get_admin_user)
):
    """Append a model entry to the LiteLLM config, persist it and restart the proxy.

    The model name is first checked with ``get_llm_provider``. The updated
    config is written to disk before the in-memory copy is replaced, so a
    failed write leaves the running state untouched.

    Raises:
        HTTPException: 500 with the error text if validation, the file write
            or the restart fails.
    """
    try:
        get_llm_provider(model=form_data.model_name)

        # Tolerate an empty config or one without a "model_list" section.
        config = app.state.CONFIG or {}
        updated_config = {
            **config,
            "model_list": [*(config.get("model_list") or []), form_data.model_dump()],
        }

        with open(LITELLM_CONFIG_DIR, "w") as file:
            yaml.dump(updated_config, file)

        # Commit to memory only after the file write succeeded.
        app.state.CONFIG = updated_config

        await restart_litellm()

        return {"message": MESSAGES.MODEL_ADDED(form_data.model_name)}
    except HTTPException:
        # Already a well-formed HTTP error (e.g. from restart_litellm).
        raise
    except Exception as e:
        log.exception(e)
        raise HTTPException(
            status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, detail=str(e)
        )


class DeleteLiteLLMModelForm(BaseModel):
    """Request body for ``/model/delete``."""

    # Compared against each configured entry's "model_name" by
    # delete_model_from_config.
    id: str


@app.post("/model/delete")
async def delete_model_from_config(
    form_data: DeleteLiteLLMModelForm, user=Depends(get_admin_user)
):
    """Remove every config entry whose ``model_name`` equals ``form_data.id``.

    The updated config is written to disk before the in-memory copy is
    replaced, then the litellm subprocess is restarted. Deleting a name that
    is not configured is not an error, and an empty config or one without a
    ``model_list`` section is treated as having no models.
    """
    config = app.state.CONFIG or {}
    remaining_models = [
        model
        for model in config.get("model_list") or []
        if model.get("model_name") != form_data.id
    ]
    updated_config = {**config, "model_list": remaining_models}

    with open(LITELLM_CONFIG_DIR, "w") as file:
        yaml.dump(updated_config, file)

    # Commit to memory only after the file write succeeded.
    app.state.CONFIG = updated_config

    await restart_litellm()

    return {"message": MESSAGES.MODEL_DELETED(form_data.id)}


@app.api_route("/{path:path}", methods=["GET", "POST", "PUT", "DELETE"])
async def proxy(path: str, request: Request, user=Depends(get_verified_user)):
    """Forward any other request to the local LiteLLM proxy.

    The request body is relayed unchanged with a JSON content type. A
    ``text/event-stream`` reply is streamed back in chunks; any other reply is
    parsed as JSON and returned.

    Raises:
        HTTPException: With the upstream status code (500 when the proxy could
            not be reached at all) and a detail taken from the upstream
            ``error`` payload when one is available.
    """
    body = await request.body()
    method = request.method

    url = f"http://localhost:{LITELLM_PROXY_PORT}"

    target_url = f"{url}/{path}"

    headers = {}
    # headers["Authorization"] = f"Bearer {key}"
    headers["Content-Type"] = "application/json"

    loop = asyncio.get_running_loop()
    r = None

    try:
        # requests is synchronous: run it in the default executor so a slow
        # upstream call does not stall the event loop for every other client.
        r = await loop.run_in_executor(
            None,
            lambda: requests.request(
                method=method,
                url=target_url,
                data=body,
                headers=headers,
                stream=True,
            ),
        )

        r.raise_for_status()

        # Check if response is SSE
        if "text/event-stream" in r.headers.get("Content-Type", ""):
            return StreamingResponse(
                r.iter_content(chunk_size=8192),
                status_code=r.status_code,
                headers=dict(r.headers),
            )

        # With stream=True the body is only read here, so keep it off the loop.
        return await loop.run_in_executor(None, r.json)
    except Exception as e:
        log.exception(e)
        error_detail = "Open WebUI: Server Connection Error"
        if r is not None:
            try:
                res = r.json()
                if "error" in res:
                    upstream_error = res["error"]
                    # The error may be a dict with a "message" or a bare value.
                    if isinstance(upstream_error, dict) and "message" in upstream_error:
                        upstream_error = upstream_error["message"]
                    error_detail = f"External: {upstream_error}"
            except Exception:
                error_detail = f"External: {e}"

        # Compare against None explicitly: a requests.Response is falsy for
        # 4xx/5xx, so a plain truth test would turn every upstream error
        # status into a 500.
        raise HTTPException(
            status_code=r.status_code if r is not None else 500,
            detail=error_detail,
        )
fix: harden litellm exec command to prevent unintended commands logic was previously to split on space for arguments, but if any of the user controlled variables LITELLM_PROXY_HOST or DATA_DIR had spaces in them, this would not behave correctly. 2024-04-23 20:25:43 +02:00			`import sys`

DO NOT TRACK ME >:( 2024-04-21 08:13:24 +02:00			`from fastapi import FastAPI, Depends, HTTPException`
fix: run litellm as subprocess 2024-04-21 07:52:27 +02:00			`from fastapi.routing import APIRoute`
			`from fastapi.middleware.cors import CORSMiddleware`
refac: litellm 2024-03-08 22:33:56 +01:00
fix: run litellm as subprocess 2024-04-21 07:52:27 +02:00			`import logging`
feat: litellm model filter support 2024-03-21 03:28:33 +01:00			`from fastapi import FastAPI, Request, Depends, status, Response`
refac: litellm 2024-03-08 22:33:56 +01:00			`from fastapi.responses import JSONResponse`
feat: litellm model filter support 2024-03-21 03:28:33 +01:00
			`from starlette.middleware.base import BaseHTTPMiddleware, RequestResponseEndpoint`
			`from starlette.responses import StreamingResponse`
			`import json`
refac: improved error handling 2024-04-22 00:37:59 +02:00			`import time`
DO NOT TRACK ME >:( 2024-04-21 08:13:24 +02:00			`import requests`
feat: litellm model filter support 2024-03-21 03:28:33 +01:00
refac: litellm model name validation 2024-04-22 01:25:53 +02:00			`from pydantic import BaseModel, ConfigDict`
feat: litellm config update 2024-04-21 23:10:01 +02:00			`from typing import Optional, List`

feat: restart subprocess route 2024-04-21 08:51:38 +02:00			`from utils.utils import get_verified_user, get_current_user, get_admin_user`
Migrate to python logging module with env var control. 2024-03-21 00:11:36 +01:00			`from config import SRC_LOG_LEVELS, ENV`
refac: improved error handling 2024-04-22 00:37:59 +02:00			`from constants import MESSAGES`
Migrate to python logging module with env var control. 2024-03-21 00:11:36 +01:00
feat: add support for using postgres for the backend DB 2024-04-24 19:10:18 +02:00			`import os`

Migrate to python logging module with env var control. 2024-03-21 00:11:36 +01:00			`log = logging.getLogger(__name__)`
			`log.setLevel(SRC_LOG_LEVELS["LITELLM"])`
refac: litellm 2024-03-08 22:33:56 +01:00
feat: litellm model filter support 2024-03-21 03:28:33 +01:00
feat: add LITELLM_PROXY_PORT to configure internal proxy port 2024-04-23 20:14:01 +02:00			`from config import (`
fix 2024-04-28 03:17:19 +02:00			`ENABLE_LITELLM,`
refac: naming convention MODEL_FILTER_ENABLED -> ENABLE_MODEL_FILTER 2024-04-26 23:17:18 +02:00			`ENABLE_MODEL_FILTER,`
feat: add LITELLM_PROXY_PORT to configure internal proxy port 2024-04-23 20:14:01 +02:00			`MODEL_FILTER_LIST,`
			`DATA_DIR,`
			`LITELLM_PROXY_PORT,`
feat: add LITELLM_PROXY_HOST to configure address litellm listens on 2024-04-23 20:19:16 +02:00			`LITELLM_PROXY_HOST,`
feat: add LITELLM_PROXY_PORT to configure internal proxy port 2024-04-23 20:14:01 +02:00			`)`
feat: litellm model filter support 2024-03-21 03:28:33 +01:00
refac: litellm model name validation 2024-04-22 01:25:53 +02:00			`from litellm.utils import get_llm_provider`
feat: litellm model filter support 2024-03-21 03:28:33 +01:00
fix: run litellm as subprocess 2024-04-21 07:52:27 +02:00			`import asyncio`
			`import subprocess`
feat: litellm config update 2024-04-21 23:10:01 +02:00			`import yaml`
refac: litellm 2024-03-08 22:33:56 +01:00
fix: run litellm as subprocess 2024-04-21 07:52:27 +02:00			`app = FastAPI()`
refac: litellm 2024-03-08 22:33:56 +01:00
fix: run litellm as subprocess 2024-04-21 07:52:27 +02:00			`origins = ["*"]`
refac: litellm 2024-03-08 22:33:56 +01:00
fix: run litellm as subprocess 2024-04-21 07:52:27 +02:00			`app.add_middleware(`
			`CORSMiddleware,`
			`allow_origins=origins,`
			`allow_credentials=True,`
			`allow_methods=["*"],`
			`allow_headers=["*"],`
			`)`
refac: litellm 2024-03-08 22:33:56 +01:00
fix: run litellm as subprocess 2024-04-21 07:52:27 +02:00
feat: litellm config update 2024-04-21 23:10:01 +02:00			`LITELLM_CONFIG_DIR = f"{DATA_DIR}/litellm/config.yaml"`

			`with open(LITELLM_CONFIG_DIR, "r") as file:`
			`litellm_config = yaml.safe_load(file)`

fix 2024-04-28 03:17:19 +02:00
			`app.state.ENABLE = ENABLE_LITELLM`
feat: litellm config update 2024-04-21 23:10:01 +02:00			`app.state.CONFIG = litellm_config`

refac: close subprocess gracefully 2024-04-21 08:46:09 +02:00			`# Global variable to store the subprocess reference`
			`background_process = None`

feat: add support for using postgres for the backend DB 2024-04-24 19:10:18 +02:00			`CONFLICT_ENV_VARS = [`
			`# Uvicorn uses PORT, so LiteLLM might use it as well`
			`"PORT",`
			`# LiteLLM uses DATABASE_URL for Prisma connections`
			`"DATABASE_URL",`
			`]`

pwned :) 2024-04-21 08:22:02 +02:00
refac: close subprocess gracefully 2024-04-21 08:46:09 +02:00			`async def run_background_process(command):`
			`global background_process`
feat: litellm config update 2024-04-21 23:10:01 +02:00			`log.info("run_background_process")`
refac: close subprocess gracefully 2024-04-21 08:46:09 +02:00
			`try:`
			`# Log the command to be executed`
feat: litellm config update 2024-04-21 23:10:01 +02:00			`log.info(f"Executing command: {command}")`
feat: add support for using postgres for the backend DB 2024-04-24 19:10:18 +02:00			`# Filter environment variables known to conflict with litellm`
			`env = {k: v for k, v in os.environ.items() if k not in CONFLICT_ENV_VARS}`
refac: close subprocess gracefully 2024-04-21 08:46:09 +02:00			`# Execute the command and create a subprocess`
			`process = await asyncio.create_subprocess_exec(`
feat: add support for using postgres for the backend DB 2024-04-24 19:10:18 +02:00			`*command, stdout=subprocess.PIPE, stderr=subprocess.PIPE, env=env`
refac: close subprocess gracefully 2024-04-21 08:46:09 +02:00			`)`
			`background_process = process`
feat: litellm config update 2024-04-21 23:10:01 +02:00			`log.info("Subprocess started successfully.")`
refac: close subprocess gracefully 2024-04-21 08:46:09 +02:00
			`# Capture STDERR for debugging purposes`
			`stderr_output = await process.stderr.read()`
			`stderr_text = stderr_output.decode().strip()`
			`if stderr_text:`
feat: litellm config update 2024-04-21 23:10:01 +02:00			`log.info(f"Subprocess STDERR: {stderr_text}")`
refac: close subprocess gracefully 2024-04-21 08:46:09 +02:00
feat: litellm config update 2024-04-21 23:10:01 +02:00			`# log.info output line by line`
refac: close subprocess gracefully 2024-04-21 08:46:09 +02:00			`async for line in process.stdout:`
feat: litellm config update 2024-04-21 23:10:01 +02:00			`log.info(line.decode().strip())`
refac: close subprocess gracefully 2024-04-21 08:46:09 +02:00
			`# Wait for the process to finish`
			`returncode = await process.wait()`
feat: litellm config update 2024-04-21 23:10:01 +02:00			`log.info(f"Subprocess exited with return code {returncode}")`
refac: close subprocess gracefully 2024-04-21 08:46:09 +02:00			`except Exception as e:`
			`log.error(f"Failed to start subprocess: {e}")`
			`raise # Optionally re-raise the exception if you want it to propagate`
fix: run litellm as subprocess 2024-04-21 07:52:27 +02:00

			`async def start_litellm_background():`
feat: litellm config update 2024-04-21 23:10:01 +02:00			`log.info("start_litellm_background")`
fix: run litellm as subprocess 2024-04-21 07:52:27 +02:00			`# Command to run in the background`
fix: harden litellm exec command to prevent unintended commands logic was previously to split on space for arguments, but if any of the user controlled variables LITELLM_PROXY_HOST or DATA_DIR had spaces in them, this would not behave correctly. 2024-04-23 20:25:43 +02:00			`command = [`
			`"litellm",`
			`"--port",`
			`str(LITELLM_PROXY_PORT),`
			`"--host",`
			`LITELLM_PROXY_HOST,`
			`"--telemetry",`
			`"False",`
			`"--config",`
			`LITELLM_CONFIG_DIR,`
			`]`
pwned :) 2024-04-21 08:22:02 +02:00
fix: run litellm as subprocess 2024-04-21 07:52:27 +02:00			`await run_background_process(command)`
refac: litellm 2024-03-08 22:33:56 +01:00

refac: close subprocess gracefully 2024-04-21 08:46:09 +02:00			`async def shutdown_litellm_background():`
feat: litellm config update 2024-04-21 23:10:01 +02:00			`log.info("shutdown_litellm_background")`
refac: close subprocess gracefully 2024-04-21 08:46:09 +02:00			`global background_process`
			`if background_process:`
			`background_process.terminate()`
			`await background_process.wait() # Ensure the process has terminated`
feat: litellm config update 2024-04-21 23:10:01 +02:00			`log.info("Subprocess terminated")`
feat: litellm model add/delete 2024-04-22 00:26:22 +02:00			`background_process = None`
refac: close subprocess gracefully 2024-04-21 08:46:09 +02:00

refac: litellm 2024-03-08 22:33:56 +01:00			`@app.on_event("startup")`
fix: run litellm as subprocess 2024-04-21 07:52:27 +02:00			`async def startup_event():`
feat: litellm config update 2024-04-21 23:10:01 +02:00			`log.info("startup_event")`
DO NOT TRACK ME >:( 2024-04-21 08:13:24 +02:00			`# TODO: Check config.yaml file and create one`
fix: run litellm as subprocess 2024-04-21 07:52:27 +02:00			`asyncio.create_task(start_litellm_background())`
refac: litellm 2024-03-08 22:33:56 +01:00

refac: naming convention MODEL_FILTER_ENABLED -> ENABLE_MODEL_FILTER 2024-04-26 23:17:18 +02:00			`app.state.ENABLE_MODEL_FILTER = ENABLE_MODEL_FILTER`
feat: litellm model filter support 2024-03-21 03:28:33 +01:00			`app.state.MODEL_FILTER_LIST = MODEL_FILTER_LIST`


fix: run litellm as subprocess 2024-04-21 07:52:27 +02:00			`@app.get("/")`
			`async def get_status():`
			`return {"status": True}`


feat: litellm config update 2024-04-21 23:10:01 +02:00			`async def restart_litellm():`
feat: restart subprocess route 2024-04-21 08:51:38 +02:00			`"""`
			`Endpoint to restart the litellm background service.`
			`"""`
			`log.info("Requested restart of litellm service.")`
			`try:`
			`# Shut down the existing process if it is running`
			`await shutdown_litellm_background()`
			`log.info("litellm service shutdown complete.")`

			`# Restart the background service`
feat: litellm config update 2024-04-21 23:10:01 +02:00
			`asyncio.create_task(start_litellm_background())`
feat: restart subprocess route 2024-04-21 08:51:38 +02:00			`log.info("litellm service restart complete.")`

			`return {`
			`"status": "success",`
			`"message": "litellm service restarted successfully.",`
			`}`
			`except Exception as e:`
feat: litellm config update 2024-04-21 23:10:01 +02:00			`log.info(f"Error restarting litellm service: {e}")`
feat: restart subprocess route 2024-04-21 08:51:38 +02:00			`raise HTTPException(`
			`status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, detail=str(e)`
			`)`


feat: litellm config update 2024-04-21 23:10:01 +02:00			`@app.get("/restart")`
			`async def restart_litellm_handler(user=Depends(get_admin_user)):`
			`return await restart_litellm()`


			`@app.get("/config")`
			`async def get_config(user=Depends(get_admin_user)):`
			`return app.state.CONFIG`


			`class LiteLLMConfigForm(BaseModel):`
			`general_settings: Optional[dict] = None`
			`litellm_settings: Optional[dict] = None`
			`model_list: Optional[List[dict]] = None`
			`router_settings: Optional[dict] = None`

refac: litellm model name validation 2024-04-22 01:25:53 +02:00			`model_config = ConfigDict(protected_namespaces=())`

feat: litellm config update 2024-04-21 23:10:01 +02:00
			`@app.post("/config/update")`
			`async def update_config(form_data: LiteLLMConfigForm, user=Depends(get_admin_user)):`
			`app.state.CONFIG = form_data.model_dump(exclude_none=True)`

			`with open(LITELLM_CONFIG_DIR, "w") as file:`
			`yaml.dump(app.state.CONFIG, file)`

			`await restart_litellm()`
			`return app.state.CONFIG`


DO NOT TRACK ME >:( 2024-04-21 08:13:24 +02:00			`@app.get("/models")`
			`@app.get("/v1/models")`
			`async def get_models(user=Depends(get_current_user)):`
fix: run litellm as subprocess 2024-04-21 07:52:27 +02:00
fix 2024-04-28 03:17:19 +02:00			`if app.state.ENABLE:`
			`while not background_process:`
			`await asyncio.sleep(0.1)`

			`url = f"http://localhost:{LITELLM_PROXY_PORT}/v1"`
			`r = None`
			`try:`
			`r = requests.request(method="GET", url=f"{url}/models")`
			`r.raise_for_status()`

			`data = r.json()`

			`if app.state.ENABLE_MODEL_FILTER:`
			`if user and user.role == "user":`
			`data["data"] = list(`
			`filter(`
			`lambda model: model["id"] in app.state.MODEL_FILTER_LIST,`
			`data["data"],`
			`)`
DO NOT TRACK ME >:( 2024-04-21 08:13:24 +02:00			`)`
fix: run litellm as subprocess 2024-04-21 07:52:27 +02:00
fix 2024-04-28 03:17:19 +02:00			`return data`
			`except Exception as e:`

			`log.exception(e)`
			`error_detail = "Open WebUI: Server Connection Error"`
			`if r is not None:`
			`try:`
			`res = r.json()`
			`if "error" in res:`
			`error_detail = f"External: {res['error']}"`
			`except:`
			`error_detail = f"External: {e}"`

			`return {`
			`"data": [`
			`{`
			`"id": model["model_name"],`
			`"object": "model",`
			`"created": int(time.time()),`
			`"owned_by": "openai",`
			`}`
			`for model in app.state.CONFIG["model_list"]`
			`],`
			`"object": "list",`
			`}`
			`else:`
refac: improved error handling 2024-04-22 00:37:59 +02:00			`return {`
fix 2024-04-28 03:17:19 +02:00			`"data": [],`
refac: improved error handling 2024-04-22 00:37:59 +02:00			`"object": "list",`
			`}`
fix: run litellm as subprocess 2024-04-21 07:52:27 +02:00

feat: litellm model add/delete 2024-04-22 00:26:22 +02:00			`@app.get("/model/info")`
			`async def get_model_list(user=Depends(get_admin_user)):`
			`return {"data": app.state.CONFIG["model_list"]}`


			`class AddLiteLLMModelForm(BaseModel):`
			`model_name: str`
			`litellm_params: dict`

refac: litellm model name validation 2024-04-22 01:25:53 +02:00			`model_config = ConfigDict(protected_namespaces=())`

feat: litellm model add/delete 2024-04-22 00:26:22 +02:00
			`@app.post("/model/new")`
			`async def add_model_to_config(`
			`form_data: AddLiteLLMModelForm, user=Depends(get_admin_user)`
			`):`
refac: litellm model name validation 2024-04-22 01:25:53 +02:00			`try:`
			`get_llm_provider(model=form_data.model_name)`
			`app.state.CONFIG["model_list"].append(form_data.model_dump())`
refac: improved error handling 2024-04-22 00:37:59 +02:00
refac: litellm model name validation 2024-04-22 01:25:53 +02:00			`with open(LITELLM_CONFIG_DIR, "w") as file:`
			`yaml.dump(app.state.CONFIG, file)`
feat: litellm model add/delete 2024-04-22 00:26:22 +02:00
refac: litellm model name validation 2024-04-22 01:25:53 +02:00			`await restart_litellm()`
feat: litellm model add/delete 2024-04-22 00:26:22 +02:00
refac: litellm model name validation 2024-04-22 01:25:53 +02:00			`return {"message": MESSAGES.MODEL_ADDED(form_data.model_name)}`
			`except Exception as e:`
			`print(e)`
			`raise HTTPException(`
			`status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, detail=str(e)`
			`)`
feat: litellm model add/delete 2024-04-22 00:26:22 +02:00

			`class DeleteLiteLLMModelForm(BaseModel):`
			`id: str`


			`@app.post("/model/delete")`
			`async def delete_model_from_config(`
			`form_data: DeleteLiteLLMModelForm, user=Depends(get_admin_user)`
			`):`
			`app.state.CONFIG["model_list"] = [`
			`model`
			`for model in app.state.CONFIG["model_list"]`
			`if model["model_name"] != form_data.id`
			`]`

			`with open(LITELLM_CONFIG_DIR, "w") as file:`
			`yaml.dump(app.state.CONFIG, file)`

			`await restart_litellm()`

refac: improved error handling 2024-04-22 00:37:59 +02:00			`return {"message": MESSAGES.MODEL_DELETED(form_data.id)}`
feat: litellm model add/delete 2024-04-22 00:26:22 +02:00

DO NOT TRACK ME >:( 2024-04-21 08:13:24 +02:00			`@app.api_route("/{path:path}", methods=["GET", "POST", "PUT", "DELETE"])`
			`async def proxy(path: str, request: Request, user=Depends(get_verified_user)):`
			`body = await request.body()`
fix: run litellm as subprocess 2024-04-21 07:52:27 +02:00
feat: add LITELLM_PROXY_PORT to configure internal proxy port 2024-04-23 20:14:01 +02:00			`url = f"http://localhost:{LITELLM_PROXY_PORT}"`
fix: run litellm as subprocess 2024-04-21 07:52:27 +02:00
DO NOT TRACK ME >:( 2024-04-21 08:13:24 +02:00			`target_url = f"{url}/{path}"`
fix: run litellm as subprocess 2024-04-21 07:52:27 +02:00
DO NOT TRACK ME >:( 2024-04-21 08:13:24 +02:00			`headers = {}`
			`# headers["Authorization"] = f"Bearer {key}"`
			`headers["Content-Type"] = "application/json"`
fix: run litellm as subprocess 2024-04-21 07:52:27 +02:00
DO NOT TRACK ME >:( 2024-04-21 08:13:24 +02:00			`r = None`
fix: run litellm as subprocess 2024-04-21 07:52:27 +02:00
DO NOT TRACK ME >:( 2024-04-21 08:13:24 +02:00			`try:`
			`r = requests.request(`
			`method=request.method,`
			`url=target_url,`
			`data=body,`
			`headers=headers,`
			`stream=True,`
			`)`

			`r.raise_for_status()`

			`# Check if response is SSE`
			`if "text/event-stream" in r.headers.get("Content-Type", ""):`
			`return StreamingResponse(`
			`r.iter_content(chunk_size=8192),`
			`status_code=r.status_code,`
			`headers=dict(r.headers),`
			`)`
			`else:`
			`response_data = r.json()`
			`return response_data`
			`except Exception as e:`
			`log.exception(e)`
			`error_detail = "Open WebUI: Server Connection Error"`
			`if r is not None:`
			`try:`
			`res = r.json()`
			`if "error" in res:`
			`error_detail = f"External: {res['error']['message'] if 'message' in res['error'] else res['error']}"`
			`except:`
			`error_detail = f"External: {e}"`

			`raise HTTPException(`
			`status_code=r.status_code if r else 500, detail=error_detail`
			`)`