forked from open-webui/open-webui
		
	feat: multiple ollama support
This commit is contained in:
		
							parent
							
								
									475105473c
								
							
						
					
					
						commit
						f04d60b6d9
					
				
					 4 changed files with 831 additions and 62 deletions
				
			
		|  | @ -3,16 +3,23 @@ from fastapi.middleware.cors import CORSMiddleware | |||
| from fastapi.responses import StreamingResponse | ||||
| from fastapi.concurrency import run_in_threadpool | ||||
| 
 | ||||
| from pydantic import BaseModel | ||||
| 
 | ||||
| import random | ||||
| import requests | ||||
| import json | ||||
| import uuid | ||||
| from pydantic import BaseModel | ||||
| import aiohttp | ||||
| import asyncio | ||||
| 
 | ||||
| from apps.web.models.users import Users | ||||
| from constants import ERROR_MESSAGES | ||||
| from utils.utils import decode_token, get_current_user, get_admin_user | ||||
| from config import OLLAMA_BASE_URL, WEBUI_AUTH | ||||
| 
 | ||||
| from typing import Optional, List, Union | ||||
| 
 | ||||
| 
 | ||||
| app = FastAPI() | ||||
| app.add_middleware( | ||||
|     CORSMiddleware, | ||||
|  | @ -23,26 +30,39 @@ app.add_middleware( | |||
| ) | ||||
| 
 | ||||
| app.state.OLLAMA_BASE_URL = OLLAMA_BASE_URL | ||||
| 
 | ||||
| # TARGET_SERVER_URL = OLLAMA_API_BASE_URL | ||||
| app.state.OLLAMA_BASE_URLS = [OLLAMA_BASE_URL] | ||||
| app.state.MODELS = {} | ||||
| 
 | ||||
| 
 | ||||
| REQUEST_POOL = [] | ||||
| 
 | ||||
| 
 | ||||
| @app.get("/url") | ||||
| async def get_ollama_api_url(user=Depends(get_admin_user)): | ||||
|     return {"OLLAMA_BASE_URL": app.state.OLLAMA_BASE_URL} | ||||
| @app.middleware("http") | ||||
| async def check_url(request: Request, call_next): | ||||
|     if len(app.state.MODELS) == 0: | ||||
|         await get_all_models() | ||||
|     else: | ||||
|         pass | ||||
| 
 | ||||
|     response = await call_next(request) | ||||
|     return response | ||||
| 
 | ||||
| 
 | ||||
| @app.get("/urls") | ||||
| async def get_ollama_api_urls(user=Depends(get_admin_user)): | ||||
|     return {"OLLAMA_BASE_URLS": app.state.OLLAMA_BASE_URLS} | ||||
| 
 | ||||
| 
 | ||||
| class UrlUpdateForm(BaseModel): | ||||
|     url: str | ||||
|     urls: List[str] | ||||
| 
 | ||||
| 
 | ||||
| @app.post("/url/update") | ||||
| @app.post("/urls/update") | ||||
| async def update_ollama_api_url(form_data: UrlUpdateForm, user=Depends(get_admin_user)): | ||||
|     app.state.OLLAMA_BASE_URL = form_data.url | ||||
|     return {"OLLAMA_BASE_URL": app.state.OLLAMA_BASE_URL} | ||||
|     app.state.OLLAMA_BASE_URLS = form_data.urls | ||||
| 
 | ||||
|     print(app.state.OLLAMA_BASE_URLS) | ||||
|     return {"OLLAMA_BASE_URLS": app.state.OLLAMA_BASE_URLS} | ||||
| 
 | ||||
| 
 | ||||
| @app.get("/cancel/{request_id}") | ||||
|  | @ -55,9 +75,695 @@ async def cancel_ollama_request(request_id: str, user=Depends(get_current_user)) | |||
|         raise HTTPException(status_code=401, detail=ERROR_MESSAGES.ACCESS_PROHIBITED) | ||||
| 
 | ||||
| 
 | ||||
| async def fetch_url(url): | ||||
|     try: | ||||
|         async with aiohttp.ClientSession() as session: | ||||
|             async with session.get(url) as response: | ||||
|                 return await response.json() | ||||
|     except Exception as e: | ||||
|         # Handle connection error here | ||||
|         print(f"Connection error: {e}") | ||||
|         return None | ||||
| 
 | ||||
| 
 | ||||
| def merge_models_lists(model_lists): | ||||
|     merged_models = {} | ||||
| 
 | ||||
|     for idx, model_list in enumerate(model_lists): | ||||
|         for model in model_list: | ||||
|             digest = model["digest"] | ||||
|             if digest not in merged_models: | ||||
|                 model["urls"] = [idx] | ||||
|                 merged_models[digest] = model | ||||
|             else: | ||||
|                 merged_models[digest]["urls"].append(idx) | ||||
| 
 | ||||
|     return list(merged_models.values()) | ||||
| 
 | ||||
| 
 | ||||
| # user=Depends(get_current_user) | ||||
| 
 | ||||
| 
 | ||||
| async def get_all_models(): | ||||
|     print("get_all_models") | ||||
|     tasks = [fetch_url(f"{url}/api/tags") for url in app.state.OLLAMA_BASE_URLS] | ||||
|     responses = await asyncio.gather(*tasks) | ||||
|     responses = list(filter(lambda x: x is not None, responses)) | ||||
| 
 | ||||
|     models = { | ||||
|         "models": merge_models_lists( | ||||
|             map(lambda response: response["models"], responses) | ||||
|         ) | ||||
|     } | ||||
|     app.state.MODELS = {model["model"]: model for model in models["models"]} | ||||
| 
 | ||||
|     return models | ||||
| 
 | ||||
| 
 | ||||
| @app.get("/api/tags") | ||||
| @app.get("/api/tags/{url_idx}") | ||||
| async def get_ollama_tags( | ||||
|     url_idx: Optional[int] = None, user=Depends(get_current_user) | ||||
| ): | ||||
| 
 | ||||
|     if url_idx == None: | ||||
|         return await get_all_models() | ||||
|     else: | ||||
|         url = app.state.OLLAMA_BASE_URLS[url_idx] | ||||
|         try: | ||||
|             r = requests.request(method="GET", url=f"{url}/api/tags") | ||||
|             r.raise_for_status() | ||||
| 
 | ||||
|             return r.json() | ||||
|         except Exception as e: | ||||
|             print(e) | ||||
|             error_detail = "Open WebUI: Server Connection Error" | ||||
|             if r is not None: | ||||
|                 try: | ||||
|                     res = r.json() | ||||
|                     if "error" in res: | ||||
|                         error_detail = f"Ollama: {res['error']}" | ||||
|                 except: | ||||
|                     error_detail = f"Ollama: {e}" | ||||
| 
 | ||||
|             raise HTTPException( | ||||
|                 status_code=r.status_code if r else 500, | ||||
|                 detail=error_detail, | ||||
|             ) | ||||
| 
 | ||||
| 
 | ||||
| @app.get("/api/version") | ||||
| @app.get("/api/version/{url_idx}") | ||||
| async def get_ollama_versions(url_idx: Optional[int] = None): | ||||
| 
 | ||||
|     if url_idx == None: | ||||
| 
 | ||||
|         # returns lowest version | ||||
|         tasks = [fetch_url(f"{url}/api/version") for url in app.state.OLLAMA_BASE_URLS] | ||||
|         responses = await asyncio.gather(*tasks) | ||||
|         responses = list(filter(lambda x: x is not None, responses)) | ||||
| 
 | ||||
|         lowest_version = min( | ||||
|             responses, key=lambda x: tuple(map(int, x["version"].split("."))) | ||||
|         ) | ||||
| 
 | ||||
|         return {"version": lowest_version["version"]} | ||||
|     else: | ||||
|         url = app.state.OLLAMA_BASE_URLS[url_idx] | ||||
|         try: | ||||
|             r = requests.request(method="GET", url=f"{url}/api/version") | ||||
|             r.raise_for_status() | ||||
| 
 | ||||
|             return r.json() | ||||
|         except Exception as e: | ||||
|             print(e) | ||||
|             error_detail = "Open WebUI: Server Connection Error" | ||||
|             if r is not None: | ||||
|                 try: | ||||
|                     res = r.json() | ||||
|                     if "error" in res: | ||||
|                         error_detail = f"Ollama: {res['error']}" | ||||
|                 except: | ||||
|                     error_detail = f"Ollama: {e}" | ||||
| 
 | ||||
|             raise HTTPException( | ||||
|                 status_code=r.status_code if r else 500, | ||||
|                 detail=error_detail, | ||||
|             ) | ||||
| 
 | ||||
| 
 | ||||
| class ModelNameForm(BaseModel): | ||||
|     name: str | ||||
| 
 | ||||
| 
 | ||||
| @app.post("/api/pull") | ||||
| @app.post("/api/pull/{url_idx}") | ||||
| async def pull_model( | ||||
|     form_data: ModelNameForm, url_idx: int = 0, user=Depends(get_admin_user) | ||||
| ): | ||||
|     url = app.state.OLLAMA_BASE_URLS[url_idx] | ||||
|     r = None | ||||
| 
 | ||||
|     def get_request(url): | ||||
|         nonlocal r | ||||
|         try: | ||||
| 
 | ||||
|             def stream_content(): | ||||
|                 for chunk in r.iter_content(chunk_size=8192): | ||||
|                     yield chunk | ||||
| 
 | ||||
|             r = requests.request( | ||||
|                 method="POST", | ||||
|                 url=f"{url}/api/pull", | ||||
|                 data=form_data.model_dump_json(exclude_none=True), | ||||
|                 stream=True, | ||||
|             ) | ||||
| 
 | ||||
|             r.raise_for_status() | ||||
| 
 | ||||
|             return StreamingResponse( | ||||
|                 stream_content(), | ||||
|                 status_code=r.status_code, | ||||
|                 headers=dict(r.headers), | ||||
|             ) | ||||
|         except Exception as e: | ||||
|             raise e | ||||
| 
 | ||||
|     try: | ||||
|         return await run_in_threadpool(get_request(url)) | ||||
|     except Exception as e: | ||||
|         print(e) | ||||
|         error_detail = "Open WebUI: Server Connection Error" | ||||
|         if r is not None: | ||||
|             try: | ||||
|                 res = r.json() | ||||
|                 if "error" in res: | ||||
|                     error_detail = f"Ollama: {res['error']}" | ||||
|             except: | ||||
|                 error_detail = f"Ollama: {e}" | ||||
| 
 | ||||
|         raise HTTPException( | ||||
|             status_code=r.status_code if r else 500, | ||||
|             detail=error_detail, | ||||
|         ) | ||||
| 
 | ||||
| 
 | ||||
| class PushModelForm(BaseModel): | ||||
|     name: str | ||||
|     insecure: Optional[bool] = None | ||||
|     stream: Optional[bool] = None | ||||
| 
 | ||||
| 
 | ||||
| @app.delete("/api/push") | ||||
| @app.delete("/api/push/{url_idx}") | ||||
| async def push_model( | ||||
|     form_data: PushModelForm, | ||||
|     url_idx: Optional[int] = None, | ||||
|     user=Depends(get_admin_user), | ||||
| ): | ||||
|     if url_idx == None: | ||||
|         if form_data.name in app.state.MODELS: | ||||
|             url_idx = app.state.MODELS[form_data.name]["urls"][0] | ||||
|         else: | ||||
|             raise HTTPException( | ||||
|                 status_code=400, | ||||
|                 detail="error_detail", | ||||
|             ) | ||||
| 
 | ||||
|     url = app.state.OLLAMA_BASE_URLS[url_idx] | ||||
| 
 | ||||
|     r = None | ||||
| 
 | ||||
|     def get_request(): | ||||
|         nonlocal url | ||||
|         nonlocal r | ||||
|         try: | ||||
| 
 | ||||
|             def stream_content(): | ||||
|                 for chunk in r.iter_content(chunk_size=8192): | ||||
|                     yield chunk | ||||
| 
 | ||||
|             r = requests.request( | ||||
|                 method="POST", | ||||
|                 url=f"{url}/api/push", | ||||
|                 data=form_data.model_dump_json(exclude_none=True), | ||||
|             ) | ||||
| 
 | ||||
|             r.raise_for_status() | ||||
| 
 | ||||
|             return StreamingResponse( | ||||
|                 stream_content(), | ||||
|                 status_code=r.status_code, | ||||
|                 headers=dict(r.headers), | ||||
|             ) | ||||
|         except Exception as e: | ||||
|             raise e | ||||
| 
 | ||||
|     try: | ||||
|         return await run_in_threadpool(get_request) | ||||
|     except Exception as e: | ||||
|         print(e) | ||||
|         error_detail = "Open WebUI: Server Connection Error" | ||||
|         if r is not None: | ||||
|             try: | ||||
|                 res = r.json() | ||||
|                 if "error" in res: | ||||
|                     error_detail = f"Ollama: {res['error']}" | ||||
|             except: | ||||
|                 error_detail = f"Ollama: {e}" | ||||
| 
 | ||||
|         raise HTTPException( | ||||
|             status_code=r.status_code if r else 500, | ||||
|             detail=error_detail, | ||||
|         ) | ||||
| 
 | ||||
| 
 | ||||
| class CreateModelForm(BaseModel): | ||||
|     name: str | ||||
|     modelfile: Optional[str] = None | ||||
|     stream: Optional[bool] = None | ||||
|     path: Optional[str] = None | ||||
| 
 | ||||
| 
 | ||||
| @app.post("/api/create") | ||||
| @app.post("/api/create/{url_idx}") | ||||
| async def create_model( | ||||
|     form_data: CreateModelForm, url_idx: int = 0, user=Depends(get_admin_user) | ||||
| ): | ||||
|     print(form_data) | ||||
|     url = app.state.OLLAMA_BASE_URLS[url_idx] | ||||
|     r = None | ||||
| 
 | ||||
|     def get_request(): | ||||
|         nonlocal url | ||||
|         nonlocal r | ||||
|         try: | ||||
| 
 | ||||
|             def stream_content(): | ||||
|                 for chunk in r.iter_content(chunk_size=8192): | ||||
|                     yield chunk | ||||
| 
 | ||||
|             r = requests.request( | ||||
|                 method="POST", | ||||
|                 url=f"{url}/api/create", | ||||
|                 data=form_data.model_dump_json(exclude_none=True), | ||||
|                 stream=True, | ||||
|             ) | ||||
| 
 | ||||
|             r.raise_for_status() | ||||
| 
 | ||||
|             print(r) | ||||
| 
 | ||||
|             return StreamingResponse( | ||||
|                 stream_content(), | ||||
|                 status_code=r.status_code, | ||||
|                 headers=dict(r.headers), | ||||
|             ) | ||||
|         except Exception as e: | ||||
|             raise e | ||||
| 
 | ||||
|     try: | ||||
|         return await run_in_threadpool(get_request) | ||||
|     except Exception as e: | ||||
|         print(e) | ||||
|         error_detail = "Open WebUI: Server Connection Error" | ||||
|         if r is not None: | ||||
|             try: | ||||
|                 res = r.json() | ||||
|                 if "error" in res: | ||||
|                     error_detail = f"Ollama: {res['error']}" | ||||
|             except: | ||||
|                 error_detail = f"Ollama: {e}" | ||||
| 
 | ||||
|         raise HTTPException( | ||||
|             status_code=r.status_code if r else 500, | ||||
|             detail=error_detail, | ||||
|         ) | ||||
| 
 | ||||
| 
 | ||||
| class CopyModelForm(BaseModel): | ||||
|     source: str | ||||
|     destination: str | ||||
| 
 | ||||
| 
 | ||||
| @app.post("/api/copy") | ||||
| @app.post("/api/copy/{url_idx}") | ||||
| async def copy_model( | ||||
|     form_data: CopyModelForm, | ||||
|     url_idx: Optional[int] = None, | ||||
|     user=Depends(get_admin_user), | ||||
| ): | ||||
|     if url_idx == None: | ||||
|         if form_data.source in app.state.MODELS: | ||||
|             url_idx = app.state.MODELS[form_data.source]["urls"][0] | ||||
|         else: | ||||
|             raise HTTPException( | ||||
|                 status_code=400, | ||||
|                 detail="error_detail", | ||||
|             ) | ||||
| 
 | ||||
|     url = app.state.OLLAMA_BASE_URLS[url_idx] | ||||
| 
 | ||||
|     try: | ||||
|         r = requests.request( | ||||
|             method="POST", | ||||
|             url=f"{url}/api/copy", | ||||
|             data=form_data.model_dump_json(exclude_none=True), | ||||
|         ) | ||||
|         r.raise_for_status() | ||||
| 
 | ||||
|         print(r.text) | ||||
| 
 | ||||
|         return True | ||||
|     except Exception as e: | ||||
|         print(e) | ||||
|         error_detail = "Open WebUI: Server Connection Error" | ||||
|         if r is not None: | ||||
|             try: | ||||
|                 res = r.json() | ||||
|                 if "error" in res: | ||||
|                     error_detail = f"Ollama: {res['error']}" | ||||
|             except: | ||||
|                 error_detail = f"Ollama: {e}" | ||||
| 
 | ||||
|         raise HTTPException( | ||||
|             status_code=r.status_code if r else 500, | ||||
|             detail=error_detail, | ||||
|         ) | ||||
| 
 | ||||
| 
 | ||||
| @app.delete("/api/delete") | ||||
| @app.delete("/api/delete/{url_idx}") | ||||
| async def delete_model( | ||||
|     form_data: ModelNameForm, | ||||
|     url_idx: Optional[int] = None, | ||||
|     user=Depends(get_admin_user), | ||||
| ): | ||||
|     if url_idx == None: | ||||
|         if form_data.name in app.state.MODELS: | ||||
|             url_idx = app.state.MODELS[form_data.name]["urls"][0] | ||||
|         else: | ||||
|             raise HTTPException( | ||||
|                 status_code=400, | ||||
|                 detail="error_detail", | ||||
|             ) | ||||
| 
 | ||||
|     url = app.state.OLLAMA_BASE_URLS[url_idx] | ||||
| 
 | ||||
|     try: | ||||
|         r = requests.request( | ||||
|             method="DELETE", | ||||
|             url=f"{url}/api/delete", | ||||
|             data=form_data.model_dump_json(exclude_none=True), | ||||
|         ) | ||||
|         r.raise_for_status() | ||||
| 
 | ||||
|         print(r.text) | ||||
| 
 | ||||
|         return True | ||||
|     except Exception as e: | ||||
|         print(e) | ||||
|         error_detail = "Open WebUI: Server Connection Error" | ||||
|         if r is not None: | ||||
|             try: | ||||
|                 res = r.json() | ||||
|                 if "error" in res: | ||||
|                     error_detail = f"Ollama: {res['error']}" | ||||
|             except: | ||||
|                 error_detail = f"Ollama: {e}" | ||||
| 
 | ||||
|         raise HTTPException( | ||||
|             status_code=r.status_code if r else 500, | ||||
|             detail=error_detail, | ||||
|         ) | ||||
| 
 | ||||
| 
 | ||||
| @app.post("/api/show") | ||||
| async def show_model_info(form_data: ModelNameForm, user=Depends(get_current_user)): | ||||
|     if form_data.name not in app.state.MODELS: | ||||
|         raise HTTPException( | ||||
|             status_code=400, | ||||
|             detail="error_detail", | ||||
|         ) | ||||
| 
 | ||||
|     url_idx = random.choice(app.state.MODELS[form_data.name]["urls"]) | ||||
|     url = app.state.OLLAMA_BASE_URLS[url_idx] | ||||
| 
 | ||||
|     try: | ||||
|         r = requests.request( | ||||
|             method="POST", | ||||
|             url=f"{url}/api/show", | ||||
|             data=form_data.model_dump_json(exclude_none=True), | ||||
|         ) | ||||
|         r.raise_for_status() | ||||
| 
 | ||||
|         return r.json() | ||||
|     except Exception as e: | ||||
|         print(e) | ||||
|         error_detail = "Open WebUI: Server Connection Error" | ||||
|         if r is not None: | ||||
|             try: | ||||
|                 res = r.json() | ||||
|                 if "error" in res: | ||||
|                     error_detail = f"Ollama: {res['error']}" | ||||
|             except: | ||||
|                 error_detail = f"Ollama: {e}" | ||||
| 
 | ||||
|         raise HTTPException( | ||||
|             status_code=r.status_code if r else 500, | ||||
|             detail=error_detail, | ||||
|         ) | ||||
| 
 | ||||
| 
 | ||||
| class GenerateEmbeddingsForm(BaseModel): | ||||
|     model: str | ||||
|     prompt: str | ||||
|     options: Optional[dict] = None | ||||
|     keep_alive: Optional[Union[int, str]] = None | ||||
| 
 | ||||
| 
 | ||||
| @app.post("/api/embeddings") | ||||
| @app.post("/api/embeddings/{url_idx}") | ||||
| async def generate_embeddings( | ||||
|     form_data: GenerateEmbeddingsForm, | ||||
|     url_idx: Optional[int] = None, | ||||
|     user=Depends(get_current_user), | ||||
| ): | ||||
|     if url_idx == None: | ||||
|         if form_data.model in app.state.MODELS: | ||||
|             url_idx = random.choice(app.state.MODELS[form_data.model]["urls"]) | ||||
|         else: | ||||
|             raise HTTPException( | ||||
|                 status_code=400, | ||||
|                 detail="error_detail", | ||||
|             ) | ||||
| 
 | ||||
|     url = app.state.OLLAMA_BASE_URLS[url_idx] | ||||
| 
 | ||||
|     try: | ||||
|         r = requests.request( | ||||
|             method="POST", | ||||
|             url=f"{url}/api/embeddings", | ||||
|             data=form_data.model_dump_json(exclude_none=True), | ||||
|         ) | ||||
|         r.raise_for_status() | ||||
| 
 | ||||
|         return r.json() | ||||
|     except Exception as e: | ||||
|         print(e) | ||||
|         error_detail = "Open WebUI: Server Connection Error" | ||||
|         if r is not None: | ||||
|             try: | ||||
|                 res = r.json() | ||||
|                 if "error" in res: | ||||
|                     error_detail = f"Ollama: {res['error']}" | ||||
|             except: | ||||
|                 error_detail = f"Ollama: {e}" | ||||
| 
 | ||||
|         raise HTTPException( | ||||
|             status_code=r.status_code if r else 500, | ||||
|             detail=error_detail, | ||||
|         ) | ||||
| 
 | ||||
| 
 | ||||
| class GenerateCompletionForm(BaseModel): | ||||
|     model: str | ||||
|     prompt: str | ||||
|     images: Optional[List[str]] = None | ||||
|     format: Optional[str] = None | ||||
|     options: Optional[dict] = None | ||||
|     system: Optional[str] = None | ||||
|     template: Optional[str] = None | ||||
|     context: Optional[str] = None | ||||
|     stream: Optional[bool] = True | ||||
|     raw: Optional[bool] = None | ||||
|     keep_alive: Optional[Union[int, str]] = None | ||||
| 
 | ||||
| 
 | ||||
| @app.post("/api/generate") | ||||
| @app.post("/api/generate/{url_idx}") | ||||
| async def generate_completion( | ||||
|     form_data: GenerateCompletionForm, | ||||
|     url_idx: Optional[int] = None, | ||||
|     user=Depends(get_current_user), | ||||
| ): | ||||
| 
 | ||||
|     if url_idx == None: | ||||
|         if form_data.model in app.state.MODELS: | ||||
|             url_idx = random.choice(app.state.MODELS[form_data.model]["urls"]) | ||||
|         else: | ||||
|             raise HTTPException( | ||||
|                 status_code=400, | ||||
|                 detail="error_detail", | ||||
|             ) | ||||
| 
 | ||||
|     url = app.state.OLLAMA_BASE_URLS[url_idx] | ||||
| 
 | ||||
|     r = None | ||||
| 
 | ||||
|     def get_request(): | ||||
|         nonlocal form_data | ||||
|         nonlocal r | ||||
| 
 | ||||
|         request_id = str(uuid.uuid4()) | ||||
|         try: | ||||
|             REQUEST_POOL.append(request_id) | ||||
| 
 | ||||
|             def stream_content(): | ||||
|                 try: | ||||
|                     if form_data.stream: | ||||
|                         yield json.dumps({"id": request_id, "done": False}) + "\n" | ||||
| 
 | ||||
|                     for chunk in r.iter_content(chunk_size=8192): | ||||
|                         if request_id in REQUEST_POOL: | ||||
|                             yield chunk | ||||
|                         else: | ||||
|                             print("User: canceled request") | ||||
|                             break | ||||
|                 finally: | ||||
|                     if hasattr(r, "close"): | ||||
|                         r.close() | ||||
|                         if request_id in REQUEST_POOL: | ||||
|                             REQUEST_POOL.remove(request_id) | ||||
| 
 | ||||
|             r = requests.request( | ||||
|                 method="POST", | ||||
|                 url=f"{url}/api/generate", | ||||
|                 data=form_data.model_dump_json(exclude_none=True), | ||||
|                 stream=True, | ||||
|             ) | ||||
| 
 | ||||
|             r.raise_for_status() | ||||
| 
 | ||||
|             return StreamingResponse( | ||||
|                 stream_content(), | ||||
|                 status_code=r.status_code, | ||||
|                 headers=dict(r.headers), | ||||
|             ) | ||||
|         except Exception as e: | ||||
|             raise e | ||||
| 
 | ||||
|     try: | ||||
|         return await run_in_threadpool(get_request) | ||||
|     except Exception as e: | ||||
|         error_detail = "Open WebUI: Server Connection Error" | ||||
|         if r is not None: | ||||
|             try: | ||||
|                 res = r.json() | ||||
|                 if "error" in res: | ||||
|                     error_detail = f"Ollama: {res['error']}" | ||||
|             except: | ||||
|                 error_detail = f"Ollama: {e}" | ||||
| 
 | ||||
|         raise HTTPException( | ||||
|             status_code=r.status_code if r else 500, | ||||
|             detail=error_detail, | ||||
|         ) | ||||
| 
 | ||||
| 
 | ||||
| class ChatMessage(BaseModel): | ||||
|     role: str | ||||
|     content: str | ||||
|     images: Optional[List[str]] = None | ||||
| 
 | ||||
| 
 | ||||
| class GenerateChatCompletionForm(BaseModel): | ||||
|     model: str | ||||
|     messages: List[ChatMessage] | ||||
|     format: Optional[str] = None | ||||
|     options: Optional[dict] = None | ||||
|     template: Optional[str] = None | ||||
|     stream: Optional[bool] = True | ||||
|     keep_alive: Optional[Union[int, str]] = None | ||||
| 
 | ||||
| 
 | ||||
| @app.post("/api/chat") | ||||
| @app.post("/api/chat/{url_idx}") | ||||
| async def generate_completion( | ||||
|     form_data: GenerateChatCompletionForm, | ||||
|     url_idx: Optional[int] = None, | ||||
|     user=Depends(get_current_user), | ||||
| ): | ||||
| 
 | ||||
|     if url_idx == None: | ||||
|         if form_data.model in app.state.MODELS: | ||||
|             url_idx = random.choice(app.state.MODELS[form_data.model]["urls"]) | ||||
|         else: | ||||
|             raise HTTPException( | ||||
|                 status_code=400, | ||||
|                 detail="error_detail", | ||||
|             ) | ||||
| 
 | ||||
|     url = app.state.OLLAMA_BASE_URLS[url_idx] | ||||
| 
 | ||||
|     r = None | ||||
| 
 | ||||
|     print(form_data.model_dump_json(exclude_none=True)) | ||||
| 
 | ||||
|     def get_request(): | ||||
|         nonlocal form_data | ||||
|         nonlocal r | ||||
| 
 | ||||
|         request_id = str(uuid.uuid4()) | ||||
|         try: | ||||
|             REQUEST_POOL.append(request_id) | ||||
| 
 | ||||
|             def stream_content(): | ||||
|                 try: | ||||
|                     if form_data.stream: | ||||
|                         yield json.dumps({"id": request_id, "done": False}) + "\n" | ||||
| 
 | ||||
|                     for chunk in r.iter_content(chunk_size=8192): | ||||
|                         if request_id in REQUEST_POOL: | ||||
|                             yield chunk | ||||
|                         else: | ||||
|                             print("User: canceled request") | ||||
|                             break | ||||
|                 finally: | ||||
|                     if hasattr(r, "close"): | ||||
|                         r.close() | ||||
|                         if request_id in REQUEST_POOL: | ||||
|                             REQUEST_POOL.remove(request_id) | ||||
| 
 | ||||
|             r = requests.request( | ||||
|                 method="POST", | ||||
|                 url=f"{url}/api/chat", | ||||
|                 data=form_data.model_dump_json(exclude_none=True), | ||||
|                 stream=True, | ||||
|             ) | ||||
| 
 | ||||
|             r.raise_for_status() | ||||
| 
 | ||||
|             return StreamingResponse( | ||||
|                 stream_content(), | ||||
|                 status_code=r.status_code, | ||||
|                 headers=dict(r.headers), | ||||
|             ) | ||||
|         except Exception as e: | ||||
|             raise e | ||||
| 
 | ||||
|     try: | ||||
|         return await run_in_threadpool(get_request) | ||||
|     except Exception as e: | ||||
|         error_detail = "Open WebUI: Server Connection Error" | ||||
|         if r is not None: | ||||
|             try: | ||||
|                 res = r.json() | ||||
|                 if "error" in res: | ||||
|                     error_detail = f"Ollama: {res['error']}" | ||||
|             except: | ||||
|                 error_detail = f"Ollama: {e}" | ||||
| 
 | ||||
|         raise HTTPException( | ||||
|             status_code=r.status_code if r else 500, | ||||
|             detail=error_detail, | ||||
|         ) | ||||
| 
 | ||||
| 
 | ||||
| @app.api_route("/{path:path}", methods=["GET", "POST", "PUT", "DELETE"]) | ||||
| async def proxy(path: str, request: Request, user=Depends(get_current_user)): | ||||
|     target_url = f"{app.state.OLLAMA_BASE_URL}/{path}" | ||||
|     url = app.state.OLLAMA_BASE_URLS[0] | ||||
|     target_url = f"{url}/{path}" | ||||
| 
 | ||||
|     body = await request.body() | ||||
|     headers = dict(request.headers) | ||||
|  |  | |||
		Loading…
	
	Add table
		Add a link
		
	
		Reference in a new issue
	
	 Timothy J. Baek
						Timothy J. Baek