Merge pull request #1107 from open-webui/dev

0.1.111
2024-03-10 17:00:56 -05:00 · 2024-03-10 17:00:56 -05:00 · 89634046e7
commit 89634046e7
parent 04ddbf4306 88d324b52d
37 changed files with 1571 additions and 782 deletions
--- a/.github/workflows/build-release.yml
+++ b/.github/workflows/build-release.yml
@ -29,11 +29,11 @@ jobs:
    - name: Extract latest CHANGELOG entry
      id: changelog
      run: |
-        CHANGELOG_CONTENT=$(awk '/^## \[/{n++} n==1' CHANGELOG.md)
+        CHANGELOG_CONTENT=$(awk 'BEGIN {print_section=0;} /^## \[/ {if (print_section == 0) {print_section=1;} else {exit;}} print_section {print;}' CHANGELOG.md)
-        echo "CHANGELOG_CONTENT<<EOF" 
+        CHANGELOG_ESCAPED=$(echo "$CHANGELOG_CONTENT" | sed ':a;N;$!ba;s/\n/%0A/g')
-        echo "$CHANGELOG_CONTENT"
+        echo "Extracted latest release notes from CHANGELOG.md:" 
-        echo "EOF" 
+        echo -e "$CHANGELOG_CONTENT" 
-        echo "::set-output name=content::${CHANGELOG_CONTENT}"
+        echo "::set-output name=content::$CHANGELOG_ESCAPED"
    - name: Create GitHub release
      uses: actions/github-script@v5
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@ -5,6 +5,24 @@ All notable changes to this project will be documented in this file.
 The format is based on [Keep a Changelog](https://keepachangelog.com/en/1.1.0/),
 and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0.html).
 ## [0.1.111] - 2024-03-10
 ### Added
 - 🛡️ **Model Whitelisting**: Admins now have the ability to whitelist models for users with the 'user' role.
 - 🔄 **Update All Models**: Added a convenient button to update all models at once.
 - 📄 **Toggle PDF OCR**: Users can now toggle PDF OCR option for improved parsing performance.
 - 🎨 **DALL-E Integration**: Introduced DALL-E integration for image generation alongside automatic1111.
 - 🛠️ **RAG API Refactoring**: Refactored RAG logic and exposed its API, with additional documentation to follow.
 ### Fixed
 - 🔒 **Max Token Settings**: Added max token settings for anthropic/claude-3-sonnet-20240229 (Issue #1094).
 - 🔧 **Misalignment Issue**: Corrected misalignment of Edit and Delete Icons when Chat Title is Empty (Issue #1104).
 - 🔄 **Context Loss Fix**: Resolved RAG losing context on model response regeneration with Groq models via API key (Issue #1105).
 - 📁 **File Handling Bug**: Addressed File Not Found Notification when Dropping a Conversation Element (Issue #1098).
 - 🖱️ **Dragged File Styling**: Fixed dragged file layover styling issue.
 ## [0.1.110] - 2024-03-06
 ### Added
--- a/2
+++ b/2
@ -41,7 +41,7 @@ ENV WHISPER_MODEL_DIR="/app/backend/data/cache/whisper/models"
 # for better persormance and multilangauge support use "intfloat/multilingual-e5-large" (~2.5GB) or "intfloat/multilingual-e5-base" (~1.5GB)
 # IMPORTANT: If you change the default model (all-MiniLM-L6-v2) and vice versa, you aren't able to use RAG Chat with your previous documents loaded in the WebUI! You need to re-embed them.
 ENV RAG_EMBEDDING_MODEL="all-MiniLM-L6-v2"
-# device type for whisper tts and ebbeding models - "cpu" (default), "cuda" (nvidia gpu and CUDA required) or "mps" (apple silicon) - choosing this right can lead to better performance
+# device type for whisper tts and embbeding models - "cpu" (default), "cuda" (nvidia gpu and CUDA required) or "mps" (apple silicon) - choosing this right can lead to better performance
 ENV RAG_EMBEDDING_MODEL_DEVICE_TYPE="cpu"
 ENV RAG_EMBEDDING_MODEL_DIR="/app/backend/data/cache/embedding/models"
 ENV SENTENCE_TRANSFORMERS_HOME $RAG_EMBEDDING_MODEL_DIR
--- a/README.md
+++ b/README.md
@ -53,8 +53,6 @@ User-friendly WebUI for LLMs, supported LLM runners include Ollama and OpenAI-co
 - 💬 **Collaborative Chat**: Harness the collective intelligence of multiple models by seamlessly orchestrating group conversations. Use the `@` command to specify the model, enabling dynamic and diverse dialogues within your chat interface. Immerse yourself in the collective intelligence woven into your chat environment.
 - 🤝 **OpenAI API Integration**: Effortlessly integrate OpenAI-compatible API for versatile conversations alongside Ollama models. Customize the API Base URL to link with **LMStudio, Mistral, OpenRouter, and more**.
 - 🔄 **Regeneration History Access**: Easily revisit and explore your entire regeneration history.
 - 📜 **Chat History**: Effortlessly access and manage your conversation history.
@ -65,8 +63,18 @@ User-friendly WebUI for LLMs, supported LLM runners include Ollama and OpenAI-co
 - ⚙️ **Fine-Tuned Control with Advanced Parameters**: Gain a deeper level of control by adjusting parameters such as temperature and defining your system prompts to tailor the conversation to your specific preferences and needs.
 - 🎨🤖 **Image Generation Integration**: Seamlessly incorporate image generation capabilities using AUTOMATIC1111 API (local) and DALL-E, enriching your chat experience with dynamic visual content.
 - 🤝 **OpenAI API Integration**: Effortlessly integrate OpenAI-compatible API for versatile conversations alongside Ollama models. Customize the API Base URL to link with **LMStudio, Mistral, OpenRouter, and more**.
 - ✨ **Multiple OpenAI-Compatible API Support**: Seamlessly integrate and customize various OpenAI-compatible APIs, enhancing the versatility of your chat interactions.
 - 🔗 **External Ollama Server Connection**: Seamlessly link to an external Ollama server hosted on a different address by configuring the environment variable.
 - 🔀 **Multiple Ollama Instance Load Balancing**: Effortlessly distribute chat requests across multiple Ollama instances for enhanced performance and reliability.
 - 👥 **Multi-User Management**: Easily oversee and administer users via our intuitive admin panel, streamlining user management processes.
 - 🔐 **Role-Based Access Control (RBAC)**: Ensure secure access with restricted permissions; only authorized individuals can access your Ollama, and exclusive model creation/pulling rights are reserved for administrators.
 - 🔒 **Backend Reverse Proxy Support**: Bolster security through direct communication between Open WebUI backend and Ollama. This key feature eliminates the need to expose Ollama over LAN. Requests made to the '/ollama/api' route from the web UI are seamlessly redirected to Ollama from the backend, enhancing overall system security.
--- a/backend/apps/images/main.py
+++ b/backend/apps/images/main.py
@ -21,7 +21,16 @@ from utils.utils import (
 from utils.misc import calculate_sha256
 from typing import Optional
 from pydantic import BaseModel
-from config import AUTOMATIC1111_BASE_URL
+from pathlib import Path
 import uuid
 import base64
 import json
 from config import CACHE_DIR, AUTOMATIC1111_BASE_URL
 IMAGE_CACHE_DIR = Path(CACHE_DIR).joinpath("./image/generations/")
 IMAGE_CACHE_DIR.mkdir(parents=True, exist_ok=True)
 app = FastAPI()
 app.add_middleware(
@ -32,25 +41,34 @@ app.add_middleware(
    allow_headers=["*"],
 )
 app.state.ENGINE = ""
 app.state.ENABLED = False
 app.state.OPENAI_API_KEY = ""
 app.state.MODEL = ""
 app.state.AUTOMATIC1111_BASE_URL = AUTOMATIC1111_BASE_URL
-app.state.ENABLED = app.state.AUTOMATIC1111_BASE_URL != ""
+
 app.state.IMAGE_SIZE = "512x512"
 app.state.IMAGE_STEPS = 50
-@app.get("/enabled", response_model=bool)
+@app.get("/config")
-async def get_enable_status(request: Request, user=Depends(get_admin_user)):
+async def get_config(request: Request, user=Depends(get_admin_user)):
-    return app.state.ENABLED
+    return {"engine": app.state.ENGINE, "enabled": app.state.ENABLED}
-@app.get("/enabled/toggle", response_model=bool)
+class ConfigUpdateForm(BaseModel):
-async def toggle_enabled(request: Request, user=Depends(get_admin_user)):
+    engine: str
-    try:
+    enabled: bool
-        r = requests.head(app.state.AUTOMATIC1111_BASE_URL)
+
-        app.state.ENABLED = not app.state.ENABLED
+
-        return app.state.ENABLED
+@app.post("/config/update")
-    except Exception as e:
+async def update_config(form_data: ConfigUpdateForm, user=Depends(get_admin_user)):
-        raise HTTPException(status_code=400, detail=ERROR_MESSAGES.DEFAULT(e))
+    app.state.ENGINE = form_data.engine
    app.state.ENABLED = form_data.enabled
    return {"engine": app.state.ENGINE, "enabled": app.state.ENABLED}
 class UrlUpdateForm(BaseModel):
@ -58,17 +76,24 @@ class UrlUpdateForm(BaseModel):
@app.get("/url")
-async def get_openai_url(user=Depends(get_admin_user)):
+async def get_automatic1111_url(user=Depends(get_admin_user)):
    return {"AUTOMATIC1111_BASE_URL": app.state.AUTOMATIC1111_BASE_URL}
@app.post("/url/update")
-async def update_openai_url(form_data: UrlUpdateForm, user=Depends(get_admin_user)):
+async def update_automatic1111_url(
    form_data: UrlUpdateForm, user=Depends(get_admin_user)
 ):
    if form_data.url == "":
        app.state.AUTOMATIC1111_BASE_URL = AUTOMATIC1111_BASE_URL
    else:
-        app.state.AUTOMATIC1111_BASE_URL = form_data.url.strip("/")
+        url = form_data.url.strip("/")
        try:
            r = requests.head(url)
            app.state.AUTOMATIC1111_BASE_URL = url
        except Exception as e:
            raise HTTPException(status_code=400, detail=ERROR_MESSAGES.DEFAULT(e))
    return {
        "AUTOMATIC1111_BASE_URL": app.state.AUTOMATIC1111_BASE_URL,
@ -76,6 +101,30 @@ async def update_openai_url(form_data: UrlUpdateForm, user=Depends(get_admin_use
    }
 class OpenAIKeyUpdateForm(BaseModel):
    key: str
@app.get("/key")
 async def get_openai_key(user=Depends(get_admin_user)):
    return {"OPENAI_API_KEY": app.state.OPENAI_API_KEY}
@app.post("/key/update")
 async def update_openai_key(
    form_data: OpenAIKeyUpdateForm, user=Depends(get_admin_user)
 ):
    if form_data.key == "":
        raise HTTPException(status_code=400, detail=ERROR_MESSAGES.API_KEY_NOT_FOUND)
    app.state.OPENAI_API_KEY = form_data.key
    return {
        "OPENAI_API_KEY": app.state.OPENAI_API_KEY,
        "status": True,
    }
 class ImageSizeUpdateForm(BaseModel):
    size: str
@ -132,9 +181,22 @@ async def update_image_size(
@app.get("/models")
 def get_models(user=Depends(get_current_user)):
    try:
-        r = requests.get(url=f"{app.state.AUTOMATIC1111_BASE_URL}/sdapi/v1/sd-models")
+        if app.state.ENGINE == "openai":
            return [
                {"id": "dall-e-2", "name": "DALL·E 2"},
                {"id": "dall-e-3", "name": "DALL·E 3"},
            ]
        else:
            r = requests.get(
                url=f"{app.state.AUTOMATIC1111_BASE_URL}/sdapi/v1/sd-models"
            )
            models = r.json()
-        return models
+            return list(
                map(
                    lambda model: {"id": model["title"], "name": model["model_name"]},
                    models,
                )
            )
    except Exception as e:
        app.state.ENABLED = False
        raise HTTPException(status_code=400, detail=ERROR_MESSAGES.DEFAULT(e))
@ -143,9 +205,11 @@ def get_models(user=Depends(get_current_user)):
@app.get("/models/default")
 async def get_default_model(user=Depends(get_admin_user)):
    try:
        if app.state.ENGINE == "openai":
            return {"model": app.state.MODEL if app.state.MODEL else "dall-e-2"}
        else:
            r = requests.get(url=f"{app.state.AUTOMATIC1111_BASE_URL}/sdapi/v1/options")
            options = r.json()
            return {"model": options["sd_model_checkpoint"]}
    except Exception as e:
        app.state.ENABLED = False
@ -157,6 +221,11 @@ class UpdateModelForm(BaseModel):
 def set_model_handler(model: str):
    if app.state.ENGINE == "openai":
        app.state.MODEL = model
        return app.state.MODEL
    else:
        r = requests.get(url=f"{app.state.AUTOMATIC1111_BASE_URL}/sdapi/v1/options")
        options = r.json()
@ -181,19 +250,72 @@ class GenerateImageForm(BaseModel):
    model: Optional[str] = None
    prompt: str
    n: int = 1
-    size: str = "512x512"
+    size: Optional[str] = None
    negative_prompt: Optional[str] = None
 def save_b64_image(b64_str):
    image_id = str(uuid.uuid4())
    file_path = IMAGE_CACHE_DIR.joinpath(f"{image_id}.png")
    try:
        # Split the base64 string to get the actual image data
        img_data = base64.b64decode(b64_str)
        # Write the image data to a file
        with open(file_path, "wb") as f:
            f.write(img_data)
        return image_id
    except Exception as e:
        print(f"Error saving image: {e}")
        return None
@app.post("/generations")
 def generate_image(
    form_data: GenerateImageForm,
    user=Depends(get_current_user),
 ):
-    print(form_data)
+    r = None
    try:
        if app.state.ENGINE == "openai":
            headers = {}
            headers["Authorization"] = f"Bearer {app.state.OPENAI_API_KEY}"
            headers["Content-Type"] = "application/json"
            data = {
                "model": app.state.MODEL if app.state.MODEL != "" else "dall-e-2",
                "prompt": form_data.prompt,
                "n": form_data.n,
                "size": form_data.size if form_data.size else app.state.IMAGE_SIZE,
                "response_format": "b64_json",
            }
            r = requests.post(
                url=f"https://api.openai.com/v1/images/generations",
                json=data,
                headers=headers,
            )
            r.raise_for_status()
            res = r.json()
            images = []
            for image in res["data"]:
                image_id = save_b64_image(image["b64_json"])
                images.append({"url": f"/cache/image/generations/{image_id}.png"})
                file_body_path = IMAGE_CACHE_DIR.joinpath(f"{image_id}.json")
                with open(file_body_path, "w") as f:
                    json.dump(data, f)
            return images
        else:
            if form_data.model:
                set_model_handler(form_data.model)
@ -212,14 +334,29 @@ def generate_image(
            if form_data.negative_prompt != None:
                data["negative_prompt"] = form_data.negative_prompt
        print(data)
            r = requests.post(
                url=f"{app.state.AUTOMATIC1111_BASE_URL}/sdapi/v1/txt2img",
                json=data,
            )
-        return r.json()
+            res = r.json()
            print(res)
            images = []
            for image in res["images"]:
                image_id = save_b64_image(image)
                images.append({"url": f"/cache/image/generations/{image_id}.png"})
                file_body_path = IMAGE_CACHE_DIR.joinpath(f"{image_id}.json")
                with open(file_body_path, "w") as f:
                    json.dump({**data, "info": res["info"]}, f)
            return images
    except Exception as e:
        print(e)
        if r:
            print(r.json())
        raise HTTPException(status_code=400, detail=ERROR_MESSAGES.DEFAULT(e))
--- a/backend/apps/litellm/main.py
+++ b/backend/apps/litellm/main.py
@ -0,0 +1,41 @@
 from litellm.proxy.proxy_server import ProxyConfig, initialize
 from litellm.proxy.proxy_server import app
 from fastapi import FastAPI, Request, Depends, status
 from fastapi.responses import JSONResponse
 from utils.utils import get_http_authorization_cred, get_current_user
 from config import ENV
 proxy_config = ProxyConfig()
 async def config():
    router, model_list, general_settings = await proxy_config.load_config(
        router=None, config_file_path="./data/litellm/config.yaml"
    )
    await initialize(config="./data/litellm/config.yaml", telemetry=False)
 async def startup():
    await config()
@app.on_event("startup")
 async def on_startup():
    await startup()
@app.middleware("http")
 async def auth_middleware(request: Request, call_next):
    auth_header = request.headers.get("Authorization", "")
    if ENV != "dev":
        try:
            user = get_current_user(get_http_authorization_cred(auth_header))
            print(user)
        except Exception as e:
            return JSONResponse(status_code=400, content={"detail": str(e)})
    response = await call_next(request)
    return response
--- a/backend/apps/ollama/main.py
+++ b/backend/apps/ollama/main.py
@ -15,7 +15,7 @@ import asyncio
 from apps.web.models.users import Users
 from constants import ERROR_MESSAGES
 from utils.utils import decode_token, get_current_user, get_admin_user
-from config import OLLAMA_BASE_URLS
+from config import OLLAMA_BASE_URLS, MODEL_FILTER_ENABLED, MODEL_FILTER_LIST
 from typing import Optional, List, Union
@ -29,6 +29,10 @@ app.add_middleware(
    allow_headers=["*"],
 )
 app.state.MODEL_FILTER_ENABLED = MODEL_FILTER_ENABLED
 app.state.MODEL_FILTER_LIST = MODEL_FILTER_LIST
 app.state.OLLAMA_BASE_URLS = OLLAMA_BASE_URLS
 app.state.MODELS = {}
@ -129,9 +133,19 @@ async def get_all_models():
 async def get_ollama_tags(
    url_idx: Optional[int] = None, user=Depends(get_current_user)
 ):
    if url_idx == None:
-        return await get_all_models()
+        models = await get_all_models()
        if app.state.MODEL_FILTER_ENABLED:
            if user.role == "user":
                models["models"] = list(
                    filter(
                        lambda model: model["name"] in app.state.MODEL_FILTER_LIST,
                        models["models"],
                    )
                )
                return models
        return models
    else:
        url = app.state.OLLAMA_BASE_URLS[url_idx]
        try:
--- a/backend/apps/openai/main.py
+++ b/backend/apps/openai/main.py
@ -18,7 +18,13 @@ from utils.utils import (
    get_verified_user,
    get_admin_user,
 )
-from config import OPENAI_API_BASE_URLS, OPENAI_API_KEYS, CACHE_DIR
+from config import (
    OPENAI_API_BASE_URLS,
    OPENAI_API_KEYS,
    CACHE_DIR,
    MODEL_FILTER_ENABLED,
    MODEL_FILTER_LIST,
 )
 from typing import List, Optional
@ -34,6 +40,9 @@ app.add_middleware(
    allow_headers=["*"],
 )
 app.state.MODEL_FILTER_ENABLED = MODEL_FILTER_ENABLED
 app.state.MODEL_FILTER_LIST = MODEL_FILTER_LIST
 app.state.OPENAI_API_BASE_URLS = OPENAI_API_BASE_URLS
 app.state.OPENAI_API_KEYS = OPENAI_API_KEYS
@ -186,12 +195,21 @@ async def get_all_models():
    return models
 # , user=Depends(get_current_user)
@app.get("/models")
@app.get("/models/{url_idx}")
-async def get_models(url_idx: Optional[int] = None):
+async def get_models(url_idx: Optional[int] = None, user=Depends(get_current_user)):
    if url_idx == None:
-        return await get_all_models()
+        models = await get_all_models()
        if app.state.MODEL_FILTER_ENABLED:
            if user.role == "user":
                models["data"] = list(
                    filter(
                        lambda model: model["id"] in app.state.MODEL_FILTER_LIST,
                        models["data"],
                    )
                )
                return models
        return models
    else:
        url = app.state.OPENAI_API_BASE_URLS[url_idx]
        try:
--- a/backend/apps/rag/main.py
+++ b/backend/apps/rag/main.py
@ -44,6 +44,8 @@ from apps.web.models.documents import (
    DocumentResponse,
 )
 from apps.rag.utils import query_doc, query_collection
 from utils.misc import (
    calculate_sha256,
    calculate_sha256_string,
@ -75,6 +77,7 @@ from constants import ERROR_MESSAGES
 app = FastAPI()
 app.state.PDF_EXTRACT_IMAGES = False
 app.state.CHUNK_SIZE = CHUNK_SIZE
 app.state.CHUNK_OVERLAP = CHUNK_OVERLAP
 app.state.RAG_TEMPLATE = RAG_TEMPLATE
@ -182,12 +185,15 @@ async def update_embedding_model(
    }
-@app.get("/chunk")
+@app.get("/config")
-async def get_chunk_params(user=Depends(get_admin_user)):
+async def get_rag_config(user=Depends(get_admin_user)):
    return {
        "status": True,
        "pdf_extract_images": app.state.PDF_EXTRACT_IMAGES,
        "chunk": {
            "chunk_size": app.state.CHUNK_SIZE,
            "chunk_overlap": app.state.CHUNK_OVERLAP,
        },
    }
@ -196,17 +202,24 @@ class ChunkParamUpdateForm(BaseModel):
    chunk_overlap: int
-@app.post("/chunk/update")
+class ConfigUpdateForm(BaseModel):
-async def update_chunk_params(
+    pdf_extract_images: bool
-    form_data: ChunkParamUpdateForm, user=Depends(get_admin_user)
+    chunk: ChunkParamUpdateForm
-):
+
-    app.state.CHUNK_SIZE = form_data.chunk_size
+
-    app.state.CHUNK_OVERLAP = form_data.chunk_overlap
+@app.post("/config/update")
 async def update_rag_config(form_data: ConfigUpdateForm, user=Depends(get_admin_user)):
    app.state.PDF_EXTRACT_IMAGES = form_data.pdf_extract_images
    app.state.CHUNK_SIZE = form_data.chunk.chunk_size
    app.state.CHUNK_OVERLAP = form_data.chunk.chunk_overlap
    return {
        "status": True,
        "pdf_extract_images": app.state.PDF_EXTRACT_IMAGES,
        "chunk": {
            "chunk_size": app.state.CHUNK_SIZE,
            "chunk_overlap": app.state.CHUNK_OVERLAP,
        },
    }
@ -248,21 +261,18 @@ class QueryDocForm(BaseModel):
@app.post("/query/doc")
-def query_doc(
+def query_doc_handler(
    form_data: QueryDocForm,
    user=Depends(get_current_user),
 ):
    try:
-        # if you use docker use the model from the environment variable
+        return query_doc(
-        collection = CHROMA_CLIENT.get_collection(
+            collection_name=form_data.collection_name,
-            name=form_data.collection_name,
+            query=form_data.query,
            k=form_data.k if form_data.k else app.state.TOP_K,
            embedding_function=app.state.sentence_transformer_ef,
        )
        result = collection.query(
            query_texts=[form_data.query],
            n_results=form_data.k if form_data.k else app.state.TOP_K,
        )
        return result
    except Exception as e:
        print(e)
        raise HTTPException(
@ -277,78 +287,18 @@ class QueryCollectionsForm(BaseModel):
    k: Optional[int] = None
 def merge_and_sort_query_results(query_results, k):
    # Initialize lists to store combined data
    combined_ids = []
    combined_distances = []
    combined_metadatas = []
    combined_documents = []
    # Combine data from each dictionary
    for data in query_results:
        combined_ids.extend(data["ids"][0])
        combined_distances.extend(data["distances"][0])
        combined_metadatas.extend(data["metadatas"][0])
        combined_documents.extend(data["documents"][0])
    # Create a list of tuples (distance, id, metadata, document)
    combined = list(
        zip(combined_distances, combined_ids, combined_metadatas, combined_documents)
    )
    # Sort the list based on distances
    combined.sort(key=lambda x: x[0])
    # Unzip the sorted list
    sorted_distances, sorted_ids, sorted_metadatas, sorted_documents = zip(*combined)
    # Slicing the lists to include only k elements
    sorted_distances = list(sorted_distances)[:k]
    sorted_ids = list(sorted_ids)[:k]
    sorted_metadatas = list(sorted_metadatas)[:k]
    sorted_documents = list(sorted_documents)[:k]
    # Create the output dictionary
    merged_query_results = {
        "ids": [sorted_ids],
        "distances": [sorted_distances],
        "metadatas": [sorted_metadatas],
        "documents": [sorted_documents],
        "embeddings": None,
        "uris": None,
        "data": None,
    }
    return merged_query_results
@app.post("/query/collection")
-def query_collection(
+def query_collection_handler(
    form_data: QueryCollectionsForm,
    user=Depends(get_current_user),
 ):
-    results = []
+    return query_collection(
-
+        collection_names=form_data.collection_names,
-    for collection_name in form_data.collection_names:
+        query=form_data.query,
-        try:
+        k=form_data.k if form_data.k else app.state.TOP_K,
            # if you use docker use the model from the environment variable
            collection = CHROMA_CLIENT.get_collection(
                name=collection_name,
        embedding_function=app.state.sentence_transformer_ef,
    )
            result = collection.query(
                query_texts=[form_data.query],
                n_results=form_data.k if form_data.k else app.state.TOP_K,
            )
            results.append(result)
        except:
            pass
    return merge_and_sort_query_results(
        results, form_data.k if form_data.k else app.state.TOP_K
    )
@app.post("/web")
 def store_web(form_data: StoreWebForm, user=Depends(get_current_user)):
@ -425,7 +375,7 @@ def get_loader(filename: str, file_content_type: str, file_path: str):
    ]
    if file_ext == "pdf":
-        loader = PyPDFLoader(file_path, extract_images=True)
+        loader = PyPDFLoader(file_path, extract_images=app.state.PDF_EXTRACT_IMAGES)
    elif file_ext == "csv":
        loader = CSVLoader(file_path)
    elif file_ext == "rst":
--- a/backend/apps/rag/utils.py
+++ b/backend/apps/rag/utils.py
@ -0,0 +1,97 @@
 import re
 from typing import List
 from config import CHROMA_CLIENT
 def query_doc(collection_name: str, query: str, k: int, embedding_function):
    try:
        # if you use docker use the model from the environment variable
        collection = CHROMA_CLIENT.get_collection(
            name=collection_name,
            embedding_function=embedding_function,
        )
        result = collection.query(
            query_texts=[query],
            n_results=k,
        )
        return result
    except Exception as e:
        raise e
 def merge_and_sort_query_results(query_results, k):
    # Initialize lists to store combined data
    combined_ids = []
    combined_distances = []
    combined_metadatas = []
    combined_documents = []
    # Combine data from each dictionary
    for data in query_results:
        combined_ids.extend(data["ids"][0])
        combined_distances.extend(data["distances"][0])
        combined_metadatas.extend(data["metadatas"][0])
        combined_documents.extend(data["documents"][0])
    # Create a list of tuples (distance, id, metadata, document)
    combined = list(
        zip(combined_distances, combined_ids, combined_metadatas, combined_documents)
    )
    # Sort the list based on distances
    combined.sort(key=lambda x: x[0])
    # Unzip the sorted list
    sorted_distances, sorted_ids, sorted_metadatas, sorted_documents = zip(*combined)
    # Slicing the lists to include only k elements
    sorted_distances = list(sorted_distances)[:k]
    sorted_ids = list(sorted_ids)[:k]
    sorted_metadatas = list(sorted_metadatas)[:k]
    sorted_documents = list(sorted_documents)[:k]
    # Create the output dictionary
    merged_query_results = {
        "ids": [sorted_ids],
        "distances": [sorted_distances],
        "metadatas": [sorted_metadatas],
        "documents": [sorted_documents],
        "embeddings": None,
        "uris": None,
        "data": None,
    }
    return merged_query_results
 def query_collection(
    collection_names: List[str], query: str, k: int, embedding_function
 ):
    results = []
    for collection_name in collection_names:
        try:
            # if you use docker use the model from the environment variable
            collection = CHROMA_CLIENT.get_collection(
                name=collection_name,
                embedding_function=embedding_function,
            )
            result = collection.query(
                query_texts=[query],
                n_results=k,
            )
            results.append(result)
        except:
            pass
    return merge_and_sort_query_results(results, k)
 def rag_template(template: str, context: str, query: str):
    template = re.sub(r"\[context\]", context, template)
    template = re.sub(r"\[query\]", query, template)
    return template
--- a/backend/config.py
+++ b/backend/config.py
@ -251,7 +251,7 @@ OPENAI_API_BASE_URLS = (
    OPENAI_API_BASE_URLS if OPENAI_API_BASE_URLS != "" else OPENAI_API_BASE_URL
 )
-OPENAI_API_BASE_URLS = [url.strip() for url in OPENAI_API_BASE_URL.split(";")]
+OPENAI_API_BASE_URLS = [url.strip() for url in OPENAI_API_BASE_URLS.split(";")]
 ####################################
@ -292,6 +292,11 @@ DEFAULT_USER_ROLE = os.getenv("DEFAULT_USER_ROLE", "pending")
 USER_PERMISSIONS = {"chat": {"deletion": True}}
 MODEL_FILTER_ENABLED = os.environ.get("MODEL_FILTER_ENABLED", False)
 MODEL_FILTER_LIST = os.environ.get("MODEL_FILTER_LIST", "")
 MODEL_FILTER_LIST = [model.strip() for model in MODEL_FILTER_LIST.split(";")]
 ####################################
 # WEBUI_VERSION
 ####################################
--- a/backend/data/config.json
+++ b/backend/data/config.json
@ -1,4 +1,5 @@
 {
    "version": "0.0.1",
    "ui": {
        "prompt_suggestions": [
            {
--- a/backend/main.py
+++ b/backend/main.py
@ -9,28 +9,38 @@ import requests
 from fastapi import FastAPI, Request, Depends, status
 from fastapi.staticfiles import StaticFiles
 from fastapi import HTTPException
 from fastapi.responses import JSONResponse
 from fastapi.middleware.wsgi import WSGIMiddleware
 from fastapi.middleware.cors import CORSMiddleware
 from starlette.exceptions import HTTPException as StarletteHTTPException
 from starlette.middleware.base import BaseHTTPMiddleware
 from litellm.proxy.proxy_server import ProxyConfig, initialize
 from litellm.proxy.proxy_server import app as litellm_app
 from apps.ollama.main import app as ollama_app
 from apps.openai.main import app as openai_app
 from apps.litellm.main import app as litellm_app, startup as litellm_app_startup
 from apps.audio.main import app as audio_app
 from apps.images.main import app as images_app
 from apps.rag.main import app as rag_app
 from apps.web.main import app as webui_app
 from pydantic import BaseModel
 from typing import List
-from config import WEBUI_NAME, ENV, VERSION, CHANGELOG, FRONTEND_BUILD_DIR
+
 from utils.utils import get_admin_user
 from apps.rag.utils import query_doc, query_collection, rag_template
 from config import (
    WEBUI_NAME,
    ENV,
    VERSION,
    CHANGELOG,
    FRONTEND_BUILD_DIR,
    MODEL_FILTER_ENABLED,
    MODEL_FILTER_LIST,
 )
 from constants import ERROR_MESSAGES
 from utils.utils import get_http_authorization_cred, get_current_user
 class SPAStaticFiles(StaticFiles):
    async def get_response(self, path: str, scope):
@ -43,23 +53,11 @@ class SPAStaticFiles(StaticFiles):
                raise ex
 proxy_config = ProxyConfig()
 async def config():
    router, model_list, general_settings = await proxy_config.load_config(
        router=None, config_file_path="./data/litellm/config.yaml"
    )
    await initialize(config="./data/litellm/config.yaml", telemetry=False)
 async def startup():
    await config()
 app = FastAPI(docs_url="/docs" if ENV == "dev" else None, redoc_url=None)
 app.state.MODEL_FILTER_ENABLED = MODEL_FILTER_ENABLED
 app.state.MODEL_FILTER_LIST = MODEL_FILTER_LIST
 origins = ["*"]
 app.add_middleware(
@ -73,7 +71,127 @@ app.add_middleware(
@app.on_event("startup")
 async def on_startup():
-    await startup()
+    await litellm_app_startup()
 class RAGMiddleware(BaseHTTPMiddleware):
    async def dispatch(self, request: Request, call_next):
        if request.method == "POST" and (
            "/api/chat" in request.url.path or "/chat/completions" in request.url.path
        ):
            print(request.url.path)
            # Read the original request body
            body = await request.body()
            # Decode body to string
            body_str = body.decode("utf-8")
            # Parse string to JSON
            data = json.loads(body_str) if body_str else {}
            # Example: Add a new key-value pair or modify existing ones
            # data["modified"] = True  # Example modification
            if "docs" in data:
                docs = data["docs"]
                print(docs)
                last_user_message_idx = None
                for i in range(len(data["messages"]) - 1, -1, -1):
                    if data["messages"][i]["role"] == "user":
                        last_user_message_idx = i
                        break
                user_message = data["messages"][last_user_message_idx]
                if isinstance(user_message["content"], list):
                    # Handle list content input
                    content_type = "list"
                    query = ""
                    for content_item in user_message["content"]:
                        if content_item["type"] == "text":
                            query = content_item["text"]
                            break
                elif isinstance(user_message["content"], str):
                    # Handle text content input
                    content_type = "text"
                    query = user_message["content"]
                else:
                    # Fallback in case the input does not match expected types
                    content_type = None
                    query = ""
                relevant_contexts = []
                for doc in docs:
                    context = None
                    try:
                        if doc["type"] == "collection":
                            context = query_collection(
                                collection_names=doc["collection_names"],
                                query=query,
                                k=rag_app.state.TOP_K,
                                embedding_function=rag_app.state.sentence_transformer_ef,
                            )
                        else:
                            context = query_doc(
                                collection_name=doc["collection_name"],
                                query=query,
                                k=rag_app.state.TOP_K,
                                embedding_function=rag_app.state.sentence_transformer_ef,
                            )
                    except Exception as e:
                        print(e)
                        context = None
                    relevant_contexts.append(context)
                context_string = ""
                for context in relevant_contexts:
                    if context:
                        context_string += " ".join(context["documents"][0]) + "\n"
                ra_content = rag_template(
                    template=rag_app.state.RAG_TEMPLATE,
                    context=context_string,
                    query=query,
                )
                if content_type == "list":
                    new_content = []
                    for content_item in user_message["content"]:
                        if content_item["type"] == "text":
                            # Update the text item's content with ra_content
                            new_content.append({"type": "text", "text": ra_content})
                        else:
                            # Keep other types of content as they are
                            new_content.append(content_item)
                    new_user_message = {**user_message, "content": new_content}
                else:
                    new_user_message = {
                        **user_message,
                        "content": ra_content,
                    }
                data["messages"][last_user_message_idx] = new_user_message
                del data["docs"]
                print(data["messages"])
            modified_body_bytes = json.dumps(data).encode("utf-8")
            # Create a new request with the modified body
            scope = request.scope
            scope["body"] = modified_body_bytes
            request = Request(scope, receive=lambda: self._receive(modified_body_bytes))
        response = await call_next(request)
        return response
    async def _receive(self, body: bytes):
        return {"type": "http.request", "body": body, "more_body": False}
 app.add_middleware(RAGMiddleware)
@app.middleware("http")
@ -86,21 +204,6 @@ async def check_url(request: Request, call_next):
    return response
@litellm_app.middleware("http")
 async def auth_middleware(request: Request, call_next):
    auth_header = request.headers.get("Authorization", "")
    if ENV != "dev":
        try:
            user = get_current_user(get_http_authorization_cred(auth_header))
            print(user)
        except Exception as e:
            return JSONResponse(status_code=400, content={"detail": str(e)})
    response = await call_next(request)
    return response
 app.mount("/api/v1", webui_app)
 app.mount("/litellm/api", litellm_app)
@ -125,6 +228,39 @@ async def get_app_config():
    }
@app.get("/api/config/model/filter")
 async def get_model_filter_config(user=Depends(get_admin_user)):
    return {
        "enabled": app.state.MODEL_FILTER_ENABLED,
        "models": app.state.MODEL_FILTER_LIST,
    }
 class ModelFilterConfigForm(BaseModel):
    enabled: bool
    models: List[str]
@app.post("/api/config/model/filter")
 async def get_model_filter_config(
    form_data: ModelFilterConfigForm, user=Depends(get_admin_user)
 ):
    app.state.MODEL_FILTER_ENABLED = form_data.enabled
    app.state.MODEL_FILTER_LIST = form_data.models
    ollama_app.state.MODEL_FILTER_ENABLED = app.state.MODEL_FILTER_ENABLED
    ollama_app.state.MODEL_FILTER_LIST = app.state.MODEL_FILTER_LIST
    openai_app.state.MODEL_FILTER_ENABLED = app.state.MODEL_FILTER_ENABLED
    openai_app.state.MODEL_FILTER_LIST = app.state.MODEL_FILTER_LIST
    return {
        "enabled": app.state.MODEL_FILTER_ENABLED,
        "models": app.state.MODEL_FILTER_LIST,
    }
@app.get("/api/version")
 async def get_app_config():
@ -156,6 +292,7 @@ async def get_app_latest_release_version():
 app.mount("/static", StaticFiles(directory="static"), name="static")
 app.mount("/cache", StaticFiles(directory="data/cache"), name="cache")
 app.mount(
--- a/backend/requirements.txt
+++ b/backend/requirements.txt
@ -16,7 +16,8 @@ aiohttp
 peewee
 bcrypt
-litellm
+litellm==1.30.7
 argon2-cffi
 apscheduler
 google-generativeai
--- a/package.json
+++ b/package.json
@ -1,6 +1,6 @@
 {
 	"name": "open-webui",
-	"version": "0.1.110",
+	"version": "0.1.111",
 	"private": true,
 	"scripts": {
 		"dev": "vite dev --host",
--- a/src/lib/apis/images/index.ts
+++ b/src/lib/apis/images/index.ts
@ -1,9 +1,9 @@
 import { IMAGES_API_BASE_URL } from '$lib/constants';
-export const getImageGenerationEnabledStatus = async (token: string = '') => {
+export const getImageGenerationConfig = async (token: string = '') => {
 	let error = null;
-	const res = await fetch(`${IMAGES_API_BASE_URL}/enabled`, {
+	const res = await fetch(`${IMAGES_API_BASE_URL}/config`, {
 		method: 'GET',
 		headers: {
 			Accept: 'application/json',
@ -32,10 +32,50 @@ export const getImageGenerationEnabledStatus = async (token: string = '') => {
 	return res;
 };
-export const toggleImageGenerationEnabledStatus = async (token: string = '') => {
+export const updateImageGenerationConfig = async (
 	token: string = '',
 	engine: string,
 	enabled: boolean
 ) => {
 	let error = null;
-	const res = await fetch(`${IMAGES_API_BASE_URL}/enabled/toggle`, {
+	const res = await fetch(`${IMAGES_API_BASE_URL}/config/update`, {
 		method: 'POST',
 		headers: {
 			Accept: 'application/json',
 			'Content-Type': 'application/json',
 			...(token && { authorization: `Bearer ${token}` })
 		},
 		body: JSON.stringify({
 			engine,
 			enabled
 		})
 	})
 		.then(async (res) => {
 			if (!res.ok) throw await res.json();
 			return res.json();
 		})
 		.catch((err) => {
 			console.log(err);
 			if ('detail' in err) {
 				error = err.detail;
 			} else {
 				error = 'Server connection failed';
 			}
 			return null;
 		});
 	if (error) {
 		throw error;
 	}
 	return res;
 };
 export const getOpenAIKey = async (token: string = '') => {
 	let error = null;
 	const res = await fetch(`${IMAGES_API_BASE_URL}/key`, {
 		method: 'GET',
 		headers: {
 			Accept: 'application/json',
@ -61,7 +101,42 @@ export const toggleImageGenerationEnabledStatus = async (token: string = '') =>
 		throw error;
 	}
-	return res;
+	return res.OPENAI_API_KEY;
 };
 export const updateOpenAIKey = async (token: string = '', key: string) => {
 	let error = null;
 	const res = await fetch(`${IMAGES_API_BASE_URL}/key/update`, {
 		method: 'POST',
 		headers: {
 			Accept: 'application/json',
 			'Content-Type': 'application/json',
 			...(token && { authorization: `Bearer ${token}` })
 		},
 		body: JSON.stringify({
 			key: key
 		})
 	})
 		.then(async (res) => {
 			if (!res.ok) throw await res.json();
 			return res.json();
 		})
 		.catch((err) => {
 			console.log(err);
 			if ('detail' in err) {
 				error = err.detail;
 			} else {
 				error = 'Server connection failed';
 			}
 			return null;
 		});
 	if (error) {
 		throw error;
 	}
 	return res.OPENAI_API_KEY;
 };
 export const getAUTOMATIC1111Url = async (token: string = '') => {
@ -263,7 +338,7 @@ export const updateImageSteps = async (token: string = '', steps: number) => {
 	return res.IMAGE_STEPS;
 };
-export const getDiffusionModels = async (token: string = '') => {
+export const getImageGenerationModels = async (token: string = '') => {
 	let error = null;
 	const res = await fetch(`${IMAGES_API_BASE_URL}/models`, {
@ -295,7 +370,7 @@ export const getDiffusionModels = async (token: string = '') => {
 	return res;
 };
-export const getDefaultDiffusionModel = async (token: string = '') => {
+export const getDefaultImageGenerationModel = async (token: string = '') => {
 	let error = null;
 	const res = await fetch(`${IMAGES_API_BASE_URL}/models/default`, {
@ -327,7 +402,7 @@ export const getDefaultDiffusionModel = async (token: string = '') => {
 	return res.model;
 };
-export const updateDefaultDiffusionModel = async (token: string = '', model: string) => {
+export const updateDefaultImageGenerationModel = async (token: string = '', model: string) => {
 	let error = null;
 	const res = await fetch(`${IMAGES_API_BASE_URL}/models/default/update`, {
--- a/src/lib/apis/index.ts
+++ b/src/lib/apis/index.ts
@ -77,3 +77,65 @@ export const getVersionUpdates = async () => {
 	return res;
 };
 export const getModelFilterConfig = async (token: string) => {
 	let error = null;
 	const res = await fetch(`${WEBUI_BASE_URL}/api/config/model/filter`, {
 		method: 'GET',
 		headers: {
 			'Content-Type': 'application/json',
 			Authorization: `Bearer ${token}`
 		}
 	})
 		.then(async (res) => {
 			if (!res.ok) throw await res.json();
 			return res.json();
 		})
 		.catch((err) => {
 			console.log(err);
 			error = err;
 			return null;
 		});
 	if (error) {
 		throw error;
 	}
 	return res;
 };
 export const updateModelFilterConfig = async (
 	token: string,
 	enabled: boolean,
 	models: string[]
 ) => {
 	let error = null;
 	const res = await fetch(`${WEBUI_BASE_URL}/api/config/model/filter`, {
 		method: 'POST',
 		headers: {
 			'Content-Type': 'application/json',
 			Authorization: `Bearer ${token}`
 		},
 		body: JSON.stringify({
 			enabled: enabled,
 			models: models
 		})
 	})
 		.then(async (res) => {
 			if (!res.ok) throw await res.json();
 			return res.json();
 		})
 		.catch((err) => {
 			console.log(err);
 			error = err;
 			return null;
 		});
 	if (error) {
 		throw error;
 	}
 	return res;
 };
--- a/src/lib/apis/litellm/index.ts
+++ b/src/lib/apis/litellm/index.ts
@ -77,6 +77,7 @@ type AddLiteLLMModelForm = {
 	api_base: string;
 	api_key: string;
 	rpm: string;
 	max_tokens: string;
 };
 export const addLiteLLMModel = async (token: string = '', payload: AddLiteLLMModelForm) => {
@ -95,7 +96,8 @@ export const addLiteLLMModel = async (token: string = '', payload: AddLiteLLMMod
 				model: payload.model,
 				...(payload.api_base === '' ? {} : { api_base: payload.api_base }),
 				...(payload.api_key === '' ? {} : { api_key: payload.api_key }),
-				...(isNaN(parseInt(payload.rpm)) ? {} : { rpm: parseInt(payload.rpm) })
+				...(isNaN(parseInt(payload.rpm)) ? {} : { rpm: parseInt(payload.rpm) }),
 				...(payload.max_tokens === '' ? {} : { max_tokens: payload.max_tokens })
 			}
 		})
 	})
--- a/src/lib/apis/rag/index.ts
+++ b/src/lib/apis/rag/index.ts
@ -1,9 +1,9 @@
 import { RAG_API_BASE_URL } from '$lib/constants';
-export const getChunkParams = async (token: string) => {
+export const getRAGConfig = async (token: string) => {
 	let error = null;
-	const res = await fetch(`${RAG_API_BASE_URL}/chunk`, {
+	const res = await fetch(`${RAG_API_BASE_URL}/config`, {
 		method: 'GET',
 		headers: {
 			'Content-Type': 'application/json',
@ -27,18 +27,27 @@ export const getChunkParams = async (token: string) => {
 	return res;
 };
-export const updateChunkParams = async (token: string, size: number, overlap: number) => {
+type ChunkConfigForm = {
 	chunk_size: number;
 	chunk_overlap: number;
 };
 type RAGConfigForm = {
 	pdf_extract_images: boolean;
 	chunk: ChunkConfigForm;
 };
 export const updateRAGConfig = async (token: string, payload: RAGConfigForm) => {
 	let error = null;
-	const res = await fetch(`${RAG_API_BASE_URL}/chunk/update`, {
+	const res = await fetch(`${RAG_API_BASE_URL}/config/update`, {
 		method: 'POST',
 		headers: {
 			'Content-Type': 'application/json',
 			Authorization: `Bearer ${token}`
 		},
 		body: JSON.stringify({
-			chunk_size: size,
+			...payload
 			chunk_overlap: overlap
 		})
 	})
 		.then(async (res) => {
@ -252,7 +261,7 @@ export const queryCollection = async (
 	token: string,
 	collection_names: string,
 	query: string,
-	k: number
+	k: number | null = null
 ) => {
 	let error = null;
--- a/src/lib/components/admin/Settings/Users.svelte
+++ b/src/lib/components/admin/Settings/Users.svelte
@ -1,10 +1,14 @@
 <script lang="ts">
 	import { getModelFilterConfig, updateModelFilterConfig } from '$lib/apis';
 	import { getSignUpEnabledStatus, toggleSignUpEnabledStatus } from '$lib/apis/auths';
 	import { getUserPermissions, updateUserPermissions } from '$lib/apis/users';
 	import { models } from '$lib/stores';
 	import { onMount } from 'svelte';
 	export let saveHandler: Function;
 	let whitelistEnabled = false;
 	let whitelistModels = [''];
 	let permissions = {
 		chat: {
 			deletion: true
@ -13,6 +17,13 @@
 	onMount(async () => {
 		permissions = await getUserPermissions(localStorage.token);
 		const res = await getModelFilterConfig(localStorage.token);
 		if (res) {
 			whitelistEnabled = res.enabled;
 			whitelistModels = res.models.length > 0 ? res.models : [''];
 		}
 	});
 </script>
@ -21,6 +32,8 @@
 	on:submit|preventDefault={async () => {
 		// console.log('submit');
 		await updateUserPermissions(localStorage.token, permissions);
 		await updateModelFilterConfig(localStorage.token, whitelistEnabled, whitelistModels);
 		saveHandler();
 	}}
 >
@ -69,6 +82,106 @@
 				</button>
 			</div>
 		</div>
 		<hr class=" dark:border-gray-700 my-2" />
 		<div class="mt-2 space-y-3 pr-1.5">
 			<div>
 				<div class="mb-2">
 					<div class="flex justify-between items-center text-xs">
 						<div class=" text-sm font-medium">Manage Models</div>
 					</div>
 				</div>
 				<div class=" space-y-3">
 					<div>
 						<div class="flex justify-between items-center text-xs">
 							<div class=" text-xs font-medium">Model Whitelisting</div>
 							<button
 								class=" text-xs font-medium text-gray-500"
 								type="button"
 								on:click={() => {
 									whitelistEnabled = !whitelistEnabled;
 								}}>{whitelistEnabled ? 'On' : 'Off'}</button
 							>
 						</div>
 					</div>
 					{#if whitelistEnabled}
 						<div>
 							<div class=" space-y-1.5">
 								{#each whitelistModels as modelId, modelIdx}
 									<div class="flex w-full">
 										<div class="flex-1 mr-2">
 											<select
 												class="w-full rounded-lg py-2 px-4 text-sm dark:text-gray-300 dark:bg-gray-850 outline-none"
 												bind:value={modelId}
 												placeholder="Select a model"
 											>
 												<option value="" disabled selected>Select a model</option>
 												{#each $models.filter((model) => model.id) as model}
 													<option value={model.id} class="bg-gray-100 dark:bg-gray-700"
 														>{model.name}</option
 													>
 												{/each}
 											</select>
 										</div>
 										{#if modelIdx === 0}
 											<button
 												class="px-2.5 bg-gray-100 hover:bg-gray-200 text-gray-800 dark:bg-gray-900 dark:text-white rounded-lg transition"
 												type="button"
 												on:click={() => {
 													if (whitelistModels.at(-1) !== '') {
 														whitelistModels = [...whitelistModels, ''];
 													}
 												}}
 											>
 												<svg
 													xmlns="http://www.w3.org/2000/svg"
 													viewBox="0 0 16 16"
 													fill="currentColor"
 													class="w-4 h-4"
 												>
 													<path
 														d="M8.75 3.75a.75.75 0 0 0-1.5 0v3.5h-3.5a.75.75 0 0 0 0 1.5h3.5v3.5a.75.75 0 0 0 1.5 0v-3.5h3.5a.75.75 0 0 0 0-1.5h-3.5v-3.5Z"
 													/>
 												</svg>
 											</button>
 										{:else}
 											<button
 												class="px-2.5 bg-gray-100 hover:bg-gray-200 text-gray-800 dark:bg-gray-900 dark:text-white rounded-lg transition"
 												type="button"
 												on:click={() => {
 													whitelistModels.splice(modelIdx, 1);
 													whitelistModels = whitelistModels;
 												}}
 											>
 												<svg
 													xmlns="http://www.w3.org/2000/svg"
 													viewBox="0 0 16 16"
 													fill="currentColor"
 													class="w-4 h-4"
 												>
 													<path d="M3.75 7.25a.75.75 0 0 0 0 1.5h8.5a.75.75 0 0 0 0-1.5h-8.5Z" />
 												</svg>
 											</button>
 										{/if}
 									</div>
 								{/each}
 							</div>
 							<div class="flex justify-end items-center text-xs mt-1.5 text-right">
 								<div class=" text-xs font-medium">
 									{whitelistModels.length} Model(s) Whitelisted
 								</div>
 							</div>
 						</div>
 					{/if}
 				</div>
 			</div>
 		</div>
 	</div>
 	<div class="flex justify-end pt-3 text-sm font-medium">
--- a/src/lib/components/chat/MessageInput.svelte
+++ b/src/lib/components/chat/MessageInput.svelte
@ -19,7 +19,7 @@
 	export let suggestionPrompts = [];
 	export let autoScroll = true;
-	let chatTextAreaElement:HTMLTextAreaElement
+	let chatTextAreaElement: HTMLTextAreaElement;
 	let filesInputElement;
 	let promptsElement;
@ -359,12 +359,12 @@
 {#if dragged}
 	<div
-		class="fixed w-full h-full flex z-50 touch-none pointer-events-none"
+		class="fixed lg:w-[calc(100%-260px)] w-full h-full flex z-50 touch-none pointer-events-none"
 		id="dropzone"
 		role="region"
 		aria-label="Drag and Drop Container"
 	>
-		<div class="absolute rounded-xl w-full h-full backdrop-blur bg-gray-800/40 flex justify-center">
+		<div class="absolute w-full h-full backdrop-blur bg-gray-800/40 flex justify-center">
 			<div class="m-auto pt-64 flex flex-col justify-center">
 				<div class="max-w-md">
 					<AddFilesPlaceholder />
--- a/src/lib/components/chat/Messages/ResponseMessage.svelte
+++ b/src/lib/components/chat/Messages/ResponseMessage.svelte
@ -6,6 +6,7 @@
 	import auto_render from 'katex/dist/contrib/auto-render.mjs';
 	import 'katex/dist/katex.min.css';
 	import { fade } from 'svelte/transition';
 	import { createEventDispatcher } from 'svelte';
 	import { onMount, tick } from 'svelte';
@ -276,13 +277,15 @@
 	const generateImage = async (message) => {
 		generatingImage = true;
-		const res = await imageGenerations(localStorage.token, message.content);
+		const res = await imageGenerations(localStorage.token, message.content).catch((error) => {
 			toast.error(error);
 		});
 		console.log(res);
 		if (res) {
-			message.files = res.images.map((image) => ({
+			message.files = res.map((image) => ({
 				type: 'image',
-				url: `data:image/png;base64,${image}`
+				url: `${image.url}`
 			}));
 			dispatch('save', message);
@ -477,7 +480,7 @@
 													xmlns="http://www.w3.org/2000/svg"
 													fill="none"
 													viewBox="0 0 24 24"
-													stroke-width="1.5"
+													stroke-width="2"
 													stroke="currentColor"
 													class="w-4 h-4"
 												>
@ -503,7 +506,7 @@
 													xmlns="http://www.w3.org/2000/svg"
 													fill="none"
 													viewBox="0 0 24 24"
-													stroke-width="1.5"
+													stroke-width="2"
 													stroke="currentColor"
 													class="w-4 h-4"
 												>
@ -622,7 +625,7 @@
 														xmlns="http://www.w3.org/2000/svg"
 														fill="none"
 														viewBox="0 0 24 24"
-														stroke-width="1.5"
+														stroke-width="2"
 														stroke="currentColor"
 														class="w-4 h-4"
 													>
@ -637,7 +640,7 @@
 														xmlns="http://www.w3.org/2000/svg"
 														fill="none"
 														viewBox="0 0 24 24"
-														stroke-width="1.5"
+														stroke-width="2"
 														stroke="currentColor"
 														class="w-4 h-4"
 													>
@ -703,7 +706,7 @@
 															xmlns="http://www.w3.org/2000/svg"
 															fill="none"
 															viewBox="0 0 24 24"
-															stroke-width="1.5"
+															stroke-width="2"
 															stroke="currentColor"
 															class="w-4 h-4"
 														>
@ -733,7 +736,7 @@
 														xmlns="http://www.w3.org/2000/svg"
 														fill="none"
 														viewBox="0 0 24 24"
-														stroke-width="1.5"
+														stroke-width="2"
 														stroke="currentColor"
 														class="w-4 h-4"
 													>
@ -762,7 +765,7 @@
 														xmlns="http://www.w3.org/2000/svg"
 														fill="none"
 														viewBox="0 0 24 24"
-														stroke-width="1.5"
+														stroke-width="2"
 														stroke="currentColor"
 														class="w-4 h-4"
 													>
@ -792,7 +795,7 @@
 														xmlns="http://www.w3.org/2000/svg"
 														fill="none"
 														viewBox="0 0 24 24"
-														stroke-width="1.5"
+														stroke-width="2"
 														stroke="currentColor"
 														class="w-4 h-4"
 													>
--- a/src/lib/components/chat/Messages/UserMessage.svelte
+++ b/src/lib/components/chat/Messages/UserMessage.svelte
@ -258,7 +258,7 @@
 									xmlns="http://www.w3.org/2000/svg"
 									fill="none"
 									viewBox="0 0 24 24"
-									stroke-width="1.5"
+									stroke-width="2"
 									stroke="currentColor"
 									class="w-4 h-4"
 								>
@ -282,7 +282,7 @@
 									xmlns="http://www.w3.org/2000/svg"
 									fill="none"
 									viewBox="0 0 24 24"
-									stroke-width="1.5"
+									stroke-width="2"
 									stroke="currentColor"
 									class="w-4 h-4"
 								>
@ -307,7 +307,7 @@
 										xmlns="http://www.w3.org/2000/svg"
 										fill="none"
 										viewBox="0 0 24 24"
-										stroke-width="1.5"
+										stroke-width="2"
 										stroke="currentColor"
 										class="w-4 h-4"
 									>
--- a/src/lib/components/chat/Settings/Account.svelte
+++ b/src/lib/components/chat/Settings/Account.svelte
@ -271,7 +271,7 @@
 	<div class="flex justify-end pt-3 text-sm font-medium">
 		<button
-			class=" px-4 py-2 bg-emerald-600 hover:bg-emerald-700 text-gray-100 transition rounded"
+			class="  px-4 py-2 bg-emerald-700 hover:bg-emerald-800 text-gray-100 transition rounded-lg"
 			on:click={async () => {
 				const res = await submitHandler();
--- a/src/lib/components/chat/Settings/Audio.svelte
+++ b/src/lib/components/chat/Settings/Audio.svelte
@ -251,7 +251,7 @@
 	<div class="flex justify-end pt-3 text-sm font-medium">
 		<button
-			class=" px-4 py-2 bg-emerald-600 hover:bg-emerald-700 text-gray-100 transition rounded"
+			class=" px-4 py-2 bg-emerald-700 hover:bg-emerald-800 text-gray-100 transition rounded-lg"
 			type="submit"
 		>
 			Save
--- a/src/lib/components/chat/Settings/Connections.svelte
+++ b/src/lib/components/chat/Settings/Connections.svelte
@ -247,7 +247,7 @@
 	<div class="flex justify-end pt-3 text-sm font-medium">
 		<button
-			class=" px-4 py-2 bg-emerald-600 hover:bg-emerald-700 text-gray-100 transition rounded"
+			class="  px-4 py-2 bg-emerald-700 hover:bg-emerald-800 text-gray-100 transition rounded-lg"
 			type="submit"
 		>
 			Save
--- a/src/lib/components/chat/Settings/General.svelte
+++ b/src/lib/components/chat/Settings/General.svelte
@ -176,7 +176,7 @@
 			<div class=" my-2.5 text-sm font-medium">System Prompt</div>
 			<textarea
 				bind:value={system}
-				class="w-full rounded p-4 text-sm dark:text-gray-300 dark:bg-gray-800 outline-none resize-none"
+				class="w-full rounded-lg p-4 text-sm dark:text-gray-300 dark:bg-gray-850 outline-none resize-none"
 				rows="4"
 			/>
 		</div>
@ -262,7 +262,7 @@
 	<div class="flex justify-end pt-3 text-sm font-medium">
 		<button
-			class=" px-4 py-2 bg-emerald-600 hover:bg-emerald-700 text-gray-100 transition rounded"
+			class="  px-4 py-2 bg-emerald-700 hover:bg-emerald-800 text-gray-100 transition rounded-lg"
 			on:click={() => {
 				saveSettings({
 					system: system !== '' ? system : undefined,
--- a/src/lib/components/chat/Settings/Images.svelte
+++ b/src/lib/components/chat/Settings/Images.svelte
@ -5,16 +5,18 @@
 	import { config, user } from '$lib/stores';
 	import {
 		getAUTOMATIC1111Url,
-		getDefaultDiffusionModel,
+		getImageGenerationModels,
-		getDiffusionModels,
+		getDefaultImageGenerationModel,
-		getImageGenerationEnabledStatus,
+		updateDefaultImageGenerationModel,
 		getImageSize,
-		toggleImageGenerationEnabledStatus,
+		getImageGenerationConfig,
 		updateImageGenerationConfig,
 		updateAUTOMATIC1111Url,
 		updateDefaultDiffusionModel,
 		updateImageSize,
 		getImageSteps,
-		updateImageSteps
+		updateImageSteps,
 		getOpenAIKey,
 		updateOpenAIKey
 	} from '$lib/apis/images';
 	import { getBackendConfig } from '$lib/apis';
 	const dispatch = createEventDispatcher();
@ -23,8 +25,11 @@
 	let loading = false;
 	let imageGenerationEngine = '';
 	let enableImageGeneration = false;
 	let AUTOMATIC1111_BASE_URL = '';
 	let OPENAI_API_KEY = '';
 	let selectedModel = '';
 	let models = null;
@ -33,11 +38,11 @@
 	let steps = 50;
 	const getModels = async () => {
-		models = await getDiffusionModels(localStorage.token).catch((error) => {
+		models = await getImageGenerationModels(localStorage.token).catch((error) => {
 			toast.error(error);
 			return null;
 		});
-		selectedModel = await getDefaultDiffusionModel(localStorage.token).catch((error) => {
+		selectedModel = await getDefaultImageGenerationModel(localStorage.token).catch((error) => {
 			return '';
 		});
 	};
@ -62,33 +67,45 @@
 			AUTOMATIC1111_BASE_URL = await getAUTOMATIC1111Url(localStorage.token);
 		}
 	};
-	const toggleImageGeneration = async () => {
+	const updateImageGeneration = async () => {
-		if (AUTOMATIC1111_BASE_URL) {
+		const res = await updateImageGenerationConfig(
-			enableImageGeneration = await toggleImageGenerationEnabledStatus(localStorage.token).catch(
+			localStorage.token,
-				(error) => {
+			imageGenerationEngine,
 			enableImageGeneration
 		).catch((error) => {
 			toast.error(error);
-					return false;
+			return null;
 		});
 		if (res) {
 			imageGenerationEngine = res.engine;
 			enableImageGeneration = res.enabled;
 		}
 			);
 		if (enableImageGeneration) {
 			config.set(await getBackendConfig(localStorage.token));
 			getModels();
 		}
 		} else {
 			enableImageGeneration = false;
 			toast.error('AUTOMATIC1111_BASE_URL not provided');
 		}
 	};
 	onMount(async () => {
 		if ($user.role === 'admin') {
-			enableImageGeneration = await getImageGenerationEnabledStatus(localStorage.token);
+			const res = await getImageGenerationConfig(localStorage.token).catch((error) => {
-			AUTOMATIC1111_BASE_URL = await getAUTOMATIC1111Url(localStorage.token);
+				toast.error(error);
 				return null;
 			});
 			if (res) {
 				imageGenerationEngine = res.engine;
 				enableImageGeneration = res.enabled;
 			}
 			AUTOMATIC1111_BASE_URL = await getAUTOMATIC1111Url(localStorage.token);
 			OPENAI_API_KEY = await getOpenAIKey(localStorage.token);
 			if (enableImageGeneration && AUTOMATIC1111_BASE_URL) {
 			imageSize = await getImageSize(localStorage.token);
 			steps = await getImageSteps(localStorage.token);
 			if (enableImageGeneration) {
 				getModels();
 			}
 		}
@ -99,7 +116,11 @@
 	class="flex flex-col h-full justify-between space-y-3 text-sm"
 	on:submit|preventDefault={async () => {
 		loading = true;
-		await updateDefaultDiffusionModel(localStorage.token, selectedModel);
+		await updateOpenAIKey(localStorage.token, OPENAI_API_KEY);
 		await updateDefaultImageGenerationModel(localStorage.token, selectedModel);
 		await updateDefaultImageGenerationModel(localStorage.token, selectedModel);
 		await updateImageSize(localStorage.token, imageSize).catch((error) => {
 			toast.error(error);
 			return null;
@ -117,6 +138,23 @@
 		<div>
 			<div class=" mb-1 text-sm font-medium">Image Settings</div>
 			<div class=" py-0.5 flex w-full justify-between">
 				<div class=" self-center text-xs font-medium">Image Generation Engine</div>
 				<div class="flex items-center relative">
 					<select
 						class="w-fit pr-8 rounded px-2 p-1 text-xs bg-transparent outline-none text-right"
 						bind:value={imageGenerationEngine}
 						placeholder="Select a mode"
 						on:change={async () => {
 							await updateImageGeneration();
 						}}
 					>
 						<option value="">Default (Automatic1111)</option>
 						<option value="openai">Open AI (Dall-E)</option>
 					</select>
 				</div>
 			</div>
 			<div>
 				<div class=" py-0.5 flex w-full justify-between">
 					<div class=" self-center text-xs font-medium">Image Generation (Experimental)</div>
@ -124,7 +162,17 @@
 					<button
 						class="p-1 px-3 text-xs flex rounded transition"
 						on:click={() => {
-							toggleImageGeneration();
+							if (imageGenerationEngine === '' && AUTOMATIC1111_BASE_URL === '') {
 								toast.error('AUTOMATIC1111 Base URL is required.');
 								enableImageGeneration = false;
 							} else if (imageGenerationEngine === 'openai' && OPENAI_API_KEY === '') {
 								toast.error('OpenAI API Key is required.');
 								enableImageGeneration = false;
 							} else {
 								enableImageGeneration = !enableImageGeneration;
 							}
 							updateImageGeneration();
 						}}
 						type="button"
 					>
@ -139,17 +187,18 @@
 		</div>
 		<hr class=" dark:border-gray-700" />
 		{#if imageGenerationEngine === ''}
 			<div class=" mb-2.5 text-sm font-medium">AUTOMATIC1111 Base URL</div>
 			<div class="flex w-full">
 				<div class="flex-1 mr-2">
 					<input
-					class="w-full rounded py-2 px-4 text-sm dark:text-gray-300 dark:bg-gray-800 outline-none"
+						class="w-full rounded-lg py-2 px-4 text-sm dark:text-gray-300 dark:bg-gray-850 outline-none"
 						placeholder="Enter URL (e.g. http://127.0.0.1:7860/)"
 						bind:value={AUTOMATIC1111_BASE_URL}
 					/>
 				</div>
 				<button
-				class="px-3 bg-gray-200 hover:bg-gray-300 dark:bg-gray-600 dark:hover:bg-gray-700 rounded transition"
+					class="px-3 bg-gray-200 hover:bg-gray-300 dark:bg-gray-600 dark:hover:bg-gray-700 rounded-lg transition"
 					type="button"
 					on:click={() => {
 						// updateOllamaAPIUrlHandler();
@ -182,6 +231,18 @@
 					(e.g. `sh webui.sh --api`)
 				</a>
 			</div>
 		{:else if imageGenerationEngine === 'openai'}
 			<div class=" mb-2.5 text-sm font-medium">OpenAI API Key</div>
 			<div class="flex w-full">
 				<div class="flex-1 mr-2">
 					<input
 						class="w-full rounded-lg py-2 px-4 text-sm dark:text-gray-300 dark:bg-gray-850 outline-none"
 						placeholder="Enter API Key"
 						bind:value={OPENAI_API_KEY}
 					/>
 				</div>
 			</div>
 		{/if}
 		{#if enableImageGeneration}
 			<hr class=" dark:border-gray-700" />
@ -191,7 +252,7 @@
 				<div class="flex w-full">
 					<div class="flex-1 mr-2">
 						<select
-							class="w-full rounded py-2 px-4 text-sm dark:text-gray-300 dark:bg-gray-800 outline-none"
+							class="w-full rounded-lg py-2 px-4 text-sm dark:text-gray-300 dark:bg-gray-850 outline-none"
 							bind:value={selectedModel}
 							placeholder="Select a model"
 						>
@ -199,9 +260,7 @@
 								<option value="" disabled selected>Select a model</option>
 							{/if}
 							{#each models ?? [] as model}
-								<option value={model.title} class="bg-gray-100 dark:bg-gray-700"
+								<option value={model.id} class="bg-gray-100 dark:bg-gray-700">{model.name}</option>
 									>{model.model_name}</option
 								>
 							{/each}
 						</select>
 					</div>
@ -213,7 +272,7 @@
 				<div class="flex w-full">
 					<div class="flex-1 mr-2">
 						<input
-							class="w-full rounded py-2 px-4 text-sm dark:text-gray-300 dark:bg-gray-800 outline-none"
+							class="w-full rounded-lg py-2 px-4 text-sm dark:text-gray-300 dark:bg-gray-850 outline-none"
 							placeholder="Enter Image Size (e.g. 512x512)"
 							bind:value={imageSize}
 						/>
@ -226,7 +285,7 @@
 				<div class="flex w-full">
 					<div class="flex-1 mr-2">
 						<input
-							class="w-full rounded py-2 px-4 text-sm dark:text-gray-300 dark:bg-gray-800 outline-none"
+							class="w-full rounded-lg py-2 px-4 text-sm dark:text-gray-300 dark:bg-gray-850 outline-none"
 							placeholder="Enter Number of Steps (e.g. 50)"
 							bind:value={steps}
 						/>
@ -238,7 +297,7 @@
 	<div class="flex justify-end pt-3 text-sm font-medium">
 		<button
-			class=" px-4 py-2 bg-emerald-600 hover:bg-emerald-700 text-gray-100 transition rounded flex flex-row space-x-1 items-center {loading
+			class=" px-4 py-2 bg-emerald-700 hover:bg-emerald-800 text-gray-100 transition rounded-lg flex flex-row space-x-1 items-center {loading
 				? ' cursor-not-allowed'
 				: ''}"
 			type="submit"
--- a/src/lib/components/chat/Settings/Interface.svelte
+++ b/src/lib/components/chat/Settings/Interface.svelte
@ -63,6 +63,7 @@
 		}
 		saveSettings({
 			titleAutoGenerateModel: titleAutoGenerateModel !== '' ? titleAutoGenerateModel : undefined,
 			titleGenerationPrompt: titleGenerationPrompt ? titleGenerationPrompt : undefined
 		});
 	};
@ -186,7 +187,7 @@
 			<div class="flex w-full">
 				<div class="flex-1 mr-2">
 					<select
-						class="w-full rounded py-2 px-4 text-sm dark:text-gray-300 dark:bg-gray-800 outline-none"
+						class="w-full rounded-lg py-2 px-4 text-sm dark:text-gray-300 dark:bg-gray-850 outline-none"
 						bind:value={titleAutoGenerateModel}
 						placeholder="Select a model"
 					>
@ -200,35 +201,12 @@
 						{/each}
 					</select>
 				</div>
 				<button
 					class="px-3 bg-gray-200 hover:bg-gray-300 dark:bg-gray-700 dark:hover:bg-gray-800 dark:text-gray-100 rounded transition"
 					on:click={() => {
 						saveSettings({
 							titleAutoGenerateModel:
 								titleAutoGenerateModel !== '' ? titleAutoGenerateModel : undefined
 						});
 					}}
 					type="button"
 				>
 					<svg
 						xmlns="http://www.w3.org/2000/svg"
 						viewBox="0 0 16 16"
 						fill="currentColor"
 						class="w-3.5 h-3.5"
 					>
 						<path
 							fill-rule="evenodd"
 							d="M13.836 2.477a.75.75 0 0 1 .75.75v3.182a.75.75 0 0 1-.75.75h-3.182a.75.75 0 0 1 0-1.5h1.37l-.84-.841a4.5 4.5 0 0 0-7.08.932.75.75 0 0 1-1.3-.75 6 6 0 0 1 9.44-1.242l.842.84V3.227a.75.75 0 0 1 .75-.75Zm-.911 7.5A.75.75 0 0 1 13.199 11a6 6 0 0 1-9.44 1.241l-.84-.84v1.371a.75.75 0 0 1-1.5 0V9.591a.75.75 0 0 1 .75-.75H5.35a.75.75 0 0 1 0 1.5H3.98l.841.841a4.5 4.5 0 0 0 7.08-.932.75.75 0 0 1 1.025-.273Z"
 							clip-rule="evenodd"
 						/>
 					</svg>
 				</button>
 			</div>
-			<div class="mt-3">
+			<div class="mt-3 mr-2">
 				<div class=" mb-2.5 text-sm font-medium">Title Generation Prompt</div>
 				<textarea
 					bind:value={titleGenerationPrompt}
-					class="w-full rounded p-4 text-sm dark:text-gray-300 dark:bg-gray-800 outline-none resize-none"
+					class="w-full rounded-lg p-4 text-sm dark:text-gray-300 dark:bg-gray-850 outline-none resize-none"
 					rows="3"
 				/>
 			</div>
@ -321,7 +299,7 @@
 	<div class="flex justify-end pt-3 text-sm font-medium">
 		<button
-			class=" px-4 py-2 bg-emerald-600 hover:bg-emerald-700 text-gray-100 transition rounded"
+			class=" px-4 py-2 bg-emerald-700 hover:bg-emerald-800 text-gray-100 transition rounded-lg"
 			type="submit"
 		>
 			Save
--- a/src/lib/components/chat/Settings/Models.svelte
+++ b/src/lib/components/chat/Settings/Models.svelte
@ -14,6 +14,7 @@
 	import { splitStream } from '$lib/utils';
 	import { onMount } from 'svelte';
 	import { addLiteLLMModel, deleteLiteLLMModel, getLiteLLMModelInfo } from '$lib/apis/litellm';
 	import Tooltip from '$lib/components/common/Tooltip.svelte';
 	export let getModels: Function;
@ -27,6 +28,7 @@
 	let liteLLMAPIBase = '';
 	let liteLLMAPIKey = '';
 	let liteLLMRPM = '';
 	let liteLLMMaxTokens = '';
 	let deleteLiteLLMModelId = '';
@ -36,6 +38,10 @@
 	let OLLAMA_URLS = [];
 	let selectedOllamaUrlIdx: string | null = null;
 	let updateModelId = null;
 	let updateProgress = null;
 	let showExperimentalOllama = false;
 	let ollamaVersion = '';
 	const MAX_PARALLEL_DOWNLOADS = 3;
@ -60,6 +66,71 @@
 	let deleteModelTag = '';
 	const updateModelsHandler = async () => {
 		for (const model of $models.filter(
 			(m) =>
 				m.size != null &&
 				(selectedOllamaUrlIdx === null ? true : (m?.urls ?? []).includes(selectedOllamaUrlIdx))
 		)) {
 			console.log(model);
 			updateModelId = model.id;
 			const res = await pullModel(localStorage.token, model.id, selectedOllamaUrlIdx).catch(
 				(error) => {
 					toast.error(error);
 					return null;
 				}
 			);
 			if (res) {
 				const reader = res.body
 					.pipeThrough(new TextDecoderStream())
 					.pipeThrough(splitStream('\n'))
 					.getReader();
 				while (true) {
 					try {
 						const { value, done } = await reader.read();
 						if (done) break;
 						let lines = value.split('\n');
 						for (const line of lines) {
 							if (line !== '') {
 								let data = JSON.parse(line);
 								console.log(data);
 								if (data.error) {
 									throw data.error;
 								}
 								if (data.detail) {
 									throw data.detail;
 								}
 								if (data.status) {
 									if (data.digest) {
 										updateProgress = 0;
 										if (data.completed) {
 											updateProgress = Math.round((data.completed / data.total) * 1000) / 10;
 										} else {
 											updateProgress = 100;
 										}
 									} else {
 										toast.success(data.status);
 									}
 								}
 							}
 						}
 					} catch (error) {
 						console.log(error);
 					}
 				}
 			}
 		}
 		updateModelId = null;
 		updateProgress = null;
 	};
 	const pullModelHandler = async () => {
 		const sanitizedModelTag = modelTag.trim();
 		if (modelDownloadStatus[sanitizedModelTag]) {
@ -326,7 +397,8 @@
 				model: liteLLMModel,
 				api_base: liteLLMAPIBase,
 				api_key: liteLLMAPIKey,
-				rpm: liteLLMRPM
+				rpm: liteLLMRPM,
 				max_tokens: liteLLMMaxTokens
 			}).catch((error) => {
 				toast.error(error);
 				return null;
@ -346,6 +418,7 @@
 		liteLLMAPIBase = '';
 		liteLLMAPIKey = '';
 		liteLLMRPM = '';
 		liteLLMMaxTokens = '';
 		liteLLMModelInfo = await getLiteLLMModelInfo(localStorage.token);
 		models.set(await getModels());
@ -376,7 +449,7 @@
 			return [];
 		});
-		if (OLLAMA_URLS.length > 1) {
+		if (OLLAMA_URLS.length > 0) {
 			selectedOllamaUrlIdx = 0;
 		}
@ -391,7 +464,8 @@
 			<div class="space-y-2 pr-1.5">
 				<div class="text-sm font-medium">Manage Ollama Models</div>
-				{#if OLLAMA_URLS.length > 1}
+				{#if OLLAMA_URLS.length > 0}
 					<div class="flex gap-2">
 						<div class="flex-1 pb-1">
 							<select
 								class="w-full rounded-lg py-2 px-4 text-sm dark:text-gray-300 dark:bg-gray-850 outline-none"
@ -403,6 +477,38 @@
 								{/each}
 							</select>
 						</div>
 						<div>
 							<div class="flex w-full justify-end">
 								<Tooltip content="Update All Models" placement="top">
 									<button
 										class="p-2.5 flex gap-2 items-center bg-gray-100 hover:bg-gray-200 text-gray-800 dark:bg-gray-850 dark:hover:bg-gray-800 dark:text-gray-100 rounded-lg transition"
 										on:click={() => {
 											updateModelsHandler();
 										}}
 									>
 										<svg
 											xmlns="http://www.w3.org/2000/svg"
 											viewBox="0 0 16 16"
 											fill="currentColor"
 											class="w-4 h-4"
 										>
 											<path
 												d="M7 1a.75.75 0 0 1 .75.75V6h-1.5V1.75A.75.75 0 0 1 7 1ZM6.25 6v2.94L5.03 7.72a.75.75 0 0 0-1.06 1.06l2.5 2.5a.75.75 0 0 0 1.06 0l2.5-2.5a.75.75 0 1 0-1.06-1.06L7.75 8.94V6H10a2 2 0 0 1 2 2v3a2 2 0 0 1-2 2H4a2 2 0 0 1-2-2V8a2 2 0 0 1 2-2h2.25Z"
 											/>
 											<path
 												d="M4.268 14A2 2 0 0 0 6 15h6a2 2 0 0 0 2-2v-3a2 2 0 0 0-1-1.732V11a3 3 0 0 1-3 3H4.268Z"
 											/>
 										</svg>
 									</button>
 								</Tooltip>
 							</div>
 						</div>
 					</div>
 					{#if updateModelId}
 						Updating "{updateModelId}" {updateProgress ? `(${updateProgress}%)` : ''}
 					{/if}
 				{/if}
 				<div class="space-y-2">
@ -467,6 +573,7 @@
 							</button>
 						</div>
 						<div>
 							<div class="mt-2 mb-1 text-xs text-gray-400 dark:text-gray-500">
 								To access the available model names for downloading, <a
 									class=" text-gray-500 dark:text-gray-300 font-medium underline"
@ -474,6 +581,7 @@
 									target="_blank">click here.</a
 								>
 							</div>
 						</div>
 						{#if Object.keys(modelDownloadStatus).length > 0}
 							{#each Object.keys(modelDownloadStatus) as model}
@ -589,7 +697,7 @@
 												on:change={() => {
 													console.log(modelInputFile);
 												}}
-												accept=".gguf"
+												accept=".gguf,.safetensors"
 												required
 												hidden
 											/>
@ -722,8 +830,20 @@
 		<div class=" space-y-3">
 			<div class="mt-2 space-y-3 pr-1.5">
 				<div>
-					<div class=" mb-2 text-sm font-medium">Manage LiteLLM Models</div>
+					<div class="mb-2">
 						<div class="flex justify-between items-center text-xs">
 							<div class=" text-sm font-medium">Manage LiteLLM Models</div>
 							<button
 								class=" text-xs font-medium text-gray-500"
 								type="button"
 								on:click={() => {
 									showLiteLLM = !showLiteLLM;
 								}}>{showLiteLLM ? 'Hide' : 'Show'}</button
 							>
 						</div>
 					</div>
 					{#if showLiteLLM}
 						<div>
 							<div class="flex justify-between items-center text-xs">
 								<div class=" text-sm font-medium">Add a model</div>
@ -732,7 +852,8 @@
 									type="button"
 									on:click={() => {
 										showLiteLLMParams = !showLiteLLMParams;
-								}}>{showLiteLLMParams ? 'Hide Additional Params' : 'Show Additional Params'}</button
+									}}
 									>{showLiteLLMParams ? 'Hide Additional Params' : 'Show Additional Params'}</button
 								>
 							</div>
 						</div>
@ -823,6 +944,22 @@
 										</div>
 									</div>
 								</div>
 								<div>
 									<div class="mb-1.5 text-sm font-medium">Max Tokens</div>
 									<div class="flex w-full">
 										<div class="flex-1">
 											<input
 												class="w-full rounded-lg py-2 px-4 text-sm dark:text-gray-300 dark:bg-gray-850 outline-none"
 												placeholder="Enter Max Tokens (litellm_params.max_tokens)"
 												bind:value={liteLLMMaxTokens}
 												type="number"
 												min="1"
 												autocomplete="off"
 											/>
 										</div>
 									</div>
 								</div>
 							{/if}
 						</div>
@ -877,90 +1014,9 @@
 								</button>
 							</div>
 						</div>
 				</div>
 			</div>
 			<!-- <div class="mt-2 space-y-3 pr-1.5">
 				<div>
 					<div class=" mb-2.5 text-sm font-medium">Add LiteLLM Model</div>
 					<div class="flex w-full mb-2">
 						<div class="flex-1">
 							<input
 								class="w-full rounded py-2 px-4 text-sm dark:text-gray-300 dark:bg-gray-800 outline-none"
 								placeholder="Enter LiteLLM Model (e.g. ollama/mistral)"
 								bind:value={liteLLMModel}
 								autocomplete="off"
 							/>
 						</div>
 					</div>
 					<div class="flex justify-between items-center text-sm">
 						<div class="  font-medium">Advanced Model Params</div>
 						<button
 							class=" text-xs font-medium text-gray-500"
 							type="button"
 							on:click={() => {
 								showLiteLLMParams = !showLiteLLMParams;
 							}}>{showLiteLLMParams ? 'Hide' : 'Show'}</button
 						>
 					</div>
 					{#if showLiteLLMParams}
 						<div>
 							<div class=" mb-2.5 text-sm font-medium">LiteLLM API Key</div>
 							<div class="flex w-full">
 								<div class="flex-1">
 									<input
 										class="w-full rounded py-2 px-4 text-sm dark:text-gray-300 dark:bg-gray-800 outline-none"
 										placeholder="Enter LiteLLM API Key (e.g. os.environ/AZURE_API_KEY_CA)"
 										bind:value={liteLLMAPIKey}
 										autocomplete="off"
 									/>
 								</div>
 							</div>
 						</div>
 						<div>
 							<div class=" mb-2.5 text-sm font-medium">LiteLLM API Base URL</div>
 							<div class="flex w-full">
 								<div class="flex-1">
 									<input
 										class="w-full rounded py-2 px-4 text-sm dark:text-gray-300 dark:bg-gray-800 outline-none"
 										placeholder="Enter LiteLLM API Base URL"
 										bind:value={liteLLMAPIBase}
 										autocomplete="off"
 									/>
 								</div>
 							</div>
 						</div>
 						<div>
 							<div class=" mb-2.5 text-sm font-medium">LiteLLM API RPM</div>
 							<div class="flex w-full">
 								<div class="flex-1">
 									<input
 										class="w-full rounded py-2 px-4 text-sm dark:text-gray-300 dark:bg-gray-800 outline-none"
 										placeholder="Enter LiteLLM API RPM"
 										bind:value={liteLLMRPM}
 										autocomplete="off"
 									/>
 								</div>
 							</div>
 						</div>
 					{/if}
-
+				</div>
-					<div class="mt-2 text-xs text-gray-400 dark:text-gray-500">
+			</div>
 						Not sure what to add?
 						<a
 							class=" text-gray-300 font-medium underline"
 							href="https://litellm.vercel.app/docs/proxy/configs#quick-start"
 							target="_blank"
 						>
 							Click here for help.
 						</a>
 					</div>
 				</div>
 			</div> -->
 		</div>
 	</div>
 </div>
--- a/src/lib/components/chat/SettingsModal.svelte
+++ b/src/lib/components/chat/SettingsModal.svelte
@ -326,7 +326,7 @@
 						{getModels}
 						{saveSettings}
 						on:save={() => {
-							show = false;
+							toast.success('Settings saved successfully!');
 						}}
 					/>
 				{:else if selectedTab === 'models'}
@ -335,28 +335,28 @@
 					<Connections
 						{getModels}
 						on:save={() => {
-							show = false;
+							toast.success('Settings saved successfully!');
 						}}
 					/>
 				{:else if selectedTab === 'interface'}
 					<Interface
 						{saveSettings}
 						on:save={() => {
-							show = false;
+							toast.success('Settings saved successfully!');
 						}}
 					/>
 				{:else if selectedTab === 'audio'}
 					<Audio
 						{saveSettings}
 						on:save={() => {
-							show = false;
+							toast.success('Settings saved successfully!');
 						}}
 					/>
 				{:else if selectedTab === 'images'}
 					<Images
 						{saveSettings}
 						on:save={() => {
-							show = false;
+							toast.success('Settings saved successfully!');
 						}}
 					/>
 				{:else if selectedTab === 'chats'}
@ -364,7 +364,7 @@
 				{:else if selectedTab === 'account'}
 					<Account
 						saveHandler={() => {
-							show = false;
+							toast.success('Settings saved successfully!');
 						}}
 					/>
 				{:else if selectedTab === 'about'}
--- a/src/lib/components/common/Image.svelte
+++ b/src/lib/components/common/Image.svelte
@ -1,18 +1,23 @@
 <script lang="ts">
 	import { WEBUI_BASE_URL } from '$lib/constants';
 	import ImagePreview from './ImagePreview.svelte';
 	export let src = '';
 	export let alt = '';
 	let _src = '';
 	$: _src = src.startsWith('/') ? `${WEBUI_BASE_URL}${src}` : src;
 	let showImagePreview = false;
 </script>
-<ImagePreview bind:show={showImagePreview} {src} {alt} />
+<ImagePreview bind:show={showImagePreview} src={_src} {alt} />
 <button
 	on:click={() => {
 		console.log('image preview');
 		showImagePreview = true;
 	}}
 >
-	<img {src} {alt} class=" max-h-96 rounded-lg" draggable="false" />
+	<img src={_src} {alt} class=" max-h-96 rounded-lg" draggable="false" />
 </button>
--- a/src/lib/components/documents/Settings/General.svelte
+++ b/src/lib/components/documents/Settings/General.svelte
@ -1,10 +1,10 @@
 <script lang="ts">
 	import { getDocs } from '$lib/apis/documents';
 	import {
-		getChunkParams,
+		getRAGConfig,
 		updateRAGConfig,
 		getQuerySettings,
 		scanDocs,
 		updateChunkParams,
 		updateQuerySettings
 	} from '$lib/apis/rag';
 	import { documents } from '$lib/stores';
@ -17,6 +17,7 @@
 	let chunkSize = 0;
 	let chunkOverlap = 0;
 	let pdfExtractImages = true;
 	let querySettings = {
 		template: '',
@ -35,16 +36,24 @@
 	};
 	const submitHandler = async () => {
-		const res = await updateChunkParams(localStorage.token, chunkSize, chunkOverlap);
+		const res = await updateRAGConfig(localStorage.token, {
 			pdf_extract_images: pdfExtractImages,
 			chunk: {
 				chunk_overlap: chunkOverlap,
 				chunk_size: chunkSize
 			}
 		});
 		querySettings = await updateQuerySettings(localStorage.token, querySettings);
 	};
 	onMount(async () => {
-		const res = await getChunkParams(localStorage.token);
+		const res = await getRAGConfig(localStorage.token);
 		if (res) {
-			chunkSize = res.chunk_size;
+			pdfExtractImages = res.pdf_extract_images;
-			chunkOverlap = res.chunk_overlap;
+
 			chunkSize = res.chunk.chunk_size;
 			chunkOverlap = res.chunk.chunk_overlap;
 		}
 		querySettings = await getQuerySettings(localStorage.token);
@ -124,14 +133,15 @@
 		<hr class=" dark:border-gray-700" />
-		<div class=" ">
+		<div class=" space-y-3">
 			<div class=" space-y-3">
 				<div class=" text-sm font-medium">Chunk Params</div>
-			<div class=" flex">
+				<div class=" flex gap-2">
-				<div class="  flex w-full justify-between">
+					<div class="  flex w-full justify-between gap-2">
 						<div class="self-center text-xs font-medium min-w-fit">Chunk Size</div>
-					<div class="self-center p-3">
+						<div class="self-center">
 							<input
 								class=" w-full rounded py-1.5 px-4 text-sm dark:text-gray-300 dark:bg-gray-800 outline-none border border-gray-100 dark:border-gray-600"
 								type="number"
@ -143,10 +153,10 @@
 						</div>
 					</div>
-				<div class="flex w-full">
+					<div class="flex w-full gap-2">
 						<div class=" self-center text-xs font-medium min-w-fit">Chunk Overlap</div>
-					<div class="self-center p-3">
+						<div class="self-center">
 							<input
 								class="w-full rounded py-1.5 px-4 text-sm dark:text-gray-300 dark:bg-gray-800 outline-none border border-gray-100 dark:border-gray-600"
 								type="number"
@ -159,13 +169,29 @@
 					</div>
 				</div>
 				<div>
 					<div class="flex justify-between items-center text-xs">
 						<div class=" text-xs font-medium">PDF Extract Images (OCR)</div>
 						<button
 							class=" text-xs font-medium text-gray-500"
 							type="button"
 							on:click={() => {
 								pdfExtractImages = !pdfExtractImages;
 							}}>{pdfExtractImages ? 'On' : 'Off'}</button
 						>
 					</div>
 				</div>
 			</div>
 			<div>
 				<div class=" text-sm font-medium">Query Params</div>
-			<div class=" flex">
+				<div class=" flex py-2">
-				<div class="  flex w-full justify-between">
+					<div class="  flex w-full justify-between gap-2">
 						<div class="self-center text-xs font-medium flex-1">Top K</div>
-					<div class="self-center p-3">
+						<div class="self-center">
 							<input
 								class=" w-full rounded py-1.5 px-4 text-sm dark:text-gray-300 dark:bg-gray-800 outline-none border border-gray-100 dark:border-gray-600"
 								type="number"
@ -203,6 +229,7 @@
 				</div>
 			</div>
 		</div>
 	</div>
 	<div class="flex justify-end pt-3 text-sm font-medium">
 		<button
--- a/src/lib/components/layout/Sidebar.svelte
+++ b/src/lib/components/layout/Sidebar.svelte
@ -61,12 +61,16 @@
 	};
 	const editChatTitle = async (id, _title) => {
 		if (_title === '') {
 			toast.error('Title cannot be an empty string.');
 		} else {
 			title = _title;
 			await updateChatById(localStorage.token, id, {
 				title: _title
 			});
 			await chats.set(await getChatList(localStorage.token));
 		}
 	};
 	const deleteChat = async (id) => {
@ -388,12 +392,13 @@
 										show = false;
 									}
 								}}
 								draggable="false"
 							>
 								<div class=" flex self-center flex-1 w-full">
 									<div
 										class=" text-left self-center overflow-hidden {chat.id === $chatId
 											? 'w-[160px]'
-											: 'w-full'} "
+											: 'w-full'}  h-[20px]"
 									>
 										{chat.title}
 									</div>
--- a/src/routes/(app)/+page.svelte
+++ b/src/routes/(app)/+page.svelte
@ -232,53 +232,6 @@
 	const sendPrompt = async (prompt, parentId) => {
 		const _chatId = JSON.parse(JSON.stringify($chatId));
 		const docs = messages
 			.filter((message) => message?.files ?? null)
 			.map((message) =>
 				message.files.filter((item) => item.type === 'doc' || item.type === 'collection')
 			)
 			.flat(1);
 		console.log(docs);
 		if (docs.length > 0) {
 			processing = 'Reading';
 			const query = history.messages[parentId].content;
 			let relevantContexts = await Promise.all(
 				docs.map(async (doc) => {
 					if (doc.type === 'collection') {
 						return await queryCollection(localStorage.token, doc.collection_names, query).catch(
 							(error) => {
 								console.log(error);
 								return null;
 							}
 						);
 					} else {
 						return await queryDoc(localStorage.token, doc.collection_name, query).catch((error) => {
 							console.log(error);
 							return null;
 						});
 					}
 				})
 			);
 			relevantContexts = relevantContexts.filter((context) => context);
 			const contextString = relevantContexts.reduce((a, context, i, arr) => {
 				return `${a}${context.documents.join(' ')}\n`;
 			}, '');
 			console.log(contextString);
 			history.messages[parentId].raContent = await RAGTemplate(
 				localStorage.token,
 				contextString,
 				query
 			);
 			history.messages[parentId].contexts = relevantContexts;
 			await tick();
 			processing = '';
 		}
 		await Promise.all(
 			selectedModels.map(async (modelId) => {
 				const model = $models.filter((m) => m.id === modelId).at(0);
@ -342,15 +295,25 @@
 			...messages
 		]
 			.filter((message) => message)
-			.map((message, idx, arr) => ({
+			.map((message, idx, arr) => {
 				// Prepare the base message object
 				const baseMessage = {
 					role: message.role,
-				content: arr.length - 2 !== idx ? message.content : message?.raContent ?? message.content,
+					content: arr.length - 2 !== idx ? message.content : message?.raContent ?? message.content
-				...(message.files && {
+				};
-					images: message.files
+
-						.filter((file) => file.type === 'image')
+				// Extract and format image URLs if any exist
-						.map((file) => file.url.slice(file.url.indexOf(',') + 1))
+				const imageUrls = message.files
-				})
+					?.filter((file) => file.type === 'image')
-			}));
+					.map((file) => file.url.slice(file.url.indexOf(',') + 1));
 				// Add images array only if it contains elements
 				if (imageUrls && imageUrls.length > 0) {
 					baseMessage.images = imageUrls;
 				}
 				return baseMessage;
 			});
 		let lastImageIndex = -1;
@ -368,6 +331,13 @@
 			}
 		});
 		const docs = messages
 			.filter((message) => message?.files ?? null)
 			.map((message) =>
 				message.files.filter((item) => item.type === 'doc' || item.type === 'collection')
 			)
 			.flat(1);
 		const [res, controller] = await generateChatCompletion(localStorage.token, {
 			model: model,
 			messages: messagesBody,
@ -375,7 +345,8 @@
 				...($settings.options ?? {})
 			},
 			format: $settings.requestFormat ?? undefined,
-			keep_alive: $settings.keepAlive ?? undefined
+			keep_alive: $settings.keepAlive ?? undefined,
 			docs: docs.length > 0 ? docs : undefined
 		});
 		if (res && res.ok) {
@ -535,6 +506,15 @@
 		const responseMessage = history.messages[responseMessageId];
 		scrollToBottom();
 		const docs = messages
 			.filter((message) => message?.files ?? null)
 			.map((message) =>
 				message.files.filter((item) => item.type === 'doc' || item.type === 'collection')
 			)
 			.flat(1);
 		console.log(docs);
 		const res = await generateOpenAIChatCompletion(
 			localStorage.token,
 			{
@ -583,7 +563,8 @@
 				top_p: $settings?.options?.top_p ?? undefined,
 				num_ctx: $settings?.options?.num_ctx ?? undefined,
 				frequency_penalty: $settings?.options?.repeat_penalty ?? undefined,
-				max_tokens: $settings?.options?.num_predict ?? undefined
+				max_tokens: $settings?.options?.num_predict ?? undefined,
 				docs: docs.length > 0 ? docs : undefined
 			},
 			model.source === 'litellm' ? `${LITELLM_API_BASE_URL}/v1` : `${OPENAI_API_BASE_URL}`
 		);
@ -694,8 +675,13 @@
 		if (messages.length == 2) {
 			window.history.replaceState(history.state, '', `/c/${_chatId}`);
 			if ($settings?.titleAutoGenerateModel) {
 				await generateChatTitle(_chatId, userPrompt);
 			} else {
 				await setChatTitle(_chatId, userPrompt);
 			}
 		}
 	};
 	const stopResponse = () => {
--- a/src/routes/(app)/c/[id]/+page.svelte
+++ b/src/routes/(app)/c/[id]/+page.svelte
@ -245,53 +245,6 @@
 	const sendPrompt = async (prompt, parentId) => {
 		const _chatId = JSON.parse(JSON.stringify($chatId));
 		const docs = messages
 			.filter((message) => message?.files ?? null)
 			.map((message) =>
 				message.files.filter((item) => item.type === 'doc' || item.type === 'collection')
 			)
 			.flat(1);
 		console.log(docs);
 		if (docs.length > 0) {
 			processing = 'Reading';
 			const query = history.messages[parentId].content;
 			let relevantContexts = await Promise.all(
 				docs.map(async (doc) => {
 					if (doc.type === 'collection') {
 						return await queryCollection(localStorage.token, doc.collection_names, query).catch(
 							(error) => {
 								console.log(error);
 								return null;
 							}
 						);
 					} else {
 						return await queryDoc(localStorage.token, doc.collection_name, query).catch((error) => {
 							console.log(error);
 							return null;
 						});
 					}
 				})
 			);
 			relevantContexts = relevantContexts.filter((context) => context);
 			const contextString = relevantContexts.reduce((a, context, i, arr) => {
 				return `${a}${context.documents.join(' ')}\n`;
 			}, '');
 			console.log(contextString);
 			history.messages[parentId].raContent = await RAGTemplate(
 				localStorage.token,
 				contextString,
 				query
 			);
 			history.messages[parentId].contexts = relevantContexts;
 			await tick();
 			processing = '';
 		}
 		await Promise.all(
 			selectedModels.map(async (modelId) => {
 				const model = $models.filter((m) => m.id === modelId).at(0);
@ -355,15 +308,25 @@
 			...messages
 		]
 			.filter((message) => message)
-			.map((message, idx, arr) => ({
+			.map((message, idx, arr) => {
 				// Prepare the base message object
 				const baseMessage = {
 					role: message.role,
-				content: arr.length - 2 !== idx ? message.content : message?.raContent ?? message.content,
+					content: arr.length - 2 !== idx ? message.content : message?.raContent ?? message.content
-				...(message.files && {
+				};
-					images: message.files
+
-						.filter((file) => file.type === 'image')
+				// Extract and format image URLs if any exist
-						.map((file) => file.url.slice(file.url.indexOf(',') + 1))
+				const imageUrls = message.files
-				})
+					?.filter((file) => file.type === 'image')
-			}));
+					.map((file) => file.url.slice(file.url.indexOf(',') + 1));
 				// Add images array only if it contains elements
 				if (imageUrls && imageUrls.length > 0) {
 					baseMessage.images = imageUrls;
 				}
 				return baseMessage;
 			});
 		let lastImageIndex = -1;
@ -381,6 +344,13 @@
 			}
 		});
 		const docs = messages
 			.filter((message) => message?.files ?? null)
 			.map((message) =>
 				message.files.filter((item) => item.type === 'doc' || item.type === 'collection')
 			)
 			.flat(1);
 		const [res, controller] = await generateChatCompletion(localStorage.token, {
 			model: model,
 			messages: messagesBody,
@ -388,7 +358,8 @@
 				...($settings.options ?? {})
 			},
 			format: $settings.requestFormat ?? undefined,
-			keep_alive: $settings.keepAlive ?? undefined
+			keep_alive: $settings.keepAlive ?? undefined,
 			docs: docs.length > 0 ? docs : undefined
 		});
 		if (res && res.ok) {
@ -548,6 +519,15 @@
 		const responseMessage = history.messages[responseMessageId];
 		scrollToBottom();
 		const docs = messages
 			.filter((message) => message?.files ?? null)
 			.map((message) =>
 				message.files.filter((item) => item.type === 'doc' || item.type === 'collection')
 			)
 			.flat(1);
 		console.log(docs);
 		const res = await generateOpenAIChatCompletion(
 			localStorage.token,
 			{
@ -596,7 +576,8 @@
 				top_p: $settings?.options?.top_p ?? undefined,
 				num_ctx: $settings?.options?.num_ctx ?? undefined,
 				frequency_penalty: $settings?.options?.repeat_penalty ?? undefined,
-				max_tokens: $settings?.options?.num_predict ?? undefined
+				max_tokens: $settings?.options?.num_predict ?? undefined,
 				docs: docs.length > 0 ? docs : undefined
 			},
 			model.source === 'litellm' ? `${LITELLM_API_BASE_URL}/v1` : `${OPENAI_API_BASE_URL}`
 		);
@ -710,6 +691,7 @@
 			await setChatTitle(_chatId, userPrompt);
 		}
 	};
 	const stopResponse = () => {
 		stopResponseFlag = true;
 		console.log('stopResponse');
--- a/src/routes/(app)/playground/+page.svelte
+++ b/src/routes/(app)/playground/+page.svelte
@ -267,7 +267,7 @@
 <div class="min-h-screen max-h-[100dvh] w-full flex justify-center dark:text-white">
 	<div class=" flex flex-col justify-between w-full overflow-y-auto h-[100dvh]">
-		<div class="max-w-2xl mx-auto w-full px-3 p-3 md:px-0 h-full">
+		<div class="max-w-2xl mx-auto w-full px-3 md:px-0 my-10 h-full">
 			<div class=" flex flex-col h-full">
 				<div class="flex flex-col justify-between mb-2.5 gap-1">
 					<div class="flex justify-between items-center gap-2">