refac: ollama gguf upload

2024-03-21 23:45:00 -07:00 · 2024-03-21 23:45:00 -07:00 · af4caec4f5
commit af4caec4f5
parent c54fb92263
4 changed files with 268 additions and 176 deletions
--- a/backend/apps/ollama/main.py
+++ b/backend/apps/ollama/main.py
@ -1,23 +1,39 @@
-from fastapi import FastAPI, Request, Response, HTTPException, Depends, status
+from fastapi import (
    FastAPI,
    Request,
    Response,
    HTTPException,
    Depends,
    status,
    UploadFile,
    File,
    BackgroundTasks,
 )
 from fastapi.middleware.cors import CORSMiddleware
 from fastapi.responses import StreamingResponse
 from fastapi.concurrency import run_in_threadpool
 from pydantic import BaseModel, ConfigDict
 import os
 import random
 import requests
 import json
 import uuid
 import aiohttp
 import asyncio
 import aiofiles
 from urllib.parse import urlparse
 from typing import Optional, List, Union
 from apps.web.models.users import Users
 from constants import ERROR_MESSAGES
 from utils.utils import decode_token, get_current_user, get_admin_user
-from config import OLLAMA_BASE_URLS, MODEL_FILTER_ENABLED, MODEL_FILTER_LIST
+from utils.misc import calculate_sha256
-from typing import Optional, List, Union
+
 from config import OLLAMA_BASE_URLS, MODEL_FILTER_ENABLED, MODEL_FILTER_LIST, UPLOAD_DIR
 app = FastAPI()
@ -897,6 +913,170 @@ async def generate_openai_chat_completion(
        )
 class UrlForm(BaseModel):
    url: str
 class UploadBlobForm(BaseModel):
    filename: str
 def parse_huggingface_url(hf_url):
    try:
        # Parse the URL
        parsed_url = urlparse(hf_url)
        # Get the path and split it into components
        path_components = parsed_url.path.split("/")
        # Extract the desired output
        user_repo = "/".join(path_components[1:3])
        model_file = path_components[-1]
        return model_file
    except ValueError:
        return None
 async def download_file_stream(
    ollama_url, file_url, file_path, file_name, chunk_size=1024 * 1024
 ):
    done = False
    if os.path.exists(file_path):
        current_size = os.path.getsize(file_path)
    else:
        current_size = 0
    headers = {"Range": f"bytes={current_size}-"} if current_size > 0 else {}
    timeout = aiohttp.ClientTimeout(total=600)  # Set the timeout
    async with aiohttp.ClientSession(timeout=timeout) as session:
        async with session.get(file_url, headers=headers) as response:
            total_size = int(response.headers.get("content-length", 0)) + current_size
            with open(file_path, "ab+") as file:
                async for data in response.content.iter_chunked(chunk_size):
                    current_size += len(data)
                    file.write(data)
                    done = current_size == total_size
                    progress = round((current_size / total_size) * 100, 2)
                    yield f'data: {{"progress": {progress}, "completed": {current_size}, "total": {total_size}}}\n\n'
                if done:
                    file.seek(0)
                    hashed = calculate_sha256(file)
                    file.seek(0)
                    url = f"{ollama_url}/api/blobs/sha256:{hashed}"
                    response = requests.post(url, data=file)
                    if response.ok:
                        res = {
                            "done": done,
                            "blob": f"sha256:{hashed}",
                            "name": file_name,
                        }
                        os.remove(file_path)
                        yield f"data: {json.dumps(res)}\n\n"
                    else:
                        raise "Ollama: Could not create blob, Please try again."
 # url = "https://huggingface.co/TheBloke/stablelm-zephyr-3b-GGUF/resolve/main/stablelm-zephyr-3b.Q2_K.gguf"
@app.post("/models/download")
@app.post("/models/download/{url_idx}")
 async def download_model(
    form_data: UrlForm,
    url_idx: Optional[int] = None,
 ):
    if url_idx == None:
        url_idx = 0
    url = app.state.OLLAMA_BASE_URLS[url_idx]
    file_name = parse_huggingface_url(form_data.url)
    if file_name:
        file_path = f"{UPLOAD_DIR}/{file_name}"
        return StreamingResponse(
            download_file_stream(url, form_data.url, file_path, file_name)
        )
    else:
        return None
@app.post("/models/upload")
@app.post("/models/upload/{url_idx}")
 def upload_model(file: UploadFile = File(...), url_idx: Optional[int] = None):
    if url_idx == None:
        url_idx = 0
    ollama_url = app.state.OLLAMA_BASE_URLS[url_idx]
    file_path = f"{UPLOAD_DIR}/{file.filename}"
    # Save file in chunks
    with open(file_path, "wb+") as f:
        for chunk in file.file:
            f.write(chunk)
    def file_process_stream():
        nonlocal ollama_url
        total_size = os.path.getsize(file_path)
        chunk_size = 1024 * 1024
        try:
            with open(file_path, "rb") as f:
                total = 0
                done = False
                while not done:
                    chunk = f.read(chunk_size)
                    if not chunk:
                        done = True
                        continue
                    total += len(chunk)
                    progress = round((total / total_size) * 100, 2)
                    res = {
                        "progress": progress,
                        "total": total_size,
                        "completed": total,
                    }
                    yield f"data: {json.dumps(res)}\n\n"
                if done:
                    f.seek(0)
                    hashed = calculate_sha256(f)
                    f.seek(0)
                    url = f"{ollama_url}/blobs/sha256:{hashed}"
                    response = requests.post(url, data=f)
                    if response.ok:
                        res = {
                            "done": done,
                            "blob": f"sha256:{hashed}",
                            "name": file.filename,
                        }
                        os.remove(file_path)
                        yield f"data: {json.dumps(res)}\n\n"
                    else:
                        raise Exception(
                            "Ollama: Could not create blob, Please try again."
                        )
        except Exception as e:
            res = {"error": str(e)}
            yield f"data: {json.dumps(res)}\n\n"
    return StreamingResponse(file_process_stream(), media_type="text/event-stream")
@app.api_route("/{path:path}", methods=["GET", "POST", "PUT", "DELETE"])
 async def deprecated_proxy(path: str, request: Request, user=Depends(get_current_user)):
    url = app.state.OLLAMA_BASE_URLS[0]
--- a/backend/apps/web/routers/utils.py
+++ b/backend/apps/web/routers/utils.py
@ -21,155 +21,6 @@ from constants import ERROR_MESSAGES
 router = APIRouter()
 class UploadBlobForm(BaseModel):
    filename: str
 from urllib.parse import urlparse
 def parse_huggingface_url(hf_url):
    try:
        # Parse the URL
        parsed_url = urlparse(hf_url)
        # Get the path and split it into components
        path_components = parsed_url.path.split("/")
        # Extract the desired output
        user_repo = "/".join(path_components[1:3])
        model_file = path_components[-1]
        return model_file
    except ValueError:
        return None
 async def download_file_stream(url, file_path, file_name, chunk_size=1024 * 1024):
    done = False
    if os.path.exists(file_path):
        current_size = os.path.getsize(file_path)
    else:
        current_size = 0
    headers = {"Range": f"bytes={current_size}-"} if current_size > 0 else {}
    timeout = aiohttp.ClientTimeout(total=600)  # Set the timeout
    async with aiohttp.ClientSession(timeout=timeout) as session:
        async with session.get(url, headers=headers) as response:
            total_size = int(response.headers.get("content-length", 0)) + current_size
            with open(file_path, "ab+") as file:
                async for data in response.content.iter_chunked(chunk_size):
                    current_size += len(data)
                    file.write(data)
                    done = current_size == total_size
                    progress = round((current_size / total_size) * 100, 2)
                    yield f'data: {{"progress": {progress}, "completed": {current_size}, "total": {total_size}}}\n\n'
                if done:
                    file.seek(0)
                    hashed = calculate_sha256(file)
                    file.seek(0)
                    url = f"{OLLAMA_BASE_URLS[0]}/api/blobs/sha256:{hashed}"
                    response = requests.post(url, data=file)
                    if response.ok:
                        res = {
                            "done": done,
                            "blob": f"sha256:{hashed}",
                            "name": file_name,
                        }
                        os.remove(file_path)
                        yield f"data: {json.dumps(res)}\n\n"
                    else:
                        raise "Ollama: Could not create blob, Please try again."
@router.get("/download")
 async def download(
    url: str,
 ):
    # url = "https://huggingface.co/TheBloke/stablelm-zephyr-3b-GGUF/resolve/main/stablelm-zephyr-3b.Q2_K.gguf"
    file_name = parse_huggingface_url(url)
    if file_name:
        file_path = f"{UPLOAD_DIR}/{file_name}"
        return StreamingResponse(
            download_file_stream(url, file_path, file_name),
            media_type="text/event-stream",
        )
    else:
        return None
@router.post("/upload")
 def upload(file: UploadFile = File(...)):
    file_path = f"{UPLOAD_DIR}/{file.filename}"
    # Save file in chunks
    with open(file_path, "wb+") as f:
        for chunk in file.file:
            f.write(chunk)
    def file_process_stream():
        total_size = os.path.getsize(file_path)
        chunk_size = 1024 * 1024
        try:
            with open(file_path, "rb") as f:
                total = 0
                done = False
                while not done:
                    chunk = f.read(chunk_size)
                    if not chunk:
                        done = True
                        continue
                    total += len(chunk)
                    progress = round((total / total_size) * 100, 2)
                    res = {
                        "progress": progress,
                        "total": total_size,
                        "completed": total,
                    }
                    yield f"data: {json.dumps(res)}\n\n"
                if done:
                    f.seek(0)
                    hashed = calculate_sha256(f)
                    f.seek(0)
                    url = f"{OLLAMA_BASE_URLS[0]}/blobs/sha256:{hashed}"
                    response = requests.post(url, data=f)
                    if response.ok:
                        res = {
                            "done": done,
                            "blob": f"sha256:{hashed}",
                            "name": file.filename,
                        }
                        os.remove(file_path)
                        yield f"data: {json.dumps(res)}\n\n"
                    else:
                        raise Exception(
                            "Ollama: Could not create blob, Please try again."
                        )
        except Exception as e:
            res = {"error": str(e)}
            yield f"data: {json.dumps(res)}\n\n"
    return StreamingResponse(file_process_stream(), media_type="text/event-stream")
@router.get("/gravatar")
 async def get_gravatar(
    email: str,
--- a/src/lib/apis/ollama/index.ts
+++ b/src/lib/apis/ollama/index.ts
@ -390,6 +390,71 @@ export const pullModel = async (token: string, tagName: string, urlIdx: string |
 	return res;
 };
 export const downloadModel = async (
 	token: string,
 	download_url: string,
 	urlIdx: string | null = null
 ) => {
 	let error = null;
 	const res = await fetch(
 		`${OLLAMA_API_BASE_URL}/models/download${urlIdx !== null ? `/${urlIdx}` : ''}`,
 		{
 			method: 'POST',
 			headers: {
 				Authorization: `Bearer ${token}`
 			},
 			body: JSON.stringify({
 				url: download_url
 			})
 		}
 	).catch((err) => {
 		console.log(err);
 		error = err;
 		if ('detail' in err) {
 			error = err.detail;
 		}
 		return null;
 	});
 	if (error) {
 		throw error;
 	}
 	return res;
 };
 export const uploadModel = async (token: string, file: File, urlIdx: string | null = null) => {
 	let error = null;
 	const formData = new FormData();
 	formData.append('file', file);
 	const res = await fetch(
 		`${OLLAMA_API_BASE_URL}/models/upload${urlIdx !== null ? `/${urlIdx}` : ''}`,
 		{
 			method: 'POST',
 			headers: {
 				Authorization: `Bearer ${token}`
 			},
 			body: formData
 		}
 	).catch((err) => {
 		console.log(err);
 		error = err;
 		if ('detail' in err) {
 			error = err.detail;
 		}
 		return null;
 	});
 	if (error) {
 		throw error;
 	}
 	return res;
 };
 // export const pullModel = async (token: string, tagName: string) => {
 // 	return await fetch(`${OLLAMA_API_BASE_URL}/pull`, {
 // 		method: 'POST',
--- a/src/lib/components/chat/Settings/Models.svelte
+++ b/src/lib/components/chat/Settings/Models.svelte
@ -5,9 +5,11 @@
 	import {
 		createModel,
 		deleteModel,
 		downloadModel,
 		getOllamaUrls,
 		getOllamaVersion,
-		pullModel
+		pullModel,
 		uploadModel
 	} from '$lib/apis/ollama';
 	import { WEBUI_API_BASE_URL, WEBUI_BASE_URL } from '$lib/constants';
 	import { WEBUI_NAME, models, user } from '$lib/stores';
@ -60,7 +62,7 @@
 	let pullProgress = null;
 	let modelUploadMode = 'file';
-	let modelInputFile = '';
+	let modelInputFile: File[] | null = null;
 	let modelFileUrl = '';
 	let modelFileContent = `TEMPLATE """{{ .System }}\nUSER: {{ .Prompt }}\nASSISTANT: """\nPARAMETER num_ctx 4096\nPARAMETER stop "</s>"\nPARAMETER stop "USER:"\nPARAMETER stop "ASSISTANT:"`;
 	let modelFileDigest = '';
@ -191,30 +193,23 @@
 		let name = '';
 		if (modelUploadMode === 'file') {
-			const file = modelInputFile[0];
+			const file = modelInputFile ? modelInputFile[0] : null;
 			const formData = new FormData();
 			formData.append('file', file);
-			fileResponse = await fetch(`${WEBUI_API_BASE_URL}/utils/upload`, {
+			if (file) {
-				method: 'POST',
+				fileResponse = uploadModel(localStorage.token, file, selectedOllamaUrlIdx).catch(
-				headers: {
+					(error) => {
-					...($user && { Authorization: `Bearer ${localStorage.token}` })
+						toast.error(error);
-				},
+						return null;
-				body: formData
+					}
-			}).catch((error) => {
+				);
-				console.log(error);
+			}
 				return null;
 			});
 		} else {
-			fileResponse = await fetch(`${WEBUI_API_BASE_URL}/utils/download?url=${modelFileUrl}`, {
+			fileResponse = downloadModel(localStorage.token, modelFileUrl, selectedOllamaUrlIdx).catch(
-				method: 'GET',
+				(error) => {
-				headers: {
+					toast.error(error);
-					...($user && { Authorization: `Bearer ${localStorage.token}` })
+					return null;
 				}
-			}).catch((error) => {
+			);
 				console.log(error);
 				return null;
 			});
 		}
 		if (fileResponse && fileResponse.ok) {
@ -318,7 +313,8 @@
 		}
 		modelFileUrl = '';
-		modelInputFile = '';
+		modelUploadInputElement.value = '';
 		modelInputFile = null;
 		modelTransferring = false;
 		uploadProgress = null;