main.py 14.8 KB
Newer Older
Timothy J. Baek's avatar
Timothy J. Baek committed
1
2
from fastapi import FastAPI, Request, Response, HTTPException, Depends
from fastapi.middleware.cors import CORSMiddleware
Timothy J. Baek's avatar
Timothy J. Baek committed
3
from fastapi.responses import StreamingResponse, JSONResponse, FileResponse
Timothy J. Baek's avatar
Timothy J. Baek committed
4
5

import requests
Timothy J. Baek's avatar
Timothy J. Baek committed
6
7
import aiohttp
import asyncio
Timothy J. Baek's avatar
Timothy J. Baek committed
8
import json
9
import logging
Timothy J. Baek's avatar
Timothy J. Baek committed
10

Timothy J. Baek's avatar
Timothy J. Baek committed
11
12
from pydantic import BaseModel

13
14
from apps.webui.models.models import Models
from apps.webui.models.users import Users
Timothy J. Baek's avatar
Timothy J. Baek committed
15
from constants import ERROR_MESSAGES
Timothy J. Baek's avatar
Timothy J. Baek committed
16
17
18
19
20
21
from utils.utils import (
    decode_token,
    get_current_user,
    get_verified_user,
    get_admin_user,
)
22
from config import (
23
    SRC_LOG_LEVELS,
Timothy J. Baek's avatar
refac  
Timothy J. Baek committed
24
    ENABLE_OPENAI_API,
25
26
27
    OPENAI_API_BASE_URLS,
    OPENAI_API_KEYS,
    CACHE_DIR,
Timothy J. Baek's avatar
Timothy J. Baek committed
28
    ENABLE_MODEL_FILTER,
29
    MODEL_FILTER_LIST,
30
    AppConfig,
31
)
Timothy J. Baek's avatar
Timothy J. Baek committed
32
33
from typing import List, Optional

Timothy J. Baek's avatar
Timothy J. Baek committed
34
35
36

import hashlib
from pathlib import Path
Timothy J. Baek's avatar
Timothy J. Baek committed
37

38
39
40
# Module-level logger; its level is taken from the "OPENAI" entry of
# SRC_LOG_LEVELS (imported from config).
log = logging.getLogger(__name__)
log.setLevel(SRC_LOG_LEVELS["OPENAI"])

Timothy J. Baek's avatar
Timothy J. Baek committed
41
42
43
44
45
46
47
48
49
# FastAPI application that hosts every route defined in this module.
app = FastAPI()
# CORS is fully permissive here: any origin, method and header is accepted
# and credentials are allowed.
# NOTE(review): confirm that this wildcard policy is intended for this app.
app.add_middleware(
    CORSMiddleware,
    allow_origins=["*"],
    allow_credentials=True,
    allow_methods=["*"],
    allow_headers=["*"],
)

Timothy J. Baek's avatar
Timothy J. Baek committed
50

51
52
# Settings holder for this app; the attributes assigned on it in this module
# are read and overwritten by the route handlers.
# NOTE(review): AppConfig comes from the config module — its own behaviour
# (e.g. persistence) is not visible from this file.
app.state.config = AppConfig()

Timothy J. Baek's avatar
Timothy J. Baek committed
53
54
# Model filter settings, seeded from the config module. The "/models" handler
# uses them to restrict the list returned to users whose role is "user".
app.state.config.ENABLE_MODEL_FILTER = ENABLE_MODEL_FILTER
app.state.config.MODEL_FILTER_LIST = MODEL_FILTER_LIST
Timothy J. Baek's avatar
refac  
Timothy J. Baek committed
55
56

# Master switch, seeded from the config module; when falsy, get_all_models()
# returns an empty model list without contacting any upstream.
app.state.config.ENABLE_OPENAI_API = ENABLE_OPENAI_API
57
58
# Parallel lists: the handlers pair OPENAI_API_KEYS[i] with
# OPENAI_API_BASE_URLS[i] by using the same index for both.
app.state.config.OPENAI_API_BASE_URLS = OPENAI_API_BASE_URLS
app.state.config.OPENAI_API_KEYS = OPENAI_API_KEYS
Timothy J. Baek's avatar
Timothy J. Baek committed
59
60
61

# Cache of merged model entries keyed by model id; filled by get_all_models()
# and consulted by the proxy route to find a model's "urlIdx".
app.state.MODELS = {}

Timothy J. Baek's avatar
Timothy J. Baek committed
62

Timothy J. Baek's avatar
Timothy J. Baek committed
63
64
65
66
67
68
@app.middleware("http")
async def check_url(request: Request, call_next):
    """Populate the model cache on demand, then hand the request onwards.

    While ``app.state.MODELS`` is empty, every incoming request first awaits
    ``get_all_models()``; afterwards the request is passed to ``call_next``
    and its response is returned unchanged.
    """
    cache_is_empty = not app.state.MODELS
    if cache_is_empty:
        await get_all_models()

    return await call_next(request)
Timothy J. Baek's avatar
Timothy J. Baek committed
72
73


Timothy J. Baek's avatar
refac  
Timothy J. Baek committed
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
@app.get("/config")
async def get_config(user=Depends(get_admin_user)):
    """Return the current ``ENABLE_OPENAI_API`` setting.

    Access is gated by the ``get_admin_user`` dependency.
    """
    enabled = app.state.config.ENABLE_OPENAI_API
    return {"ENABLE_OPENAI_API": enabled}


# Request body for POST /config/update.
class OpenAIConfigForm(BaseModel):
    # New value for ENABLE_OPENAI_API; defaults to None when the field is omitted.
    enable_openai_api: Optional[bool] = None


@app.post("/config/update")
async def update_config(form_data: OpenAIConfigForm, user=Depends(get_admin_user)):
    """Store the submitted enable flag and echo the resulting setting.

    Access is gated by the ``get_admin_user`` dependency.
    """
    config = app.state.config
    # The submitted value is stored as-is, including None when the field
    # was omitted from the request body.
    config.ENABLE_OPENAI_API = form_data.enable_openai_api
    return {"ENABLE_OPENAI_API": config.ENABLE_OPENAI_API}


Timothy J. Baek's avatar
Timothy J. Baek committed
89
90
# Request body for POST /urls/update.
class UrlsUpdateForm(BaseModel):
    # Full replacement list for OPENAI_API_BASE_URLS.
    urls: List[str]
Timothy J. Baek's avatar
Timothy J. Baek committed
91
92


Timothy J. Baek's avatar
Timothy J. Baek committed
93
94
# Request body for POST /keys/update.
class KeysUpdateForm(BaseModel):
    # Full replacement list for OPENAI_API_KEYS.
    keys: List[str]
Timothy J. Baek's avatar
Timothy J. Baek committed
95
96


Timothy J. Baek's avatar
Timothy J. Baek committed
97
98
@app.get("/urls")
async def get_openai_urls(user=Depends(get_admin_user)):
    """Return the configured list of upstream base URLs.

    Access is gated by the ``get_admin_user`` dependency.
    """
    base_urls = app.state.config.OPENAI_API_BASE_URLS
    return {"OPENAI_API_BASE_URLS": base_urls}
100

Timothy J. Baek's avatar
Timothy J. Baek committed
101

Timothy J. Baek's avatar
Timothy J. Baek committed
102
103
@app.post("/urls/update")
async def update_openai_urls(form_data: UrlsUpdateForm, user=Depends(get_admin_user)):
    """Replace the configured base URLs, then refresh the model cache.

    The new list is stored *before* ``get_all_models()`` runs so that the
    cache is rebuilt from the URLs that were just submitted rather than from
    the ones being replaced.

    Access is gated by the ``get_admin_user`` dependency.

    Returns:
        A dict with the stored ``OPENAI_API_BASE_URLS`` list.
    """
    app.state.config.OPENAI_API_BASE_URLS = form_data.urls

    # The refresh is best-effort: get_all_models() indexes OPENAI_API_KEYS by
    # URL position, so it can fail while the key list has not yet been updated
    # to match. That must not turn a successful URL update into an error.
    try:
        await get_all_models()
    except Exception as e:
        log.exception(e)

    return {"OPENAI_API_BASE_URLS": app.state.config.OPENAI_API_BASE_URLS}
Timothy J. Baek's avatar
Timothy J. Baek committed
107
108


Timothy J. Baek's avatar
Timothy J. Baek committed
109
110
@app.get("/keys")
async def get_openai_keys(user=Depends(get_admin_user)):
    """Return the configured list of upstream API keys.

    Access is gated by the ``get_admin_user`` dependency.
    """
    api_keys = app.state.config.OPENAI_API_KEYS
    return {"OPENAI_API_KEYS": api_keys}
Timothy J. Baek's avatar
Timothy J. Baek committed
112
113
114
115


@app.post("/keys/update")
async def update_openai_key(form_data: KeysUpdateForm, user=Depends(get_admin_user)):
    """Replace the configured API keys and echo the stored list.

    Access is gated by the ``get_admin_user`` dependency.
    """
    config = app.state.config
    config.OPENAI_API_KEYS = form_data.keys
    return {"OPENAI_API_KEYS": config.OPENAI_API_KEYS}
Timothy J. Baek's avatar
Timothy J. Baek committed
118
119


Timothy J. Baek's avatar
Timothy J. Baek committed
120
@app.post("/audio/speech")
async def speech(request: Request, user=Depends(get_verified_user)):
    """Forward a speech request to api.openai.com, caching the audio on disk.

    The SHA-256 digest of the raw request body names two files under
    ``CACHE_DIR/audio/speech``: ``<digest>.mp3`` (the audio) and
    ``<digest>.json`` (a copy of the request). If the ``.mp3`` already exists
    it is returned directly; otherwise the body is POSTed to the upstream
    ``/audio/speech`` endpoint and the streamed result is stored first.

    Returns:
        A ``FileResponse`` for the cached ``.mp3``.

    Raises:
        HTTPException: 401 when "https://api.openai.com/v1" is not one of the
            configured base URLs; the upstream error status when the upstream
            call fails with one; 500 for any other failure.
    """
    import tempfile  # function-scope import: only this handler needs it

    # Only this lookup signals "OpenAI is not configured", so only it is
    # guarded by the ValueError handler.
    try:
        idx = app.state.config.OPENAI_API_BASE_URLS.index("https://api.openai.com/v1")
    except ValueError:
        raise HTTPException(status_code=401, detail=ERROR_MESSAGES.OPENAI_NOT_FOUND)

    body = await request.body()
    name = hashlib.sha256(body).hexdigest()

    speech_cache_dir = Path(CACHE_DIR).joinpath("./audio/speech/")
    speech_cache_dir.mkdir(parents=True, exist_ok=True)
    file_path = speech_cache_dir.joinpath(f"{name}.mp3")
    file_body_path = speech_cache_dir.joinpath(f"{name}.json")

    # Check if the file already exists in the cache
    if file_path.is_file():
        return FileResponse(file_path)

    headers = {
        "Authorization": f"Bearer {app.state.config.OPENAI_API_KEYS[idx]}",
        "Content-Type": "application/json",
    }

    r = None
    tmp_path = None
    try:
        r = requests.post(
            url=f"{app.state.config.OPENAI_API_BASE_URLS[idx]}/audio/speech",
            data=body,
            headers=headers,
            stream=True,
        )
        r.raise_for_status()

        # Stream into a temporary file and rename it into place afterwards, so
        # an interrupted download can never be served later as a cache hit.
        with tempfile.NamedTemporaryFile(
            dir=speech_cache_dir, suffix=".part", delete=False
        ) as tmp:
            tmp_path = Path(tmp.name)
            for chunk in r.iter_content(chunk_size=8192):
                tmp.write(chunk)
        tmp_path.replace(file_path)
        tmp_path = None  # ownership moved to file_path; nothing left to clean up

        with open(file_body_path, "w") as f:
            json.dump(json.loads(body.decode("utf-8")), f)

        # Return the saved file
        return FileResponse(file_path)

    except Exception as e:
        log.exception(e)
        error_detail = "Open WebUI: Server Connection Error"
        if r is not None:
            try:
                res = r.json()
                if "error" in res:
                    error_detail = f"External: {res['error']}"
            except Exception:
                error_detail = f"External: {e}"

        # A requests.Response is falsy for 4xx/5xx statuses, so it has to be
        # compared against None explicitly. The upstream status is only
        # propagated when it actually is an error status.
        raise HTTPException(
            status_code=r.status_code if r is not None and not r.ok else 500,
            detail=error_detail,
        )
    finally:
        if tmp_path is not None and tmp_path.exists():
            tmp_path.unlink()
        if r is not None:
            r.close()
Timothy J. Baek's avatar
Timothy J. Baek committed
182
183


Timothy J. Baek's avatar
Timothy J. Baek committed
184
async def fetch_url(url, key):
    """GET ``url`` with a bearer token and return the parsed JSON body.

    The request uses an aiohttp client timeout of 5 seconds in total. Any
    exception raised while connecting, reading or decoding is logged and
    reported to the caller as ``None``.
    """
    limit = aiohttp.ClientTimeout(total=5)
    try:
        auth_headers = {"Authorization": f"Bearer {key}"}
        async with aiohttp.ClientSession(timeout=limit) as session, session.get(
            url, headers=auth_headers
        ) as response:
            return await response.json()
    except Exception as e:
        # Handle connection error here
        log.error(f"Connection error: {e}")
        return None


def merge_models_lists(model_lists):
    """Flatten per-URL model lists into one list of annotated entries.

    ``model_lists[i]`` holds the models reported by the i-th configured base
    URL. Items that are ``None`` or contain ``"error"`` are skipped. For a
    base URL containing "api.openai.com", only models whose id contains
    "gpt" are kept. Each kept model is copied and extended with ``name``
    (falling back to its id), ``owned_by``, the original entry under
    ``openai`` and the index of its base URL under ``urlIdx``.
    """
    log.debug(f"merge_models_lists {model_lists}")

    merged = []
    for url_idx, entries in enumerate(model_lists):
        if entries is None or "error" in entries:
            continue

        for entry in entries:
            if (
                "api.openai.com" in app.state.config.OPENAI_API_BASE_URLS[url_idx]
                and "gpt" not in entry["id"]
            ):
                continue

            merged.append(
                {
                    **entry,
                    "name": entry.get("name", entry["id"]),
                    "owned_by": "openai",
                    "openai": entry,
                    "urlIdx": url_idx,
                }
            )

    return merged
Timothy J. Baek's avatar
Timothy J. Baek committed
220
221


Timothy J. Baek's avatar
Timothy J. Baek committed
222
async def get_all_models(raw: bool = False):
    """Query every configured base URL for its models and rebuild the cache.

    When the only configured key is an empty string, or the OpenAI API is
    disabled, ``{"data": []}`` is returned and nothing is fetched or cached.
    Otherwise ``<url>/models`` is fetched concurrently for every base URL.

    Args:
        raw: When true, return the list of per-URL responses as fetched,
            without merging them or touching the cache.

    Returns:
        ``{"data": [...]}`` with the merged model entries (also stored in
        ``app.state.MODELS`` keyed by id), or the raw responses if ``raw``.
    """
    log.info("get_all_models()")

    keys_unset = (
        len(app.state.config.OPENAI_API_KEYS) == 1
        and app.state.config.OPENAI_API_KEYS[0] == ""
    )
    if keys_unset or not app.state.config.ENABLE_OPENAI_API:
        return {"data": []}

    pending = [
        fetch_url(f"{url}/models", app.state.config.OPENAI_API_KEYS[idx])
        for idx, url in enumerate(app.state.config.OPENAI_API_BASE_URLS)
    ]
    responses = await asyncio.gather(*pending)
    log.debug(f"get_all_models:responses() {responses}")

    if raw:
        return responses

    def _model_list(response):
        # Accept {"data": [...]} wrappers as well as bare lists; anything
        # else is passed on as None.
        if response and "data" in response:
            return response["data"]
        if isinstance(response, list):
            return response
        return None

    models = {
        "data": merge_models_lists([_model_list(response) for response in responses])
    }

    log.debug(f"models: {models}")
    app.state.MODELS = {model["id"]: model for model in models["data"]}

    return models


Timothy J. Baek's avatar
Timothy J. Baek committed
263
264
@app.get("/models")
@app.get("/models/{url_idx}")
async def get_models(url_idx: Optional[int] = None, user=Depends(get_current_user)):
    """List models, either merged across all base URLs or for a single one.

    Args:
        url_idx: Index into the configured base URLs. When omitted, the merged
            list from ``get_all_models()`` is returned; if the model filter is
            enabled and the caller's role is "user", that list is reduced to
            the ids in ``MODEL_FILTER_LIST``.
        user: The caller, resolved by the ``get_current_user`` dependency.

    Returns:
        The merged ``{"data": [...]}`` dict, or the JSON returned by
        ``<url>/models`` for the selected base URL (restricted to ids
        containing "gpt" when that URL contains "api.openai.com").

    Raises:
        HTTPException: with the upstream error status when the single-URL
            request fails with one, otherwise 500.
    """
    if url_idx is None:
        models = await get_all_models()
        if app.state.config.ENABLE_MODEL_FILTER and user.role == "user":
            allowed_ids = app.state.config.MODEL_FILTER_LIST
            models["data"] = [
                model for model in models["data"] if model["id"] in allowed_ids
            ]
        return models

    url = app.state.config.OPENAI_API_BASE_URLS[url_idx]
    key = app.state.config.OPENAI_API_KEYS[url_idx]

    headers = {
        "Authorization": f"Bearer {key}",
        "Content-Type": "application/json",
    }

    r = None
    try:
        r = requests.request(method="GET", url=f"{url}/models", headers=headers)
        r.raise_for_status()

        response_data = r.json()
        if "api.openai.com" in url:
            response_data["data"] = [
                model for model in response_data["data"] if "gpt" in model["id"]
            ]

        return response_data
    except Exception as e:
        log.exception(e)
        error_detail = "Open WebUI: Server Connection Error"
        if r is not None:
            try:
                res = r.json()
                if "error" in res:
                    error_detail = f"External: {res['error']}"
            except Exception:
                error_detail = f"External: {e}"

        # A requests.Response is falsy for 4xx/5xx statuses, so it has to be
        # compared against None explicitly. The upstream status is only
        # propagated when it actually is an error status.
        raise HTTPException(
            status_code=r.status_code if r is not None and not r.ok else 500,
            detail=error_detail,
        )
Timothy J. Baek's avatar
Timothy J. Baek committed
314
315


Timothy J. Baek's avatar
Timothy J. Baek committed
316
def _apply_model_params(payload, params):
    """Copy the stored generation parameters from ``params`` into ``payload``."""
    # Fractional parameters must be cast with float(); int() would truncate
    # e.g. 0.7 to 0. None and "" are treated as "not configured", while an
    # explicit 0 is a legitimate value and is forwarded.
    for key in ("temperature", "top_p", "frequency_penalty"):
        value = params.get(key)
        if value is None or value == "":
            continue
        payload[key] = float(value)

    if params.get("max_tokens"):
        payload["max_tokens"] = int(params["max_tokens"])

    if params.get("seed"):
        payload["seed"] = params["seed"]

    if params.get("stop"):
        # Turn escape sequences typed literally (e.g. "\\n") into the
        # characters they denote.
        payload["stop"] = [
            bytes(stop, "utf-8").decode("unicode_escape") for stop in params["stop"]
        ]


def _apply_system_prompt(payload, system):
    """Prepend ``system`` to the first system message, or insert one at the front."""
    messages = payload.get("messages")
    if not messages:
        return

    for message in messages:
        if message.get("role") == "system":
            message["content"] = system + message["content"]
            return

    messages.insert(0, {"role": "system", "content": system})


def _iter_and_close(r):
    """Yield the upstream body in chunks and close the response afterwards."""
    try:
        yield from r.iter_content(chunk_size=8192)
    finally:
        r.close()


@app.api_route("/{path:path}", methods=["GET", "POST", "PUT", "DELETE"])
async def proxy(path: str, request: Request, user=Depends(get_verified_user)):
    """Forward an arbitrary request to one of the configured upstream APIs.

    For paths containing "chat/completions" the JSON body is rewritten before
    forwarding: a model record found via ``Models.get_model_by_id`` may swap
    in its base model id, override generation parameters and add a system
    prompt; the upstream is then chosen from the cached model's ``urlIdx``.
    All other requests go to the first configured base URL with their body
    untouched.

    Returns:
        A ``StreamingResponse`` when the upstream answers with
        ``text/event-stream``, otherwise the decoded upstream JSON.

    Raises:
        HTTPException: 404 when a chat completion names a model that is not in
            the model cache; the upstream error status when the upstream call
            fails with one; 500 for any other failure.
    """
    idx = 0

    body = await request.body()
    # TODO: Remove below after gpt-4-vision fix from Open AI
    # Try to decode the body of the request from bytes to a UTF-8 string (Require add max_token to fix gpt-4-vision)

    payload = None

    try:
        if "chat/completions" in path:
            body_json = json.loads(body.decode("utf-8"))
            payload = {**body_json}

            model_info = Models.get_model_by_id(body_json.get("model"))
            if model_info:
                log.debug("model_info: %s", model_info)
                if model_info.base_model_id:
                    payload["model"] = model_info.base_model_id

                params = model_info.params.model_dump()
                _apply_model_params(payload, params)
                if params.get("system"):
                    _apply_system_prompt(payload, params["system"])

            model_id = payload.get("model")
            model = app.state.MODELS.get(model_id)
            if model is None:
                # An unknown id used to surface as an unhandled KeyError.
                raise HTTPException(
                    status_code=404, detail=f"Model not found: {model_id}"
                )

            idx = model["urlIdx"]

            if model.get("pipeline"):
                payload["user"] = {"name": user.name, "id": user.id}

            # Check if the model is "gpt-4-vision-preview" and set "max_tokens" to 4000
            # This is a workaround until OpenAI fixes the issue with this model
            if payload.get("model") == "gpt-4-vision-preview":
                if "max_tokens" not in payload:
                    payload["max_tokens"] = 4000
                log.debug("Modified payload: %s", payload)

            # Convert the modified body back to JSON
            payload = json.dumps(payload)

    except json.JSONDecodeError as e:
        # The original bytes in ``body`` are forwarded unchanged in this case.
        log.error("Error loading request body into a dictionary: %s", e)

    log.debug("proxy payload: %s", payload)

    url = app.state.config.OPENAI_API_BASE_URLS[idx]
    key = app.state.config.OPENAI_API_KEYS[idx]

    target_url = f"{url}/{path}"

    headers = {
        "Authorization": f"Bearer {key}",
        "Content-Type": "application/json",
    }

    r = None

    try:
        r = requests.request(
            method=request.method,
            url=target_url,
            data=payload if payload else body,
            headers=headers,
            stream=True,
        )

        r.raise_for_status()

        # Check if response is SSE
        if "text/event-stream" in r.headers.get("Content-Type", ""):
            return StreamingResponse(
                _iter_and_close(r),
                status_code=r.status_code,
                headers=dict(r.headers),
            )

        return r.json()
    except Exception as e:
        log.exception(e)
        error_detail = "Open WebUI: Server Connection Error"
        if r is not None:
            try:
                res = r.json()
                log.debug("upstream error response: %s", res)
                if "error" in res:
                    error = res["error"]
                    # The error may be a structured object or a plain string.
                    if isinstance(error, dict) and "message" in error:
                        error = error["message"]
                    error_detail = f"External: {error}"
            except Exception:
                error_detail = f"External: {e}"

        # A requests.Response is falsy for 4xx/5xx statuses, so it has to be
        # compared against None explicitly. The upstream status is only
        # propagated when it actually is an error status.
        raise HTTPException(
            status_code=r.status_code if r is not None and not r.ok else 500,
            detail=error_detail,
        )