2024-01-07 14:59:22 +08:00
import os
import chromadb
2024-01-07 17:40:36 +08:00
from chromadb import Settings
2023-11-19 08:47:12 +08:00
from base64 import b64encode
2024-02-24 09:12:19 +08:00
from bs4 import BeautifulSoup
2024-01-07 17:40:36 +08:00
from pathlib import Path
2024-02-20 10:54:22 +08:00
import json
2024-02-25 14:35:11 +08:00
import yaml
2024-02-23 16:36:53 +08:00
import markdown
2024-02-24 09:12:19 +08:00
import requests
import shutil
from secrets import token_bytes
from constants import ERROR_MESSAGES
2024-02-20 10:54:22 +08:00
2024-01-07 17:40:36 +08:00
2024-01-20 04:12:14 +08:00
# python-dotenv is optional: when it is importable, load the .env file that
# find_dotenv locates; when it is not, report that and carry on.
try:
    from dotenv import find_dotenv, load_dotenv

    load_dotenv(
        find_dotenv(" ../.env "),
    )
except ImportError:
    print(" dotenv not installed, skipping... ")
2023-11-15 08:28:51 +08:00
2024-02-24 09:12:19 +08:00
WEBUI_NAME = " Open WebUI "
2024-02-24 09:24:46 +08:00
shutil . copyfile ( " ../build/favicon.png " , " ./static/favicon.png " )
2024-01-07 17:40:36 +08:00
2024-01-25 16:40:19 +08:00
# ENV (dev,test,prod)
2024-01-07 17:40:36 +08:00
2024-01-25 16:40:19 +08:00
ENV = os . environ . get ( " ENV " , " dev " )
2024-01-07 17:40:36 +08:00
2024-02-23 16:30:26 +08:00
# Read the package metadata (and from it the version) from package.json,
# falling back to a placeholder version when the file cannot be read or parsed.
# NOTE(review): the path, key and fallback literals keep the padding spaces
# shown in the reviewed text — confirm them against the real file. The open()
# mode is written as "r" because a padded mode string is rejected by open().
try:
    with open(" ../package.json ", "r") as f:
        PACKAGE_DATA = json.load(f)
except Exception:
    # Best-effort: any read/parse failure selects the fallback, but unlike a
    # bare ``except`` this lets KeyboardInterrupt/SystemExit propagate.
    PACKAGE_DATA = {" version ": " 0.0.0 "}

VERSION = PACKAGE_DATA[" version "]
2024-02-23 16:36:53 +08:00
# Function to parse each section
def parse_section(section):
    """Convert the list items of one changelog section into dictionaries.

    Args:
        section: Parsed list element providing ``find_all``; each item it
            yields must support ``str()`` and
            ``get_text(separator=..., strip=...)``. May be ``None`` (the
            caller passes the result of ``find_next_sibling``).

    Returns:
        A list with one dict per item holding its title, content and raw
        markup. The item text is split on the first separator; without a
        separator the whole text becomes the content and the title is the
        fallback value. An empty list is returned when ``section`` is ``None``.
    """
    # NOTE(review): the string literals below keep the padding spaces shown in
    # the reviewed text — confirm them against the real file.
    if section is None:
        # A heading with no list after it has no items; this used to raise
        # AttributeError on ``None.find_all``.
        return []

    items = []
    for li in section.find_all(" li "):
        # Extract raw HTML string
        raw_html = str(li)

        # Extract text without HTML tags
        text = li.get_text(separator=" ", strip=True)

        # Split into title and content on the first separator only
        head, separator, tail = text.partition(" : ")
        if separator:
            title, content = head.strip(), tail.strip()
        else:
            title, content = " ", text

        items.append({" title ": title, " content ": content, " raw ": raw_html})
    return items
# Build CHANGELOG: a mapping from version number to that release's date and
# sections, parsed from CHANGELOG.md after rendering it through Markdown.
# NOTE(review): the path, tag names, parser name and separators keep the
# padding spaces shown in the reviewed text — confirm them against the real
# file. The open() mode is written as "r" because a padded mode string is
# rejected by open().
try:
    with open(" ../CHANGELOG.md ", "r") as file:
        changelog_content = file.read()
except Exception:
    # Best-effort: an unreadable changelog falls back to placeholder content,
    # but unlike a bare ``except`` KeyboardInterrupt/SystemExit propagate.
    changelog_content = " "

# Convert markdown content to HTML
html_content = markdown.markdown(changelog_content)

# Parse the HTML content
soup = BeautifulSoup(html_content, " html.parser ")

# Initialize JSON structure
changelog_json = {}

# Iterate over each version
for version in soup.find_all(" h2 "):
    # Split the heading text once instead of re-parsing it per field.
    heading_parts = version.get_text().strip().split(" - ")
    version_number = heading_parts[0][1:-1]  # Remove brackets
    # A heading without a date part used to raise IndexError and abort the
    # import of this module; fall back to an empty date instead.
    date = heading_parts[1] if len(heading_parts) > 1 else ""

    version_data = {" date ": date}

    # Walk the following siblings until the next version heading
    current = version.find_next_sibling()
    while current and current.name != " h2 ":
        if current.name == " h3 ":
            section_title = current.get_text().lower()  # e.g., "added", "fixed"
            section_list = current.find_next_sibling(" ul ")
            # A section heading with no list after it simply has no items.
            section_items = (
                parse_section(section_list) if section_list is not None else []
            )
            version_data[section_title] = section_items

        # Move to the next element
        current = current.find_next_sibling()

    changelog_json[version_number] = version_data

CHANGELOG = changelog_json
2024-02-24 09:12:19 +08:00
CUSTOM_NAME = os . environ . get ( " CUSTOM_NAME " , " " )
2024-02-24 09:36:38 +08:00
# Request the custom entry for CUSTOM_NAME from api.openwebui.com; on a
# successful response, optionally download its logo over the favicon file and
# take WEBUI_NAME from the response.
try :
r = requests . get ( f " https://api.openwebui.com/api/v1/custom/ { CUSTOM_NAME } " )
# The body is decoded before the status check, so a body that cannot be
# decoded raises here and is handled by the except clause below.
data = r . json ( )
if r . ok :
if " logo " in data :
# Logo values that pass the first-character check are prefixed with the API
# host; any other value is used unchanged as the download URL.
# NOTE(review): the closing parenthesis of this expression is not visible in
# the reviewed text — confirm against the real file.
url = (
f " https://api.openwebui.com { data [ ' logo ' ] } "
if data [ " logo " ] [ 0 ] == " / "
else data [ " logo " ]
r = requests . get ( url , stream = True )
if r . status_code == 200 :
with open ( " ./static/favicon.png " , " wb " ) as f :
# Stream the raw response body straight into the favicon file.
r . raw . decode_content = True
shutil . copyfileobj ( r . raw , f )
# NOTE(review): nesting cannot be recovered from the flattened text — confirm
# whether the name is applied for every successful response or only when a
# logo is present.
WEBUI_NAME = data [ " name " ]
except Exception as e :
# Any failure in the block above is printed and otherwise ignored.
print ( e )
2024-02-24 09:12:19 +08:00
2024-01-25 16:40:19 +08:00
2024-01-23 23:59:52 +08:00
2024-01-25 16:40:19 +08:00
# Data directory: taken from the environment (with a local default) and
# resolved to an absolute path.
DATA_DIR = os.fspath(
    Path(os.environ.get(" DATA_DIR ", " ./data ")).resolve()
)

# Frontend build directory: taken from the environment, kept as given
# (not resolved).
FRONTEND_BUILD_DIR = os.fspath(
    Path(os.environ.get(" FRONTEND_BUILD_DIR ", " ../build "))
)
2024-01-07 17:40:36 +08:00
2024-02-20 10:54:22 +08:00
try :
with open ( f " { DATA_DIR } /config.json " , " r " ) as f :
CONFIG_DATA = json . load ( f )
except :
2023-11-19 08:47:12 +08:00
2024-01-25 16:40:19 +08:00
# File Upload DIR
2023-11-19 08:47:12 +08:00
2024-01-25 16:40:19 +08:00
UPLOAD_DIR = f" { DATA_DIR } /uploads "

# Cache DIR
CACHE_DIR = f" { DATA_DIR } /cache "

# Docs DIR
DOCS_DIR = f" { DATA_DIR } /docs "

# Create each directory (and any missing parents), in declaration order;
# directories that already exist are left untouched.
for _storage_dir in (UPLOAD_DIR, CACHE_DIR, DOCS_DIR):
    Path(_storage_dir).mkdir(parents=True, exist_ok=True)
del _storage_dir
2024-02-06 14:51:08 +08:00
2024-02-25 14:35:11 +08:00
def create_config_file(file_path):
    """Write a skeleton configuration to ``file_path`` as YAML.

    Creates the parent directory when needed, then dumps a mapping with empty
    general, litellm, model-list and router entries.

    Args:
        file_path: Destination of the YAML file; an existing file is
            overwritten.

    Raises:
        OSError: If the directory cannot be created or the file cannot be
            written.
    """
    directory = os.path.dirname(file_path)

    # ``exist_ok`` removes the check-then-create race; the guard skips bare
    # file names, whose dirname is "" and would make makedirs raise.
    if directory:
        os.makedirs(directory, exist_ok=True)

    # Data to write into the YAML file
    # NOTE(review): the keys keep the padding spaces shown in the reviewed
    # text — confirm them against the real file.
    config_data = {
        " general_settings ": {},
        " litellm_settings ": {},
        " model_list ": [],
        " router_settings ": {},
    }

    # Write data to YAML file ("w": a padded mode string is rejected by open())
    with open(file_path, "w") as file:
        yaml.dump(config_data, file)
# Location of the LiteLLM config file inside the data directory.
LITELLM_CONFIG_PATH = f" { DATA_DIR } /litellm/config.yaml "

# Seed a skeleton config the first time, announcing it before and after.
if not os.path.exists(LITELLM_CONFIG_PATH):
    print(" Config file doesn ' t exist. Creating... ")
    create_config_file(LITELLM_CONFIG_PATH)
    print(" Config file created successfully. ")
2023-11-19 08:47:12 +08:00
2024-01-07 14:59:22 +08:00
# Ollama API base URL, read from the environment with a localhost default.
# The call's closing parenthesis is restored here; without it the statement
# is not valid Python.
OLLAMA_API_BASE_URL = os.environ.get(
    " OLLAMA_API_BASE_URL ", " http://localhost:11434/api "
)

# In the prod environment, the "/ollama/api" value is swapped for the
# host.docker.internal address.
if ENV == " prod " and OLLAMA_API_BASE_URL == " /ollama/api ":
    OLLAMA_API_BASE_URL = " http://host.docker.internal:11434/api "
2023-11-19 08:47:12 +08:00
2024-01-05 08:49:34 +08:00
OPENAI_API_KEY = os . environ . get ( " OPENAI_API_KEY " , " " )
2024-01-05 10:38:03 +08:00
# OpenAI-compatible API base URL. The environment value wins; the public
# endpoint is only a fallback for an unset or blank value (previously the
# default was assigned unconditionally, discarding the environment value).
OPENAI_API_BASE_URL = os.environ.get(" OPENAI_API_BASE_URL ", " ")
if not OPENAI_API_BASE_URL.strip():
    OPENAI_API_BASE_URL = " https://api.openai.com/v1 "
2024-01-05 08:49:34 +08:00
2024-01-23 13:07:40 +08:00
2024-02-07 02:58:07 +08:00
# Signup flag read from the environment. Environment values are strings, so
# the raw value was truthy even for "false"; compare the text instead so the
# flag is always a bool. Unset still means True.
ENABLE_SIGNUP = (
    os.environ.get(" ENABLE_SIGNUP ", "true").strip().lower() == "true"
)
2024-01-23 13:07:40 +08:00
DEFAULT_MODELS = os . environ . get ( " DEFAULT_MODELS " , None )
2024-02-20 10:54:22 +08:00
CONFIG_DATA [ " ui " ] [ " prompt_suggestions " ]
2024-02-20 11:09:09 +08:00
if " ui " in CONFIG_DATA
and " prompt_suggestions " in CONFIG_DATA [ " ui " ]
and type ( CONFIG_DATA [ " ui " ] [ " prompt_suggestions " ] ) is list
2024-02-20 10:54:22 +08:00
else [
2024-01-23 13:07:40 +08:00
" title " : [ " Help me study " , " vocabulary for a college entrance exam " ] ,
" content " : " Help me study vocabulary: write a sentence for me to fill in the blank, and I ' ll try to pick the correct option. " ,
} ,
" title " : [ " Give me ideas " , " for what to do with my kids ' art " ] ,
" content " : " What are 5 creative things I could do with my kids ' art? I don ' t want to throw them away, but it ' s also so much clutter. " ,
} ,
" title " : [ " Tell me a fun fact " , " about the Roman Empire " ] ,
" content " : " Tell me a random fun fact about the Roman Empire " ,
} ,
" title " : [ " Show me a code snippet " , " of a website ' s sticky header " ] ,
" content " : " Show me a code snippet of a website ' s sticky header in CSS and JavaScript. " ,
} ,
2024-02-20 10:54:22 +08:00
2024-01-23 13:07:40 +08:00
2024-02-20 10:54:22 +08:00
2024-02-23 18:03:06 +08:00
DEFAULT_USER_ROLE = os . getenv ( " DEFAULT_USER_ROLE " , " pending " )
2024-02-14 17:17:43 +08:00
USER_PERMISSIONS = { " chat " : { " deletion " : True } }
2024-01-23 13:07:40 +08:00
2023-11-19 08:47:12 +08:00
2023-11-19 16:41:29 +08:00
2023-11-19 08:47:12 +08:00
2024-02-14 17:19:39 +08:00
WEBUI_VERSION = os . environ . get ( " WEBUI_VERSION " , " v1.0.0-alpha.100 " )
2023-11-19 08:47:12 +08:00
2023-12-26 14:14:06 +08:00
# WEBUI_AUTH (Required for security)
2023-11-19 08:47:12 +08:00
2023-12-26 14:14:06 +08:00
2023-11-19 08:47:12 +08:00
2023-11-21 08:22:43 +08:00
2024-02-02 03:40:59 +08:00
2023-11-21 08:22:43 +08:00
2024-02-02 03:40:59 +08:00
WEBUI_SECRET_KEY = os . environ . get (
2024-02-04 09:42:08 +08:00
os . environ . get (
" WEBUI_JWT_SECRET_KEY " , " t0p-s3cr3t "
) , # DEPRECATED: remove at next major version
2024-02-02 03:40:59 +08:00
2023-11-19 08:47:12 +08:00
2024-02-02 03:40:59 +08:00
2023-11-21 08:22:43 +08:00
2024-01-07 14:59:22 +08:00
2024-01-22 17:47:07 +08:00
CHROMA_DATA_PATH = f " { DATA_DIR } /vector_db "
2024-02-18 02:38:29 +08:00
# This uses the model defined in the Dockerfile ENV variable. If you don't use Docker or Docker-based deployments such as k8s, the default embedding model (all-MiniLM-L6-v2) will be used.
2024-02-20 02:56:50 +08:00
RAG_EMBEDDING_MODEL = os . environ . get ( " RAG_EMBEDDING_MODEL " , " all-MiniLM-L6-v2 " )
2024-02-19 14:51:17 +08:00
# Device type for embedding models - "cpu" (default), "cuda" (NVIDIA GPU required) or "mps" (Apple silicon) - choosing the right one can lead to better performance
2024-02-20 02:56:50 +08:00
RAG_EMBEDDING_MODEL_DEVICE_TYPE = os . environ . get (
2024-01-07 17:40:36 +08:00
CHROMA_CLIENT = chromadb . PersistentClient (
2024-02-04 09:42:08 +08:00
settings = Settings ( allow_reset = True , anonymized_telemetry = False ) ,
2024-01-07 17:40:36 +08:00
2024-01-07 14:59:22 +08:00
2024-02-11 16:17:50 +08:00
2024-02-18 14:41:03 +08:00
# Prompt template text containing a bracketed context marker and a bracketed
# query marker. The code that fills these markers in is not part of this
# section. The text is runtime data: edit the wording only deliberately.
RAG_TEMPLATE = """ Use the following context as your learned knowledge, inside <context></context> XML tags.
< context >
[ context ]
< / context >
When answer to user :
- If you don ' t know, just say that you don ' t know .
- If you don ' t know when you are not sure, ask for clarification.
Avoid mentioning that you obtained the information from the context .
And answer according to the language of the user ' s question.
Given the context information , answer the query .
Query : [ query ] """
2024-02-11 16:17:50 +08:00
# Transcribe
2024-02-15 15:32:54 +08:00
WHISPER_MODEL = os . getenv ( " WHISPER_MODEL " , " base " )
WHISPER_MODEL_DIR = os . getenv ( " WHISPER_MODEL_DIR " , f " { CACHE_DIR } /whisper/models " )
2024-02-22 10:12:01 +08:00
# Images
AUTOMATIC1111_BASE_URL = os . getenv ( " AUTOMATIC1111_BASE_URL " , " " )