github-actions[bot] commited on
Commit
a6c0eee
0 Parent(s):

GitHub deploy: 66c5a17453142e0afee794b163349521ecdb7894

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .dockerignore +20 -0
  2. .env.example +13 -0
  3. .eslintignore +13 -0
  4. .eslintrc.cjs +31 -0
  5. .gitattributes +3 -0
  6. .github/FUNDING.yml +1 -0
  7. .github/ISSUE_TEMPLATE/bug_report.md +80 -0
  8. .github/ISSUE_TEMPLATE/feature_request.md +35 -0
  9. .github/dependabot.yml +12 -0
  10. .github/pull_request_template.md +72 -0
  11. .github/workflows/build-release.yml +72 -0
  12. .github/workflows/deploy-to-hf-spaces.yml +63 -0
  13. .github/workflows/docker-build.yaml +477 -0
  14. .github/workflows/format-backend.yaml +39 -0
  15. .github/workflows/format-build-frontend.yaml +57 -0
  16. .github/workflows/integration-test.yml +253 -0
  17. .github/workflows/lint-backend.disabled +27 -0
  18. .github/workflows/lint-frontend.disabled +21 -0
  19. .github/workflows/release-pypi.yml +32 -0
  20. .gitignore +310 -0
  21. .npmrc +1 -0
  22. .prettierignore +316 -0
  23. .prettierrc +9 -0
  24. CHANGELOG.md +1297 -0
  25. CODE_OF_CONDUCT.md +77 -0
  26. Caddyfile.localhost +64 -0
  27. Dockerfile +176 -0
  28. INSTALLATION.md +35 -0
  29. LICENSE +21 -0
  30. Makefile +33 -0
  31. README.md +221 -0
  32. TROUBLESHOOTING.md +36 -0
  33. backend/.dockerignore +14 -0
  34. backend/.gitignore +12 -0
  35. backend/dev.sh +2 -0
  36. backend/open_webui/__init__.py +77 -0
  37. backend/open_webui/alembic.ini +114 -0
  38. backend/open_webui/apps/audio/main.py +713 -0
  39. backend/open_webui/apps/images/main.py +609 -0
  40. backend/open_webui/apps/images/utils/comfyui.py +186 -0
  41. backend/open_webui/apps/ollama/main.py +1324 -0
  42. backend/open_webui/apps/openai/main.py +714 -0
  43. backend/open_webui/apps/retrieval/loaders/main.py +190 -0
  44. backend/open_webui/apps/retrieval/loaders/youtube.py +98 -0
  45. backend/open_webui/apps/retrieval/main.py +1452 -0
  46. backend/open_webui/apps/retrieval/models/colbert.py +81 -0
  47. backend/open_webui/apps/retrieval/utils.py +592 -0
  48. backend/open_webui/apps/retrieval/vector/connector.py +22 -0
  49. backend/open_webui/apps/retrieval/vector/dbs/chroma.py +174 -0
  50. backend/open_webui/apps/retrieval/vector/dbs/milvus.py +286 -0
.dockerignore ADDED
@@ -0,0 +1,20 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ .github
2
+ .DS_Store
3
+ docs
4
+ kubernetes
5
+ node_modules
6
+ /.svelte-kit
7
+ /package
8
+ .env
9
+ .env.*
10
+ vite.config.js.timestamp-*
11
+ vite.config.ts.timestamp-*
12
+ __pycache__
13
+ .idea
14
+ venv
15
+ _old
16
+ uploads
17
+ .ipynb_checkpoints
18
+ **/*.db
19
+ _test
20
+ backend/data/*
.env.example ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Ollama URL for the backend to connect
2
+ # The path '/ollama' will be redirected to the specified backend URL
3
+ OLLAMA_BASE_URL='http://localhost:11434'
4
+
5
+ OPENAI_API_BASE_URL=''
6
+ OPENAI_API_KEY=''
7
+
8
+ # AUTOMATIC1111_BASE_URL="http://localhost:7860"
9
+
10
+ # DO NOT TRACK
11
+ SCARF_NO_ANALYTICS=true
12
+ DO_NOT_TRACK=true
13
+ ANONYMIZED_TELEMETRY=false
.eslintignore ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ .DS_Store
2
+ node_modules
3
+ /build
4
+ /.svelte-kit
5
+ /package
6
+ .env
7
+ .env.*
8
+ !.env.example
9
+
10
+ # Ignore files for PNPM, NPM and YARN
11
+ pnpm-lock.yaml
12
+ package-lock.json
13
+ yarn.lock
.eslintrc.cjs ADDED
@@ -0,0 +1,31 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ module.exports = {
2
+ root: true,
3
+ extends: [
4
+ 'eslint:recommended',
5
+ 'plugin:@typescript-eslint/recommended',
6
+ 'plugin:svelte/recommended',
7
+ 'plugin:cypress/recommended',
8
+ 'prettier'
9
+ ],
10
+ parser: '@typescript-eslint/parser',
11
+ plugins: ['@typescript-eslint'],
12
+ parserOptions: {
13
+ sourceType: 'module',
14
+ ecmaVersion: 2020,
15
+ extraFileExtensions: ['.svelte']
16
+ },
17
+ env: {
18
+ browser: true,
19
+ es2017: true,
20
+ node: true
21
+ },
22
+ overrides: [
23
+ {
24
+ files: ['*.svelte'],
25
+ parser: 'svelte-eslint-parser',
26
+ parserOptions: {
27
+ parser: '@typescript-eslint/parser'
28
+ }
29
+ }
30
+ ]
31
+ };
.gitattributes ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ *.sh text eol=lf
2
+ *.ttf filter=lfs diff=lfs merge=lfs -text
3
+ *.jpg filter=lfs diff=lfs merge=lfs -text
.github/FUNDING.yml ADDED
@@ -0,0 +1 @@
 
 
1
+ github: tjbck
.github/ISSUE_TEMPLATE/bug_report.md ADDED
@@ -0,0 +1,80 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ name: Bug report
3
+ about: Create a report to help us improve
4
+ title: ''
5
+ labels: ''
6
+ assignees: ''
7
+ ---
8
+
9
+ # Bug Report
10
+
11
+ ## Important Notes
12
+
13
+ - **Before submitting a bug report**: Please check the Issues or Discussions section to see if a similar issue or feature request has already been posted. It's likely we're already tracking it! If you’re unsure, start a discussion post first. This will help us efficiently focus on improving the project.
14
+
15
+ - **Collaborate respectfully**: We value a constructive attitude, so please be mindful of your communication. If negativity is part of your approach, our capacity to engage may be limited. We’re here to help if you’re open to learning and communicating positively. Remember, Open WebUI is a volunteer-driven project managed by a single maintainer and supported by contributors who also have full-time jobs. We appreciate your time and ask that you respect ours.
16
+
17
+ - **Contributing**: If you encounter an issue, we highly encourage you to submit a pull request or fork the project. We actively work to prevent contributor burnout to maintain the quality and continuity of Open WebUI.
18
+
19
+ - **Bug reproducibility**: If a bug cannot be reproduced with a `:main` or `:dev` Docker setup, or a pip install with Python 3.11, it may require additional help from the community. In such cases, we will move it to the "issues" Discussions section due to our limited resources. We encourage the community to assist with these issues. Remember, it’s not that the issue doesn’t exist; we need your help!
20
+
21
+ Note: Please remove the notes above when submitting your post. Thank you for your understanding and support!
22
+
23
+ ---
24
+
25
+ ## Installation Method
26
+
27
+ [Describe the method you used to install the project, e.g., git clone, Docker, pip, etc.]
28
+
29
+ ## Environment
30
+
31
+ - **Open WebUI Version:** [e.g., v0.3.11]
32
+ - **Ollama (if applicable):** [e.g., v0.2.0, v0.1.32-rc1]
33
+
34
+ - **Operating System:** [e.g., Windows 10, macOS Big Sur, Ubuntu 20.04]
35
+ - **Browser (if applicable):** [e.g., Chrome 100.0, Firefox 98.0]
36
+
37
+ **Confirmation:**
38
+
39
+ - [ ] I have read and followed all the instructions provided in the README.md.
40
+ - [ ] I am on the latest version of both Open WebUI and Ollama.
41
+ - [ ] I have included the browser console logs.
42
+ - [ ] I have included the Docker container logs.
43
+ - [ ] I have provided the exact steps to reproduce the bug in the "Steps to Reproduce" section below.
44
+
45
+ ## Expected Behavior:
46
+
47
+ [Describe what you expected to happen.]
48
+
49
+ ## Actual Behavior:
50
+
51
+ [Describe what actually happened.]
52
+
53
+ ## Description
54
+
55
+ **Bug Summary:**
56
+ [Provide a brief but clear summary of the bug]
57
+
58
+ ## Reproduction Details
59
+
60
+ **Steps to Reproduce:**
61
+ [Outline the steps to reproduce the bug. Be as detailed as possible.]
62
+
63
+ ## Logs and Screenshots
64
+
65
+ **Browser Console Logs:**
66
+ [Include relevant browser console logs, if applicable]
67
+
68
+ **Docker Container Logs:**
69
+ [Include relevant Docker container logs, if applicable]
70
+
71
+ **Screenshots/Screen Recordings (if applicable):**
72
+ [Attach any relevant screenshots to help illustrate the issue]
73
+
74
+ ## Additional Information
75
+
76
+ [Include any additional details that may help in understanding and reproducing the issue. This could include specific configurations, error messages, or anything else relevant to the bug.]
77
+
78
+ ## Note
79
+
80
+ If the bug report is incomplete or does not follow the provided instructions, it may not be addressed. Please ensure that you have followed the steps outlined in the README.md and troubleshooting.md documents, and provide all necessary information for us to reproduce and address the issue. Thank you!
.github/ISSUE_TEMPLATE/feature_request.md ADDED
@@ -0,0 +1,35 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ name: Feature request
3
+ about: Suggest an idea for this project
4
+ title: ''
5
+ labels: ''
6
+ assignees: ''
7
+ ---
8
+
9
+ # Feature Request
10
+
11
+ ## Important Notes
12
+
13
+ - **Before submitting a report**: Please check the Issues or Discussions section to see if a similar issue or feature request has already been posted. It's likely we're already tracking it! If you’re unsure, start a discussion post first. This will help us efficiently focus on improving the project.
14
+
15
+ - **Collaborate respectfully**: We value a constructive attitude, so please be mindful of your communication. If negativity is part of your approach, our capacity to engage may be limited. We’re here to help if you’re open to learning and communicating positively. Remember, Open WebUI is a volunteer-driven project managed by a single maintainer and supported by contributors who also have full-time jobs. We appreciate your time and ask that you respect ours.
16
+
17
+ - **Contributing**: If you encounter an issue, we highly encourage you to submit a pull request or fork the project. We actively work to prevent contributor burnout to maintain the quality and continuity of Open WebUI.
18
+
19
+ - **Bug reproducibility**: If a bug cannot be reproduced with a `:main` or `:dev` Docker setup, or a pip install with Python 3.11, it may require additional help from the community. In such cases, we will move it to the "issues" Discussions section due to our limited resources. We encourage the community to assist with these issues. Remember, it’s not that the issue doesn’t exist; we need your help!
20
+
21
+ Note: Please remove the notes above when submitting your post. Thank you for your understanding and support!
22
+
23
+ ---
24
+
25
+ **Is your feature request related to a problem? Please describe.**
26
+ A clear and concise description of what the problem is. Ex. I'm always frustrated when [...]
27
+
28
+ **Describe the solution you'd like**
29
+ A clear and concise description of what you want to happen.
30
+
31
+ **Describe alternatives you've considered**
32
+ A clear and concise description of any alternative solutions or features you've considered.
33
+
34
+ **Additional context**
35
+ Add any other context or screenshots about the feature request here.
.github/dependabot.yml ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ version: 2
2
+ updates:
3
+ - package-ecosystem: pip
4
+ directory: '/backend'
5
+ schedule:
6
+ interval: monthly
7
+ target-branch: 'dev'
8
+ - package-ecosystem: 'github-actions'
9
+ directory: '/'
10
+ schedule:
11
+ # Check for updates to GitHub Actions every week
12
+ interval: monthly
.github/pull_request_template.md ADDED
@@ -0,0 +1,72 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Pull Request Checklist
2
+
3
+ ### Note to first-time contributors: Please open a discussion post in [Discussions](https://github.com/open-webui/open-webui/discussions) and describe your changes before submitting a pull request.
4
+
5
+ **Before submitting, make sure you've checked the following:**
6
+
7
+ - [ ] **Target branch:** Please verify that the pull request targets the `dev` branch.
8
+ - [ ] **Description:** Provide a concise description of the changes made in this pull request.
9
+ - [ ] **Changelog:** Ensure a changelog entry following the format of [Keep a Changelog](https://keepachangelog.com/) is added at the bottom of the PR description.
10
+ - [ ] **Documentation:** Have you updated relevant documentation [Open WebUI Docs](https://github.com/open-webui/docs), or other documentation sources?
11
+ - [ ] **Dependencies:** Are there any new dependencies? Have you updated the dependency versions in the documentation?
12
+ - [ ] **Testing:** Have you written and run sufficient tests for validating the changes?
13
+ - [ ] **Code review:** Have you performed a self-review of your code, addressing any coding standard issues and ensuring adherence to the project's coding standards?
14
+ - [ ] **Prefix:** To cleary categorize this pull request, prefix the pull request title, using one of the following:
15
+ - **BREAKING CHANGE**: Significant changes that may affect compatibility
16
+ - **build**: Changes that affect the build system or external dependencies
17
+ - **ci**: Changes to our continuous integration processes or workflows
18
+ - **chore**: Refactor, cleanup, or other non-functional code changes
19
+ - **docs**: Documentation update or addition
20
+ - **feat**: Introduces a new feature or enhancement to the codebase
21
+ - **fix**: Bug fix or error correction
22
+ - **i18n**: Internationalization or localization changes
23
+ - **perf**: Performance improvement
24
+ - **refactor**: Code restructuring for better maintainability, readability, or scalability
25
+ - **style**: Changes that do not affect the meaning of the code (white-space, formatting, missing semi-colons, etc.)
26
+ - **test**: Adding missing tests or correcting existing tests
27
+ - **WIP**: Work in progress, a temporary label for incomplete or ongoing work
28
+
29
+ # Changelog Entry
30
+
31
+ ### Description
32
+
33
+ - [Concisely describe the changes made in this pull request, including any relevant motivation and impact (e.g., fixing a bug, adding a feature, or improving performance)]
34
+
35
+ ### Added
36
+
37
+ - [List any new features, functionalities, or additions]
38
+
39
+ ### Changed
40
+
41
+ - [List any changes, updates, refactorings, or optimizations]
42
+
43
+ ### Deprecated
44
+
45
+ - [List any deprecated functionality or features that have been removed]
46
+
47
+ ### Removed
48
+
49
+ - [List any removed features, files, or functionalities]
50
+
51
+ ### Fixed
52
+
53
+ - [List any fixes, corrections, or bug fixes]
54
+
55
+ ### Security
56
+
57
+ - [List any new or updated security-related changes, including vulnerability fixes]
58
+
59
+ ### Breaking Changes
60
+
61
+ - **BREAKING CHANGE**: [List any breaking changes affecting compatibility or functionality]
62
+
63
+ ---
64
+
65
+ ### Additional Information
66
+
67
+ - [Insert any additional context, notes, or explanations for the changes]
68
+ - [Reference any related issues, commits, or other relevant information]
69
+
70
+ ### Screenshots or Videos
71
+
72
+ - [Attach any relevant screenshots or videos demonstrating the changes]
.github/workflows/build-release.yml ADDED
@@ -0,0 +1,72 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ name: Release
2
+
3
+ on:
4
+ push:
5
+ branches:
6
+ - main # or whatever branch you want to use
7
+
8
+ jobs:
9
+ release:
10
+ runs-on: ubuntu-latest
11
+
12
+ steps:
13
+ - name: Checkout repository
14
+ uses: actions/checkout@v4
15
+
16
+ - name: Check for changes in package.json
17
+ run: |
18
+ git diff --cached --diff-filter=d package.json || {
19
+ echo "No changes to package.json"
20
+ exit 1
21
+ }
22
+
23
+ - name: Get version number from package.json
24
+ id: get_version
25
+ run: |
26
+ VERSION=$(jq -r '.version' package.json)
27
+ echo "::set-output name=version::$VERSION"
28
+
29
+ - name: Extract latest CHANGELOG entry
30
+ id: changelog
31
+ run: |
32
+ CHANGELOG_CONTENT=$(awk 'BEGIN {print_section=0;} /^## \[/ {if (print_section == 0) {print_section=1;} else {exit;}} print_section {print;}' CHANGELOG.md)
33
+ CHANGELOG_ESCAPED=$(echo "$CHANGELOG_CONTENT" | sed ':a;N;$!ba;s/\n/%0A/g')
34
+ echo "Extracted latest release notes from CHANGELOG.md:"
35
+ echo -e "$CHANGELOG_CONTENT"
36
+ echo "::set-output name=content::$CHANGELOG_ESCAPED"
37
+
38
+ - name: Create GitHub release
39
+ uses: actions/github-script@v7
40
+ with:
41
+ github-token: ${{ secrets.GITHUB_TOKEN }}
42
+ script: |
43
+ const changelog = `${{ steps.changelog.outputs.content }}`;
44
+ const release = await github.rest.repos.createRelease({
45
+ owner: context.repo.owner,
46
+ repo: context.repo.repo,
47
+ tag_name: `v${{ steps.get_version.outputs.version }}`,
48
+ name: `v${{ steps.get_version.outputs.version }}`,
49
+ body: changelog,
50
+ })
51
+ console.log(`Created release ${release.data.html_url}`)
52
+
53
+ - name: Upload package to GitHub release
54
+ uses: actions/upload-artifact@v4
55
+ with:
56
+ name: package
57
+ path: |
58
+ .
59
+ !.git
60
+ env:
61
+ GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }}
62
+
63
+ - name: Trigger Docker build workflow
64
+ uses: actions/github-script@v7
65
+ with:
66
+ script: |
67
+ github.rest.actions.createWorkflowDispatch({
68
+ owner: context.repo.owner,
69
+ repo: context.repo.repo,
70
+ workflow_id: 'docker-build.yaml',
71
+ ref: 'v${{ steps.get_version.outputs.version }}',
72
+ })
.github/workflows/deploy-to-hf-spaces.yml ADDED
@@ -0,0 +1,63 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ name: Deploy to HuggingFace Spaces
2
+
3
+ on:
4
+ push:
5
+ branches:
6
+ - dev
7
+ - main
8
+ workflow_dispatch:
9
+
10
+ jobs:
11
+ check-secret:
12
+ runs-on: ubuntu-latest
13
+ outputs:
14
+ token-set: ${{ steps.check-key.outputs.defined }}
15
+ steps:
16
+ - id: check-key
17
+ env:
18
+ HF_TOKEN: ${{ secrets.HF_TOKEN }}
19
+ if: "${{ env.HF_TOKEN != '' }}"
20
+ run: echo "defined=true" >> $GITHUB_OUTPUT
21
+
22
+ deploy:
23
+ runs-on: ubuntu-latest
24
+ needs: [check-secret]
25
+ if: needs.check-secret.outputs.token-set == 'true'
26
+ env:
27
+ HF_TOKEN: ${{ secrets.HF_TOKEN }}
28
+ steps:
29
+ - name: Checkout repository
30
+ uses: actions/checkout@v4
31
+ with:
32
+ lfs: true
33
+
34
+ - name: Remove git history
35
+ run: rm -rf .git
36
+
37
+ - name: Prepend YAML front matter to README.md
38
+ run: |
39
+ echo "---" > temp_readme.md
40
+ echo "title: Open WebUI" >> temp_readme.md
41
+ echo "emoji: 🐳" >> temp_readme.md
42
+ echo "colorFrom: purple" >> temp_readme.md
43
+ echo "colorTo: gray" >> temp_readme.md
44
+ echo "sdk: docker" >> temp_readme.md
45
+ echo "app_port: 8080" >> temp_readme.md
46
+ echo "---" >> temp_readme.md
47
+ cat README.md >> temp_readme.md
48
+ mv temp_readme.md README.md
49
+
50
+ - name: Configure git
51
+ run: |
52
+ git config --global user.email "41898282+github-actions[bot]@users.noreply.github.com"
53
+ git config --global user.name "github-actions[bot]"
54
+ - name: Set up Git and push to Space
55
+ run: |
56
+ git init --initial-branch=main
57
+ git lfs install
58
+ git lfs track "*.ttf"
59
+ git lfs track "*.jpg"
60
+ rm demo.gif
61
+ git add .
62
+ git commit -m "GitHub deploy: ${{ github.sha }}"
63
+ git push --force https://arcticaurora:${HF_TOKEN}@huggingface.co/spaces/arcticaurora/ai main
.github/workflows/docker-build.yaml ADDED
@@ -0,0 +1,477 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ name: Create and publish Docker images with specific build args
2
+
3
+ on:
4
+ workflow_dispatch:
5
+ push:
6
+ branches:
7
+ - main
8
+ - dev
9
+ tags:
10
+ - v*
11
+
12
+ env:
13
+ REGISTRY: ghcr.io
14
+
15
+ jobs:
16
+ build-main-image:
17
+ runs-on: ubuntu-latest
18
+ permissions:
19
+ contents: read
20
+ packages: write
21
+ strategy:
22
+ fail-fast: false
23
+ matrix:
24
+ platform:
25
+ - linux/amd64
26
+ - linux/arm64
27
+
28
+ steps:
29
+ # GitHub Packages requires the entire repository name to be in lowercase
30
+ # although the repository owner has a lowercase username, this prevents some people from running actions after forking
31
+ - name: Set repository and image name to lowercase
32
+ run: |
33
+ echo "IMAGE_NAME=${IMAGE_NAME,,}" >>${GITHUB_ENV}
34
+ echo "FULL_IMAGE_NAME=ghcr.io/${IMAGE_NAME,,}" >>${GITHUB_ENV}
35
+ env:
36
+ IMAGE_NAME: '${{ github.repository }}'
37
+
38
+ - name: Prepare
39
+ run: |
40
+ platform=${{ matrix.platform }}
41
+ echo "PLATFORM_PAIR=${platform//\//-}" >> $GITHUB_ENV
42
+
43
+ - name: Checkout repository
44
+ uses: actions/checkout@v4
45
+
46
+ - name: Set up QEMU
47
+ uses: docker/setup-qemu-action@v3
48
+
49
+ - name: Set up Docker Buildx
50
+ uses: docker/setup-buildx-action@v3
51
+
52
+ - name: Log in to the Container registry
53
+ uses: docker/login-action@v3
54
+ with:
55
+ registry: ${{ env.REGISTRY }}
56
+ username: ${{ github.actor }}
57
+ password: ${{ secrets.GITHUB_TOKEN }}
58
+
59
+ - name: Extract metadata for Docker images (default latest tag)
60
+ id: meta
61
+ uses: docker/metadata-action@v5
62
+ with:
63
+ images: ${{ env.FULL_IMAGE_NAME }}
64
+ tags: |
65
+ type=ref,event=branch
66
+ type=ref,event=tag
67
+ type=sha,prefix=git-
68
+ type=semver,pattern={{version}}
69
+ type=semver,pattern={{major}}.{{minor}}
70
+ flavor: |
71
+ latest=${{ github.ref == 'refs/heads/main' }}
72
+
73
+ - name: Extract metadata for Docker cache
74
+ id: cache-meta
75
+ uses: docker/metadata-action@v5
76
+ with:
77
+ images: ${{ env.FULL_IMAGE_NAME }}
78
+ tags: |
79
+ type=ref,event=branch
80
+ ${{ github.ref_type == 'tag' && 'type=raw,value=main' || '' }}
81
+ flavor: |
82
+ prefix=cache-${{ matrix.platform }}-
83
+ latest=false
84
+
85
+ - name: Build Docker image (latest)
86
+ uses: docker/build-push-action@v5
87
+ id: build
88
+ with:
89
+ context: .
90
+ push: true
91
+ platforms: ${{ matrix.platform }}
92
+ labels: ${{ steps.meta.outputs.labels }}
93
+ outputs: type=image,name=${{ env.FULL_IMAGE_NAME }},push-by-digest=true,name-canonical=true,push=true
94
+ cache-from: type=registry,ref=${{ steps.cache-meta.outputs.tags }}
95
+ cache-to: type=registry,ref=${{ steps.cache-meta.outputs.tags }},mode=max
96
+ build-args: |
97
+ BUILD_HASH=${{ github.sha }}
98
+
99
+ - name: Export digest
100
+ run: |
101
+ mkdir -p /tmp/digests
102
+ digest="${{ steps.build.outputs.digest }}"
103
+ touch "/tmp/digests/${digest#sha256:}"
104
+
105
+ - name: Upload digest
106
+ uses: actions/upload-artifact@v4
107
+ with:
108
+ name: digests-main-${{ env.PLATFORM_PAIR }}
109
+ path: /tmp/digests/*
110
+ if-no-files-found: error
111
+ retention-days: 1
112
+
113
+ build-cuda-image:
114
+ runs-on: ubuntu-latest
115
+ permissions:
116
+ contents: read
117
+ packages: write
118
+ strategy:
119
+ fail-fast: false
120
+ matrix:
121
+ platform:
122
+ - linux/amd64
123
+ - linux/arm64
124
+
125
+ steps:
126
+ # GitHub Packages requires the entire repository name to be in lowercase
127
+ # although the repository owner has a lowercase username, this prevents some people from running actions after forking
128
+ - name: Set repository and image name to lowercase
129
+ run: |
130
+ echo "IMAGE_NAME=${IMAGE_NAME,,}" >>${GITHUB_ENV}
131
+ echo "FULL_IMAGE_NAME=ghcr.io/${IMAGE_NAME,,}" >>${GITHUB_ENV}
132
+ env:
133
+ IMAGE_NAME: '${{ github.repository }}'
134
+
135
+ - name: Prepare
136
+ run: |
137
+ platform=${{ matrix.platform }}
138
+ echo "PLATFORM_PAIR=${platform//\//-}" >> $GITHUB_ENV
139
+
140
+ - name: Checkout repository
141
+ uses: actions/checkout@v4
142
+
143
+ - name: Set up QEMU
144
+ uses: docker/setup-qemu-action@v3
145
+
146
+ - name: Set up Docker Buildx
147
+ uses: docker/setup-buildx-action@v3
148
+
149
+ - name: Log in to the Container registry
150
+ uses: docker/login-action@v3
151
+ with:
152
+ registry: ${{ env.REGISTRY }}
153
+ username: ${{ github.actor }}
154
+ password: ${{ secrets.GITHUB_TOKEN }}
155
+
156
+ - name: Extract metadata for Docker images (cuda tag)
157
+ id: meta
158
+ uses: docker/metadata-action@v5
159
+ with:
160
+ images: ${{ env.FULL_IMAGE_NAME }}
161
+ tags: |
162
+ type=ref,event=branch
163
+ type=ref,event=tag
164
+ type=sha,prefix=git-
165
+ type=semver,pattern={{version}}
166
+ type=semver,pattern={{major}}.{{minor}}
167
+ type=raw,enable=${{ github.ref == 'refs/heads/main' }},prefix=,suffix=,value=cuda
168
+ flavor: |
169
+ latest=${{ github.ref == 'refs/heads/main' }}
170
+ suffix=-cuda,onlatest=true
171
+
172
+ - name: Extract metadata for Docker cache
173
+ id: cache-meta
174
+ uses: docker/metadata-action@v5
175
+ with:
176
+ images: ${{ env.FULL_IMAGE_NAME }}
177
+ tags: |
178
+ type=ref,event=branch
179
+ ${{ github.ref_type == 'tag' && 'type=raw,value=main' || '' }}
180
+ flavor: |
181
+ prefix=cache-cuda-${{ matrix.platform }}-
182
+ latest=false
183
+
184
+ - name: Build Docker image (cuda)
185
+ uses: docker/build-push-action@v5
186
+ id: build
187
+ with:
188
+ context: .
189
+ push: true
190
+ platforms: ${{ matrix.platform }}
191
+ labels: ${{ steps.meta.outputs.labels }}
192
+ outputs: type=image,name=${{ env.FULL_IMAGE_NAME }},push-by-digest=true,name-canonical=true,push=true
193
+ cache-from: type=registry,ref=${{ steps.cache-meta.outputs.tags }}
194
+ cache-to: type=registry,ref=${{ steps.cache-meta.outputs.tags }},mode=max
195
+ build-args: |
196
+ BUILD_HASH=${{ github.sha }}
197
+ USE_CUDA=true
198
+
199
+ - name: Export digest
200
+ run: |
201
+ mkdir -p /tmp/digests
202
+ digest="${{ steps.build.outputs.digest }}"
203
+ touch "/tmp/digests/${digest#sha256:}"
204
+
205
+ - name: Upload digest
206
+ uses: actions/upload-artifact@v4
207
+ with:
208
+ name: digests-cuda-${{ env.PLATFORM_PAIR }}
209
+ path: /tmp/digests/*
210
+ if-no-files-found: error
211
+ retention-days: 1
212
+
213
+ build-ollama-image:
214
+ runs-on: ubuntu-latest
215
+ permissions:
216
+ contents: read
217
+ packages: write
218
+ strategy:
219
+ fail-fast: false
220
+ matrix:
221
+ platform:
222
+ - linux/amd64
223
+ - linux/arm64
224
+
225
+ steps:
226
+ # GitHub Packages requires the entire repository name to be in lowercase
227
+ # although the repository owner has a lowercase username, this prevents some people from running actions after forking
228
+ - name: Set repository and image name to lowercase
229
+ run: |
230
+ echo "IMAGE_NAME=${IMAGE_NAME,,}" >>${GITHUB_ENV}
231
+ echo "FULL_IMAGE_NAME=ghcr.io/${IMAGE_NAME,,}" >>${GITHUB_ENV}
232
+ env:
233
+ IMAGE_NAME: '${{ github.repository }}'
234
+
235
+ - name: Prepare
236
+ run: |
237
+ platform=${{ matrix.platform }}
238
+ echo "PLATFORM_PAIR=${platform//\//-}" >> $GITHUB_ENV
239
+
240
+ - name: Checkout repository
241
+ uses: actions/checkout@v4
242
+
243
+ - name: Set up QEMU
244
+ uses: docker/setup-qemu-action@v3
245
+
246
+ - name: Set up Docker Buildx
247
+ uses: docker/setup-buildx-action@v3
248
+
249
+ - name: Log in to the Container registry
250
+ uses: docker/login-action@v3
251
+ with:
252
+ registry: ${{ env.REGISTRY }}
253
+ username: ${{ github.actor }}
254
+ password: ${{ secrets.GITHUB_TOKEN }}
255
+
256
+ - name: Extract metadata for Docker images (ollama tag)
257
+ id: meta
258
+ uses: docker/metadata-action@v5
259
+ with:
260
+ images: ${{ env.FULL_IMAGE_NAME }}
261
+ tags: |
262
+ type=ref,event=branch
263
+ type=ref,event=tag
264
+ type=sha,prefix=git-
265
+ type=semver,pattern={{version}}
266
+ type=semver,pattern={{major}}.{{minor}}
267
+ type=raw,enable=${{ github.ref == 'refs/heads/main' }},prefix=,suffix=,value=ollama
268
+ flavor: |
269
+ latest=${{ github.ref == 'refs/heads/main' }}
270
+ suffix=-ollama,onlatest=true
271
+
272
+ - name: Extract metadata for Docker cache
273
+ id: cache-meta
274
+ uses: docker/metadata-action@v5
275
+ with:
276
+ images: ${{ env.FULL_IMAGE_NAME }}
277
+ tags: |
278
+ type=ref,event=branch
279
+ ${{ github.ref_type == 'tag' && 'type=raw,value=main' || '' }}
280
+ flavor: |
281
+ prefix=cache-ollama-${{ matrix.platform }}-
282
+ latest=false
283
+
284
+ - name: Build Docker image (ollama)
285
+ uses: docker/build-push-action@v5
286
+ id: build
287
+ with:
288
+ context: .
289
+ push: true
290
+ platforms: ${{ matrix.platform }}
291
+ labels: ${{ steps.meta.outputs.labels }}
292
+ outputs: type=image,name=${{ env.FULL_IMAGE_NAME }},push-by-digest=true,name-canonical=true,push=true
293
+ cache-from: type=registry,ref=${{ steps.cache-meta.outputs.tags }}
294
+ cache-to: type=registry,ref=${{ steps.cache-meta.outputs.tags }},mode=max
295
+ build-args: |
296
+ BUILD_HASH=${{ github.sha }}
297
+ USE_OLLAMA=true
298
+
299
+ - name: Export digest
300
+ run: |
301
+ mkdir -p /tmp/digests
302
+ digest="${{ steps.build.outputs.digest }}"
303
+ touch "/tmp/digests/${digest#sha256:}"
304
+
305
+ - name: Upload digest
306
+ uses: actions/upload-artifact@v4
307
+ with:
308
+ name: digests-ollama-${{ env.PLATFORM_PAIR }}
309
+ path: /tmp/digests/*
310
+ if-no-files-found: error
311
+ retention-days: 1
312
+
313
+ merge-main-images:
314
+ runs-on: ubuntu-latest
315
+ needs: [build-main-image]
316
+ steps:
317
+ # GitHub Packages requires the entire repository name to be in lowercase
318
+ # although the repository owner has a lowercase username, this prevents some people from running actions after forking
319
+ - name: Set repository and image name to lowercase
320
+ run: |
321
+ echo "IMAGE_NAME=${IMAGE_NAME,,}" >>${GITHUB_ENV}
322
+ echo "FULL_IMAGE_NAME=ghcr.io/${IMAGE_NAME,,}" >>${GITHUB_ENV}
323
+ env:
324
+ IMAGE_NAME: '${{ github.repository }}'
325
+
326
+ - name: Download digests
327
+ uses: actions/download-artifact@v4
328
+ with:
329
+ pattern: digests-main-*
330
+ path: /tmp/digests
331
+ merge-multiple: true
332
+
333
+ - name: Set up Docker Buildx
334
+ uses: docker/setup-buildx-action@v3
335
+
336
+ - name: Log in to the Container registry
337
+ uses: docker/login-action@v3
338
+ with:
339
+ registry: ${{ env.REGISTRY }}
340
+ username: ${{ github.actor }}
341
+ password: ${{ secrets.GITHUB_TOKEN }}
342
+
343
+ - name: Extract metadata for Docker images (default latest tag)
344
+ id: meta
345
+ uses: docker/metadata-action@v5
346
+ with:
347
+ images: ${{ env.FULL_IMAGE_NAME }}
348
+ tags: |
349
+ type=ref,event=branch
350
+ type=ref,event=tag
351
+ type=sha,prefix=git-
352
+ type=semver,pattern={{version}}
353
+ type=semver,pattern={{major}}.{{minor}}
354
+ flavor: |
355
+ latest=${{ github.ref == 'refs/heads/main' }}
356
+
357
+ - name: Create manifest list and push
358
+ working-directory: /tmp/digests
359
+ run: |
360
+ docker buildx imagetools create $(jq -cr '.tags | map("-t " + .) | join(" ")' <<< "$DOCKER_METADATA_OUTPUT_JSON") \
361
+ $(printf '${{ env.FULL_IMAGE_NAME }}@sha256:%s ' *)
362
+
363
+ - name: Inspect image
364
+ run: |
365
+ docker buildx imagetools inspect ${{ env.FULL_IMAGE_NAME }}:${{ steps.meta.outputs.version }}
366
+
367
+ merge-cuda-images:
368
+ runs-on: ubuntu-latest
369
+ needs: [build-cuda-image]
370
+ steps:
371
+ # GitHub Packages requires the entire repository name to be in lowercase
372
+ # although the repository owner has a lowercase username, this prevents some people from running actions after forking
373
+ - name: Set repository and image name to lowercase
374
+ run: |
375
+ echo "IMAGE_NAME=${IMAGE_NAME,,}" >>${GITHUB_ENV}
376
+ echo "FULL_IMAGE_NAME=ghcr.io/${IMAGE_NAME,,}" >>${GITHUB_ENV}
377
+ env:
378
+ IMAGE_NAME: '${{ github.repository }}'
379
+
380
+ - name: Download digests
381
+ uses: actions/download-artifact@v4
382
+ with:
383
+ pattern: digests-cuda-*
384
+ path: /tmp/digests
385
+ merge-multiple: true
386
+
387
+ - name: Set up Docker Buildx
388
+ uses: docker/setup-buildx-action@v3
389
+
390
+ - name: Log in to the Container registry
391
+ uses: docker/login-action@v3
392
+ with:
393
+ registry: ${{ env.REGISTRY }}
394
+ username: ${{ github.actor }}
395
+ password: ${{ secrets.GITHUB_TOKEN }}
396
+
397
+ - name: Extract metadata for Docker images (default latest tag)
398
+ id: meta
399
+ uses: docker/metadata-action@v5
400
+ with:
401
+ images: ${{ env.FULL_IMAGE_NAME }}
402
+ tags: |
403
+ type=ref,event=branch
404
+ type=ref,event=tag
405
+ type=sha,prefix=git-
406
+ type=semver,pattern={{version}}
407
+ type=semver,pattern={{major}}.{{minor}}
408
+ type=raw,enable=${{ github.ref == 'refs/heads/main' }},prefix=,suffix=,value=cuda
409
+ flavor: |
410
+ latest=${{ github.ref == 'refs/heads/main' }}
411
+ suffix=-cuda,onlatest=true
412
+
413
+ - name: Create manifest list and push
414
+ working-directory: /tmp/digests
415
+ run: |
416
+ docker buildx imagetools create $(jq -cr '.tags | map("-t " + .) | join(" ")' <<< "$DOCKER_METADATA_OUTPUT_JSON") \
417
+ $(printf '${{ env.FULL_IMAGE_NAME }}@sha256:%s ' *)
418
+
419
+ - name: Inspect image
420
+ run: |
421
+ docker buildx imagetools inspect ${{ env.FULL_IMAGE_NAME }}:${{ steps.meta.outputs.version }}
422
+
423
+ merge-ollama-images:
424
+ runs-on: ubuntu-latest
425
+ needs: [build-ollama-image]
426
+ steps:
427
+ # GitHub Packages requires the entire repository name to be in lowercase
428
+ # although the repository owner has a lowercase username, this prevents some people from running actions after forking
429
+ - name: Set repository and image name to lowercase
430
+ run: |
431
+ echo "IMAGE_NAME=${IMAGE_NAME,,}" >>${GITHUB_ENV}
432
+ echo "FULL_IMAGE_NAME=ghcr.io/${IMAGE_NAME,,}" >>${GITHUB_ENV}
433
+ env:
434
+ IMAGE_NAME: '${{ github.repository }}'
435
+
436
+ - name: Download digests
437
+ uses: actions/download-artifact@v4
438
+ with:
439
+ pattern: digests-ollama-*
440
+ path: /tmp/digests
441
+ merge-multiple: true
442
+
443
+ - name: Set up Docker Buildx
444
+ uses: docker/setup-buildx-action@v3
445
+
446
+ - name: Log in to the Container registry
447
+ uses: docker/login-action@v3
448
+ with:
449
+ registry: ${{ env.REGISTRY }}
450
+ username: ${{ github.actor }}
451
+ password: ${{ secrets.GITHUB_TOKEN }}
452
+
453
+ - name: Extract metadata for Docker images (default ollama tag)
454
+ id: meta
455
+ uses: docker/metadata-action@v5
456
+ with:
457
+ images: ${{ env.FULL_IMAGE_NAME }}
458
+ tags: |
459
+ type=ref,event=branch
460
+ type=ref,event=tag
461
+ type=sha,prefix=git-
462
+ type=semver,pattern={{version}}
463
+ type=semver,pattern={{major}}.{{minor}}
464
+ type=raw,enable=${{ github.ref == 'refs/heads/main' }},prefix=,suffix=,value=ollama
465
+ flavor: |
466
+ latest=${{ github.ref == 'refs/heads/main' }}
467
+ suffix=-ollama,onlatest=true
468
+
469
+ - name: Create manifest list and push
470
+ working-directory: /tmp/digests
471
+ run: |
472
+ docker buildx imagetools create $(jq -cr '.tags | map("-t " + .) | join(" ")' <<< "$DOCKER_METADATA_OUTPUT_JSON") \
473
+ $(printf '${{ env.FULL_IMAGE_NAME }}@sha256:%s ' *)
474
+
475
+ - name: Inspect image
476
+ run: |
477
+ docker buildx imagetools inspect ${{ env.FULL_IMAGE_NAME }}:${{ steps.meta.outputs.version }}
.github/workflows/format-backend.yaml ADDED
@@ -0,0 +1,39 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ name: Python CI
2
+
3
+ on:
4
+ push:
5
+ branches:
6
+ - main
7
+ - dev
8
+ pull_request:
9
+ branches:
10
+ - main
11
+ - dev
12
+
13
+ jobs:
14
+ build:
15
+ name: 'Format Backend'
16
+ runs-on: ubuntu-latest
17
+
18
+ strategy:
19
+ matrix:
20
+ python-version: [3.11]
21
+
22
+ steps:
23
+ - uses: actions/checkout@v4
24
+
25
+ - name: Set up Python
26
+ uses: actions/setup-python@v5
27
+ with:
28
+ python-version: ${{ matrix.python-version }}
29
+
30
+ - name: Install dependencies
31
+ run: |
32
+ python -m pip install --upgrade pip
33
+ pip install black
34
+
35
+ - name: Format backend
36
+ run: npm run format:backend
37
+
38
+ - name: Check for changes after format
39
+ run: git diff --exit-code
.github/workflows/format-build-frontend.yaml ADDED
@@ -0,0 +1,57 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ name: Frontend Build
2
+
3
+ on:
4
+ push:
5
+ branches:
6
+ - main
7
+ - dev
8
+ pull_request:
9
+ branches:
10
+ - main
11
+ - dev
12
+
13
+ jobs:
14
+ build:
15
+ name: 'Format & Build Frontend'
16
+ runs-on: ubuntu-latest
17
+ steps:
18
+ - name: Checkout Repository
19
+ uses: actions/checkout@v4
20
+
21
+ - name: Setup Node.js
22
+ uses: actions/setup-node@v4
23
+ with:
24
+ node-version: '22' # Or specify any other version you want to use
25
+
26
+ - name: Install Dependencies
27
+ run: npm install
28
+
29
+ - name: Format Frontend
30
+ run: npm run format
31
+
32
+ - name: Run i18next
33
+ run: npm run i18n:parse
34
+
35
+ - name: Check for Changes After Format
36
+ run: git diff --exit-code
37
+
38
+ - name: Build Frontend
39
+ run: npm run build
40
+
41
+ test-frontend:
42
+ name: 'Frontend Unit Tests'
43
+ runs-on: ubuntu-latest
44
+ steps:
45
+ - name: Checkout Repository
46
+ uses: actions/checkout@v4
47
+
48
+ - name: Setup Node.js
49
+ uses: actions/setup-node@v4
50
+ with:
51
+ node-version: '22'
52
+
53
+ - name: Install Dependencies
54
+ run: npm ci
55
+
56
+ - name: Run vitest
57
+ run: npm run test:frontend
.github/workflows/integration-test.yml ADDED
@@ -0,0 +1,253 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ name: Integration Test
2
+
3
+ on:
4
+ push:
5
+ branches:
6
+ - main
7
+ - dev
8
+ pull_request:
9
+ branches:
10
+ - main
11
+ - dev
12
+
13
+ jobs:
14
+ cypress-run:
15
+ name: Run Cypress Integration Tests
16
+ runs-on: ubuntu-latest
17
+ steps:
18
+ - name: Maximize build space
19
+ uses: AdityaGarg8/[email protected]
20
+ with:
21
+ remove-android: 'true'
22
+ remove-haskell: 'true'
23
+ remove-codeql: 'true'
24
+
25
+ - name: Checkout Repository
26
+ uses: actions/checkout@v4
27
+
28
+ - name: Build and run Compose Stack
29
+ run: |
30
+ docker compose \
31
+ --file docker-compose.yaml \
32
+ --file docker-compose.api.yaml \
33
+ --file docker-compose.a1111-test.yaml \
34
+ up --detach --build
35
+
36
+ - name: Delete Docker build cache
37
+ run: |
38
+ docker builder prune --all --force
39
+
40
+ - name: Wait for Ollama to be up
41
+ timeout-minutes: 5
42
+ run: |
43
+ until curl --output /dev/null --silent --fail http://localhost:11434; do
44
+ printf '.'
45
+ sleep 1
46
+ done
47
+ echo "Service is up!"
48
+
49
+ - name: Preload Ollama model
50
+ run: |
51
+ docker exec ollama ollama pull qwen:0.5b-chat-v1.5-q2_K
52
+
53
+ - name: Cypress run
54
+ uses: cypress-io/github-action@v6
55
+ with:
56
+ browser: chrome
57
+ wait-on: 'http://localhost:3000'
58
+ config: baseUrl=http://localhost:3000
59
+
60
+ - uses: actions/upload-artifact@v4
61
+ if: always()
62
+ name: Upload Cypress videos
63
+ with:
64
+ name: cypress-videos
65
+ path: cypress/videos
66
+ if-no-files-found: ignore
67
+
68
+ - name: Extract Compose logs
69
+ if: always()
70
+ run: |
71
+ docker compose logs > compose-logs.txt
72
+
73
+ - uses: actions/upload-artifact@v4
74
+ if: always()
75
+ name: Upload Compose logs
76
+ with:
77
+ name: compose-logs
78
+ path: compose-logs.txt
79
+ if-no-files-found: ignore
80
+
81
+ # pytest:
82
+ # name: Run Backend Tests
83
+ # runs-on: ubuntu-latest
84
+ # steps:
85
+ # - uses: actions/checkout@v4
86
+
87
+ # - name: Set up Python
88
+ # uses: actions/setup-python@v5
89
+ # with:
90
+ # python-version: ${{ matrix.python-version }}
91
+
92
+ # - name: Install dependencies
93
+ # run: |
94
+ # python -m pip install --upgrade pip
95
+ # pip install -r backend/requirements.txt
96
+
97
+ # - name: pytest run
98
+ # run: |
99
+ # ls -al
100
+ # cd backend
101
+ # PYTHONPATH=. pytest . -o log_cli=true -o log_cli_level=INFO
102
+
103
+ migration_test:
104
+ name: Run Migration Tests
105
+ runs-on: ubuntu-latest
106
+ services:
107
+ postgres:
108
+ image: postgres
109
+ env:
110
+ POSTGRES_PASSWORD: postgres
111
+ options: >-
112
+ --health-cmd pg_isready
113
+ --health-interval 10s
114
+ --health-timeout 5s
115
+ --health-retries 5
116
+ ports:
117
+ - 5432:5432
118
+ # mysql:
119
+ # image: mysql
120
+ # env:
121
+ # MYSQL_ROOT_PASSWORD: mysql
122
+ # MYSQL_DATABASE: mysql
123
+ # options: >-
124
+ # --health-cmd "mysqladmin ping -h localhost"
125
+ # --health-interval 10s
126
+ # --health-timeout 5s
127
+ # --health-retries 5
128
+ # ports:
129
+ # - 3306:3306
130
+ steps:
131
+ - name: Checkout Repository
132
+ uses: actions/checkout@v4
133
+
134
+ - name: Set up Python
135
+ uses: actions/setup-python@v5
136
+ with:
137
+ python-version: ${{ matrix.python-version }}
138
+
139
+ - name: Set up uv
140
+ uses: yezz123/setup-uv@v4
141
+ with:
142
+ uv-venv: venv
143
+
144
+ - name: Activate virtualenv
145
+ run: |
146
+ . venv/bin/activate
147
+ echo PATH=$PATH >> $GITHUB_ENV
148
+
149
+ - name: Install dependencies
150
+ run: |
151
+ uv pip install -r backend/requirements.txt
152
+
153
+ - name: Test backend with SQLite
154
+ id: sqlite
155
+ env:
156
+ WEBUI_SECRET_KEY: secret-key
157
+ GLOBAL_LOG_LEVEL: debug
158
+ run: |
159
+ cd backend
160
+ uvicorn open_webui.main:app --port "8080" --forwarded-allow-ips '*' &
161
+ UVICORN_PID=$!
162
+ # Wait up to 40 seconds for the server to start
163
+ for i in {1..40}; do
164
+ curl -s http://localhost:8080/api/config > /dev/null && break
165
+ sleep 1
166
+ if [ $i -eq 40 ]; then
167
+ echo "Server failed to start"
168
+ kill -9 $UVICORN_PID
169
+ exit 1
170
+ fi
171
+ done
172
+ # Check that the server is still running after 5 seconds
173
+ sleep 5
174
+ if ! kill -0 $UVICORN_PID; then
175
+ echo "Server has stopped"
176
+ exit 1
177
+ fi
178
+
179
+ - name: Test backend with Postgres
180
+ if: success() || steps.sqlite.conclusion == 'failure'
181
+ env:
182
+ WEBUI_SECRET_KEY: secret-key
183
+ GLOBAL_LOG_LEVEL: debug
184
+ DATABASE_URL: postgresql://postgres:postgres@localhost:5432/postgres
185
+ DATABASE_POOL_SIZE: 10
186
+ DATABASE_POOL_MAX_OVERFLOW: 10
187
+ DATABASE_POOL_TIMEOUT: 30
188
+ run: |
189
+ cd backend
190
+ uvicorn open_webui.main:app --port "8081" --forwarded-allow-ips '*' &
191
+ UVICORN_PID=$!
192
+ # Wait up to 20 seconds for the server to start
193
+ for i in {1..20}; do
194
+ curl -s http://localhost:8081/api/config > /dev/null && break
195
+ sleep 1
196
+ if [ $i -eq 20 ]; then
197
+ echo "Server failed to start"
198
+ kill -9 $UVICORN_PID
199
+ exit 1
200
+ fi
201
+ done
202
+ # Check that the server is still running after 5 seconds
203
+ sleep 5
204
+ if ! kill -0 $UVICORN_PID; then
205
+ echo "Server has stopped"
206
+ exit 1
207
+ fi
208
+
209
+ # Check that service will reconnect to postgres when connection will be closed
210
+ status_code=$(curl --write-out %{http_code} -s --output /dev/null http://localhost:8081/health/db)
211
+ if [[ "$status_code" -ne 200 ]] ; then
212
+ echo "Server has failed before postgres reconnect check"
213
+ exit 1
214
+ fi
215
+
216
+ echo "Terminating all connections to postgres..."
217
+ python -c "import os, psycopg2 as pg2; \
218
+ conn = pg2.connect(dsn=os.environ['DATABASE_URL'].replace('+pool', '')); \
219
+ cur = conn.cursor(); \
220
+ cur.execute('SELECT pg_terminate_backend(psa.pid) FROM pg_stat_activity psa WHERE datname = current_database() AND pid <> pg_backend_pid();')"
221
+
222
+ status_code=$(curl --write-out %{http_code} -s --output /dev/null http://localhost:8081/health/db)
223
+ if [[ "$status_code" -ne 200 ]] ; then
224
+ echo "Server has not reconnected to postgres after connection was closed: returned status $status_code"
225
+ exit 1
226
+ fi
227
+
228
+ # - name: Test backend with MySQL
229
+ # if: success() || steps.sqlite.conclusion == 'failure' || steps.postgres.conclusion == 'failure'
230
+ # env:
231
+ # WEBUI_SECRET_KEY: secret-key
232
+ # GLOBAL_LOG_LEVEL: debug
233
+ # DATABASE_URL: mysql://root:mysql@localhost:3306/mysql
234
+ # run: |
235
+ # cd backend
236
+ # uvicorn open_webui.main:app --port "8083" --forwarded-allow-ips '*' &
237
+ # UVICORN_PID=$!
238
+ # # Wait up to 20 seconds for the server to start
239
+ # for i in {1..20}; do
240
+ # curl -s http://localhost:8083/api/config > /dev/null && break
241
+ # sleep 1
242
+ # if [ $i -eq 20 ]; then
243
+ # echo "Server failed to start"
244
+ # kill -9 $UVICORN_PID
245
+ # exit 1
246
+ # fi
247
+ # done
248
+ # # Check that the server is still running after 5 seconds
249
+ # sleep 5
250
+ # if ! kill -0 $UVICORN_PID; then
251
+ # echo "Server has stopped"
252
+ # exit 1
253
+ # fi
.github/workflows/lint-backend.disabled ADDED
@@ -0,0 +1,27 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ name: Python CI
2
+ on:
3
+ push:
4
+ branches: ['main']
5
+ pull_request:
6
+ jobs:
7
+ build:
8
+ name: 'Lint Backend'
9
+ env:
10
+ PUBLIC_API_BASE_URL: ''
11
+ runs-on: ubuntu-latest
12
+ strategy:
13
+ matrix:
14
+ node-version:
15
+ - latest
16
+ steps:
17
+ - uses: actions/checkout@v4
18
+ - name: Use Python
19
+ uses: actions/setup-python@v5
20
+ - name: Use Bun
21
+ uses: oven-sh/setup-bun@v1
22
+ - name: Install dependencies
23
+ run: |
24
+ python -m pip install --upgrade pip
25
+ pip install pylint
26
+ - name: Lint backend
27
+ run: bun run lint:backend
.github/workflows/lint-frontend.disabled ADDED
@@ -0,0 +1,21 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ name: Bun CI
2
+ on:
3
+ push:
4
+ branches: ['main']
5
+ pull_request:
6
+ jobs:
7
+ build:
8
+ name: 'Lint Frontend'
9
+ env:
10
+ PUBLIC_API_BASE_URL: ''
11
+ runs-on: ubuntu-latest
12
+ steps:
13
+ - uses: actions/checkout@v4
14
+ - name: Use Bun
15
+ uses: oven-sh/setup-bun@v1
16
+ - run: bun --version
17
+ - name: Install frontend dependencies
18
+ run: bun install --frozen-lockfile
19
+ - run: bun run lint:frontend
20
+ - run: bun run lint:types
21
+ if: success() || failure()
.github/workflows/release-pypi.yml ADDED
@@ -0,0 +1,32 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ name: Release to PyPI
2
+
3
+ on:
4
+ push:
5
+ branches:
6
+ - main # or whatever branch you want to use
7
+ - pypi-release
8
+
9
+ jobs:
10
+ release:
11
+ runs-on: ubuntu-latest
12
+ environment:
13
+ name: pypi
14
+ url: https://pypi.org/p/open-webui
15
+ permissions:
16
+ id-token: write
17
+ steps:
18
+ - name: Checkout repository
19
+ uses: actions/checkout@v4
20
+ - uses: actions/setup-node@v4
21
+ with:
22
+ node-version: 18
23
+ - uses: actions/setup-python@v5
24
+ with:
25
+ python-version: 3.11
26
+ - name: Build
27
+ run: |
28
+ python -m pip install --upgrade pip
29
+ pip install build
30
+ python -m build .
31
+ - name: Publish package distributions to PyPI
32
+ uses: pypa/gh-action-pypi-publish@release/v1
.gitignore ADDED
@@ -0,0 +1,310 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ .DS_Store
2
+ node_modules
3
+ /build
4
+ /.svelte-kit
5
+ /package
6
+ .myenv/
7
+ .env
8
+ .env.*
9
+ !.env.example
10
+ vite.config.js.timestamp-*
11
+ vite.config.ts.timestamp-*
12
+ # Byte-compiled / optimized / DLL files
13
+ __pycache__/
14
+ *.py[cod]
15
+ *$py.class
16
+
17
+ # C extensions
18
+ *.so
19
+
20
+ # Pyodide distribution
21
+ static/pyodide/*
22
+ !static/pyodide/pyodide-lock.json
23
+
24
+ # Distribution / packaging
25
+ .Python
26
+ build/
27
+ develop-eggs/
28
+ dist/
29
+ downloads/
30
+ eggs/
31
+ .eggs/
32
+ lib64/
33
+ parts/
34
+ sdist/
35
+ var/
36
+ wheels/
37
+ share/python-wheels/
38
+ *.egg-info/
39
+ .installed.cfg
40
+ *.egg
41
+ MANIFEST
42
+
43
+ # PyInstaller
44
+ # Usually these files are written by a python script from a template
45
+ # before PyInstaller builds the exe, so as to inject date/other infos into it.
46
+ *.manifest
47
+ *.spec
48
+
49
+ # Installer logs
50
+ pip-log.txt
51
+ pip-delete-this-directory.txt
52
+
53
+ # Unit test / coverage reports
54
+ htmlcov/
55
+ .tox/
56
+ .nox/
57
+ .coverage
58
+ .coverage.*
59
+ .cache
60
+ nosetests.xml
61
+ coverage.xml
62
+ *.cover
63
+ *.py,cover
64
+ .hypothesis/
65
+ .pytest_cache/
66
+ cover/
67
+
68
+ # Translations
69
+ *.mo
70
+ *.pot
71
+
72
+ # Django stuff:
73
+ *.log
74
+ local_settings.py
75
+ db.sqlite3
76
+ db.sqlite3-journal
77
+
78
+ # Flask stuff:
79
+ instance/
80
+ .webassets-cache
81
+
82
+ # Scrapy stuff:
83
+ .scrapy
84
+
85
+ # Sphinx documentation
86
+ docs/_build/
87
+
88
+ # PyBuilder
89
+ .pybuilder/
90
+ target/
91
+
92
+ # Jupyter Notebook
93
+ .ipynb_checkpoints
94
+
95
+ # IPython
96
+ profile_default/
97
+ ipython_config.py
98
+
99
+ # pyenv
100
+ # For a library or package, you might want to ignore these files since the code is
101
+ # intended to run in multiple environments; otherwise, check them in:
102
+ # .python-version
103
+
104
+ # pipenv
105
+ # According to pypa/pipenv#598, it is recommended to include Pipfile.lock in version control.
106
+ # However, in case of collaboration, if having platform-specific dependencies or dependencies
107
+ # having no cross-platform support, pipenv may install dependencies that don't work, or not
108
+ # install all needed dependencies.
109
+ #Pipfile.lock
110
+
111
+ # poetry
112
+ # Similar to Pipfile.lock, it is generally recommended to include poetry.lock in version control.
113
+ # This is especially recommended for binary packages to ensure reproducibility, and is more
114
+ # commonly ignored for libraries.
115
+ # https://python-poetry.org/docs/basic-usage/#commit-your-poetrylock-file-to-version-control
116
+ #poetry.lock
117
+
118
+ # pdm
119
+ # Similar to Pipfile.lock, it is generally recommended to include pdm.lock in version control.
120
+ #pdm.lock
121
+ # pdm stores project-wide configurations in .pdm.toml, but it is recommended to not include it
122
+ # in version control.
123
+ # https://pdm.fming.dev/#use-with-ide
124
+ .pdm.toml
125
+
126
+ # PEP 582; used by e.g. github.com/David-OConnor/pyflow and github.com/pdm-project/pdm
127
+ __pypackages__/
128
+
129
+ # Celery stuff
130
+ celerybeat-schedule
131
+ celerybeat.pid
132
+
133
+ # SageMath parsed files
134
+ *.sage.py
135
+
136
+ # Environments
137
+ .env
138
+ .venv
139
+ env/
140
+ venv/
141
+ ENV/
142
+ env.bak/
143
+ venv.bak/
144
+
145
+ # Spyder project settings
146
+ .spyderproject
147
+ .spyproject
148
+
149
+ # Rope project settings
150
+ .ropeproject
151
+
152
+ # mkdocs documentation
153
+ /site
154
+
155
+ # mypy
156
+ .mypy_cache/
157
+ .dmypy.json
158
+ dmypy.json
159
+
160
+ # Pyre type checker
161
+ .pyre/
162
+
163
+ # pytype static type analyzer
164
+ .pytype/
165
+
166
+ # Cython debug symbols
167
+ cython_debug/
168
+
169
+ # PyCharm
170
+ # JetBrains specific template is maintained in a separate JetBrains.gitignore that can
171
+ # be found at https://github.com/github/gitignore/blob/main/Global/JetBrains.gitignore
172
+ # and can be added to the global gitignore or merged into this file. For a more nuclear
173
+ # option (not recommended) you can uncomment the following to ignore the entire idea folder.
174
+ .idea/
175
+
176
+ # Logs
177
+ logs
178
+ *.log
179
+ npm-debug.log*
180
+ yarn-debug.log*
181
+ yarn-error.log*
182
+ lerna-debug.log*
183
+ .pnpm-debug.log*
184
+
185
+ # Diagnostic reports (https://nodejs.org/api/report.html)
186
+ report.[0-9]*.[0-9]*.[0-9]*.[0-9]*.json
187
+
188
+ # Runtime data
189
+ pids
190
+ *.pid
191
+ *.seed
192
+ *.pid.lock
193
+
194
+ # Directory for instrumented libs generated by jscoverage/JSCover
195
+ lib-cov
196
+
197
+ # Coverage directory used by tools like istanbul
198
+ coverage
199
+ *.lcov
200
+
201
+ # nyc test coverage
202
+ .nyc_output
203
+
204
+ # Grunt intermediate storage (https://gruntjs.com/creating-plugins#storing-task-files)
205
+ .grunt
206
+
207
+ # Bower dependency directory (https://bower.io/)
208
+ bower_components
209
+
210
+ # node-waf configuration
211
+ .lock-wscript
212
+
213
+ # Compiled binary addons (https://nodejs.org/api/addons.html)
214
+ build/Release
215
+
216
+ # Dependency directories
217
+ node_modules/
218
+ jspm_packages/
219
+
220
+ # Snowpack dependency directory (https://snowpack.dev/)
221
+ web_modules/
222
+
223
+ # TypeScript cache
224
+ *.tsbuildinfo
225
+
226
+ # Optional npm cache directory
227
+ .npm
228
+
229
+ # Optional eslint cache
230
+ .eslintcache
231
+
232
+ # Optional stylelint cache
233
+ .stylelintcache
234
+
235
+ # Microbundle cache
236
+ .rpt2_cache/
237
+ .rts2_cache_cjs/
238
+ .rts2_cache_es/
239
+ .rts2_cache_umd/
240
+
241
+ # Optional REPL history
242
+ .node_repl_history
243
+
244
+ # Output of 'npm pack'
245
+ *.tgz
246
+
247
+ # Yarn Integrity file
248
+ .yarn-integrity
249
+
250
+ # dotenv environment variable files
251
+ .env
252
+ .env.development.local
253
+ .env.test.local
254
+ .env.production.local
255
+ .env.local
256
+
257
+ # parcel-bundler cache (https://parceljs.org/)
258
+ .cache
259
+ .parcel-cache
260
+
261
+ # Next.js build output
262
+ .next
263
+ out
264
+
265
+ # Nuxt.js build / generate output
266
+ .nuxt
267
+ dist
268
+
269
+ # Gatsby files
270
+ .cache/
271
+ # Comment in the public line in if your project uses Gatsby and not Next.js
272
+ # https://nextjs.org/blog/next-9-1#public-directory-support
273
+ # public
274
+
275
+ # vuepress build output
276
+ .vuepress/dist
277
+
278
+ # vuepress v2.x temp and cache directory
279
+ .temp
280
+ .cache
281
+
282
+ # Docusaurus cache and generated files
283
+ .docusaurus
284
+
285
+ # Serverless directories
286
+ .serverless/
287
+
288
+ # FuseBox cache
289
+ .fusebox/
290
+
291
+ # DynamoDB Local files
292
+ .dynamodb/
293
+
294
+ # TernJS port file
295
+ .tern-port
296
+
297
+ # Stores VSCode versions used for testing VSCode extensions
298
+ .vscode-test
299
+
300
+ # yarn v2
301
+ .yarn/cache
302
+ .yarn/unplugged
303
+ .yarn/build-state.yml
304
+ .yarn/install-state.gz
305
+ .pnp.*
306
+
307
+ # cypress artifacts
308
+ cypress/videos
309
+ cypress/screenshots
310
+ .vscode/settings.json
.npmrc ADDED
@@ -0,0 +1 @@
 
 
1
+ engine-strict=true
.prettierignore ADDED
@@ -0,0 +1,316 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Ignore files for PNPM, NPM and YARN
2
+ pnpm-lock.yaml
3
+ package-lock.json
4
+ yarn.lock
5
+
6
+ kubernetes/
7
+
8
+ # Copy of .gitignore
9
+ .DS_Store
10
+ node_modules
11
+ /build
12
+ /.svelte-kit
13
+ /package
14
+ .env
15
+ .env.*
16
+ !.env.example
17
+ vite.config.js.timestamp-*
18
+ vite.config.ts.timestamp-*
19
+ # Byte-compiled / optimized / DLL files
20
+ __pycache__/
21
+ *.py[cod]
22
+ *$py.class
23
+
24
+ # C extensions
25
+ *.so
26
+
27
+ # Distribution / packaging
28
+ .Python
29
+ build/
30
+ develop-eggs/
31
+ dist/
32
+ downloads/
33
+ eggs/
34
+ .eggs/
35
+ lib64/
36
+ parts/
37
+ sdist/
38
+ var/
39
+ wheels/
40
+ share/python-wheels/
41
+ *.egg-info/
42
+ .installed.cfg
43
+ *.egg
44
+ MANIFEST
45
+
46
+ # PyInstaller
47
+ # Usually these files are written by a python script from a template
48
+ # before PyInstaller builds the exe, so as to inject date/other infos into it.
49
+ *.manifest
50
+ *.spec
51
+
52
+ # Installer logs
53
+ pip-log.txt
54
+ pip-delete-this-directory.txt
55
+
56
+ # Unit test / coverage reports
57
+ htmlcov/
58
+ .tox/
59
+ .nox/
60
+ .coverage
61
+ .coverage.*
62
+ .cache
63
+ nosetests.xml
64
+ coverage.xml
65
+ *.cover
66
+ *.py,cover
67
+ .hypothesis/
68
+ .pytest_cache/
69
+ cover/
70
+
71
+ # Translations
72
+ *.mo
73
+ *.pot
74
+
75
+ # Django stuff:
76
+ *.log
77
+ local_settings.py
78
+ db.sqlite3
79
+ db.sqlite3-journal
80
+
81
+ # Flask stuff:
82
+ instance/
83
+ .webassets-cache
84
+
85
+ # Scrapy stuff:
86
+ .scrapy
87
+
88
+ # Sphinx documentation
89
+ docs/_build/
90
+
91
+ # PyBuilder
92
+ .pybuilder/
93
+ target/
94
+
95
+ # Jupyter Notebook
96
+ .ipynb_checkpoints
97
+
98
+ # IPython
99
+ profile_default/
100
+ ipython_config.py
101
+
102
+ # pyenv
103
+ # For a library or package, you might want to ignore these files since the code is
104
+ # intended to run in multiple environments; otherwise, check them in:
105
+ # .python-version
106
+
107
+ # pipenv
108
+ # According to pypa/pipenv#598, it is recommended to include Pipfile.lock in version control.
109
+ # However, in case of collaboration, if having platform-specific dependencies or dependencies
110
+ # having no cross-platform support, pipenv may install dependencies that don't work, or not
111
+ # install all needed dependencies.
112
+ #Pipfile.lock
113
+
114
+ # poetry
115
+ # Similar to Pipfile.lock, it is generally recommended to include poetry.lock in version control.
116
+ # This is especially recommended for binary packages to ensure reproducibility, and is more
117
+ # commonly ignored for libraries.
118
+ # https://python-poetry.org/docs/basic-usage/#commit-your-poetrylock-file-to-version-control
119
+ #poetry.lock
120
+
121
+ # pdm
122
+ # Similar to Pipfile.lock, it is generally recommended to include pdm.lock in version control.
123
+ #pdm.lock
124
+ # pdm stores project-wide configurations in .pdm.toml, but it is recommended to not include it
125
+ # in version control.
126
+ # https://pdm.fming.dev/#use-with-ide
127
+ .pdm.toml
128
+
129
+ # PEP 582; used by e.g. github.com/David-OConnor/pyflow and github.com/pdm-project/pdm
130
+ __pypackages__/
131
+
132
+ # Celery stuff
133
+ celerybeat-schedule
134
+ celerybeat.pid
135
+
136
+ # SageMath parsed files
137
+ *.sage.py
138
+
139
+ # Environments
140
+ .env
141
+ .venv
142
+ env/
143
+ venv/
144
+ ENV/
145
+ env.bak/
146
+ venv.bak/
147
+
148
+ # Spyder project settings
149
+ .spyderproject
150
+ .spyproject
151
+
152
+ # Rope project settings
153
+ .ropeproject
154
+
155
+ # mkdocs documentation
156
+ /site
157
+
158
+ # mypy
159
+ .mypy_cache/
160
+ .dmypy.json
161
+ dmypy.json
162
+
163
+ # Pyre type checker
164
+ .pyre/
165
+
166
+ # pytype static type analyzer
167
+ .pytype/
168
+
169
+ # Cython debug symbols
170
+ cython_debug/
171
+
172
+ # PyCharm
173
+ # JetBrains specific template is maintained in a separate JetBrains.gitignore that can
174
+ # be found at https://github.com/github/gitignore/blob/main/Global/JetBrains.gitignore
175
+ # and can be added to the global gitignore or merged into this file. For a more nuclear
176
+ # option (not recommended) you can uncomment the following to ignore the entire idea folder.
177
+ .idea/
178
+
179
+ # Logs
180
+ logs
181
+ *.log
182
+ npm-debug.log*
183
+ yarn-debug.log*
184
+ yarn-error.log*
185
+ lerna-debug.log*
186
+ .pnpm-debug.log*
187
+
188
+ # Diagnostic reports (https://nodejs.org/api/report.html)
189
+ report.[0-9]*.[0-9]*.[0-9]*.[0-9]*.json
190
+
191
+ # Runtime data
192
+ pids
193
+ *.pid
194
+ *.seed
195
+ *.pid.lock
196
+
197
+ # Directory for instrumented libs generated by jscoverage/JSCover
198
+ lib-cov
199
+
200
+ # Coverage directory used by tools like istanbul
201
+ coverage
202
+ *.lcov
203
+
204
+ # nyc test coverage
205
+ .nyc_output
206
+
207
+ # Grunt intermediate storage (https://gruntjs.com/creating-plugins#storing-task-files)
208
+ .grunt
209
+
210
+ # Bower dependency directory (https://bower.io/)
211
+ bower_components
212
+
213
+ # node-waf configuration
214
+ .lock-wscript
215
+
216
+ # Compiled binary addons (https://nodejs.org/api/addons.html)
217
+ build/Release
218
+
219
+ # Dependency directories
220
+ node_modules/
221
+ jspm_packages/
222
+
223
+ # Snowpack dependency directory (https://snowpack.dev/)
224
+ web_modules/
225
+
226
+ # TypeScript cache
227
+ *.tsbuildinfo
228
+
229
+ # Optional npm cache directory
230
+ .npm
231
+
232
+ # Optional eslint cache
233
+ .eslintcache
234
+
235
+ # Optional stylelint cache
236
+ .stylelintcache
237
+
238
+ # Microbundle cache
239
+ .rpt2_cache/
240
+ .rts2_cache_cjs/
241
+ .rts2_cache_es/
242
+ .rts2_cache_umd/
243
+
244
+ # Optional REPL history
245
+ .node_repl_history
246
+
247
+ # Output of 'npm pack'
248
+ *.tgz
249
+
250
+ # Yarn Integrity file
251
+ .yarn-integrity
252
+
253
+ # dotenv environment variable files
254
+ .env
255
+ .env.development.local
256
+ .env.test.local
257
+ .env.production.local
258
+ .env.local
259
+
260
+ # parcel-bundler cache (https://parceljs.org/)
261
+ .cache
262
+ .parcel-cache
263
+
264
+ # Next.js build output
265
+ .next
266
+ out
267
+
268
+ # Nuxt.js build / generate output
269
+ .nuxt
270
+ dist
271
+
272
+ # Gatsby files
273
+ .cache/
274
+ # Comment in the public line in if your project uses Gatsby and not Next.js
275
+ # https://nextjs.org/blog/next-9-1#public-directory-support
276
+ # public
277
+
278
+ # vuepress build output
279
+ .vuepress/dist
280
+
281
+ # vuepress v2.x temp and cache directory
282
+ .temp
283
+ .cache
284
+
285
+ # Docusaurus cache and generated files
286
+ .docusaurus
287
+
288
+ # Serverless directories
289
+ .serverless/
290
+
291
+ # FuseBox cache
292
+ .fusebox/
293
+
294
+ # DynamoDB Local files
295
+ .dynamodb/
296
+
297
+ # TernJS port file
298
+ .tern-port
299
+
300
+ # Stores VSCode versions used for testing VSCode extensions
301
+ .vscode-test
302
+
303
+ # yarn v2
304
+ .yarn/cache
305
+ .yarn/unplugged
306
+ .yarn/build-state.yml
307
+ .yarn/install-state.gz
308
+ .pnp.*
309
+
310
+ # cypress artifacts
311
+ cypress/videos
312
+ cypress/screenshots
313
+
314
+
315
+
316
+ /static/*
.prettierrc ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "useTabs": true,
3
+ "singleQuote": true,
4
+ "trailingComma": "none",
5
+ "printWidth": 100,
6
+ "plugins": ["prettier-plugin-svelte"],
7
+ "pluginSearchDirs": ["."],
8
+ "overrides": [{ "files": "*.svelte", "options": { "parser": "svelte" } }]
9
+ }
CHANGELOG.md ADDED
@@ -0,0 +1,1297 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Changelog
2
+
3
+ All notable changes to this project will be documented in this file.
4
+
5
+ The format is based on [Keep a Changelog](https://keepachangelog.com/en/1.1.0/),
6
+ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0.html).
7
+
8
+ ## [0.4.2] - 2024-11-20
9
+
10
+ ### Fixed
11
+
12
+ - **📁 Knowledge Files Visibility Issue**: Resolved the bug preventing individual files in knowledge collections from displaying when referenced with '#'.
13
+ - **🔗 OpenAI Endpoint Prefix**: Fixed the issue where certain OpenAI connections that deviate from the official API spec weren’t working correctly with prefixes.
14
+ - **⚔️ Arena Model Access Control**: Corrected an issue where arena model access control settings were not being saved.
15
+ - **🔧 Usage Capability Selector**: Fixed the broken usage capabilities selector in the model editor.
16
+
17
+ ## [0.4.1] - 2024-11-19
18
+
19
+ ### Added
20
+
21
+ - **📊 Enhanced Feedback System**: Introduced a detailed 1-10 rating scale for feedback alongside thumbs up/down, preparing for more precise model fine-tuning and improving feedback quality.
22
+ - **ℹ️ Tool Descriptions on Hover**: Easily access tool descriptions by hovering over the message input, providing a smoother workflow with more context when utilizing tools.
23
+
24
+ ### Fixed
25
+
26
+ - **🗑️ Graceful Handling of Deleted Users**: Resolved an issue where deleted users caused workspace items (models, knowledge, prompts, tools) to fail, ensuring reliable workspace loading.
27
+ - **🔑 API Key Creation**: Fixed an issue preventing users from creating new API keys, restoring secure and seamless API management.
28
+ - **🔗 HTTPS Proxy Fix**: Corrected HTTPS proxy issues affecting the '/api/v1/models/' endpoint, ensuring smoother, uninterrupted model management.
29
+
30
+ ## [0.4.0] - 2024-11-19
31
+
32
+ ### Added
33
+
34
+ - **👥 User Groups**: You can now create and manage user groups, making user organization seamless.
35
+ - **🔐 Group-Based Access Control**: Set granular access to models, knowledge, prompts, and tools based on user groups, allowing for more controlled and secure environments.
36
+ - **🛠️ Group-Based User Permissions**: Easily manage workspace permissions. Grant users the ability to upload files, delete, edit, or create temporary chats, as well as define their ability to create models, knowledge, prompts, and tools.
37
+ - **🔑 LDAP Support**: Newly introduced LDAP authentication adds robust security and scalability to user management.
38
+ - **🌐 Enhanced OpenAI-Compatible Connections**: Added prefix ID support to avoid model ID clashes, with explicit model ID support for APIs lacking '/models' endpoint support, ensuring smooth operation with custom setups.
39
+ - **🔐 Ollama API Key Support**: Now manage credentials for Ollama when set behind proxies, including the option to utilize prefix ID for proper distinction across multiple Ollama instances.
40
+ - **🔄 Connection Enable/Disable Toggle**: Easily enable or disable individual OpenAI and Ollama connections as needed.
41
+ - **🎨 Redesigned Model Workspace**: Freshly redesigned to improve usability for managing models across users and groups.
42
+ - **🎨 Redesigned Prompt Workspace**: A fresh UI to conveniently organize and manage prompts.
43
+ - **🧩 Sorted Functions Workspace**: Functions are now automatically categorized by type (Action, Filter, Pipe), streamlining management.
44
+ - **💻 Redesigned Collaborative Workspace**: Enhanced support for multiple users contributing to models, knowledge, prompts, or tools, improving collaboration.
45
+ - **🔧 Auto-Selected Tools in Model Editor**: Tools enabled through the model editor are now automatically selected, whereas previously it only gave users the option to enable the tool, reducing manual steps and enhancing efficiency.
46
+ - **🔔 Web Search & Tools Indicator**: A clear indication now shows when web search or tools are active, reducing confusion.
47
+ - **🔑 Toggle API Key Auth**: Tighten security by easily enabling or disabling API key authentication option for Open WebUI.
48
+ - **🗂️ Agentic Retrieval**: Improve RAG accuracy via smart pre-processing of chat history to determine the best queries before retrieval.
49
+ - **📁 Large Text as File Option**: Optionally convert large pasted text into a file upload, keeping the chat interface cleaner.
50
+ - **🗂️ Toggle Citations for Models**: Ability to disable citations has been introduced in the model editor.
51
+ - **🔍 User Settings Search**: Quickly search for settings fields, improving ease of use and navigation.
52
+ - **🗣️ Experimental SpeechT5 TTS**: Local SpeechT5 support added for improved text-to-speech capabilities.
53
+ - **🔄 Unified Reset for Models**: A one-click option has been introduced to reset and remove all models from the Admin Settings.
54
+ - **🛠️ Initial Setup Wizard**: The setup process now explicitly informs users that they are creating an admin account during the first-time setup, ensuring clarity. Previously, users encountered the login page right away without this distinction.
55
+ - **🌐 Enhanced Translations**: Several language translations, including Ukrainian, Norwegian, and Brazilian Portuguese, were refined for better localization.
56
+
57
+ ### Fixed
58
+
59
+ - **🎥 YouTube Video Attachments**: Fixed issues preventing proper loading and attachment of YouTube videos as files.
60
+ - **🔄 Shared Chat Update**: Corrected issues where shared chats were not updating, improving collaboration consistency.
61
+ - **🔍 DuckDuckGo Rate Limit Fix**: Addressed issues with DuckDuckGo search integration, enhancing search stability and performance when operating within rate limits.
62
+ - **🧾 Citations Relevance Fix**: Adjusted the relevance percentage calculation for citations, so that Open WebUI properly reflect the accuracy of a retrieved document in RAG, ensuring users get clearer insights into sources.
63
+ - **🔑 Jina Search API Key Requirement**: Added the option to input an API key for Jina Search, ensuring smooth functionality as keys are now mandatory.
64
+
65
+ ### Changed
66
+
67
+ - **🛠️ Functions Moved to Admin Panel**: As Functions operate as advanced plugins, they are now accessible from the Admin Panel instead of the workspace.
68
+ - **🛠️ Manage Ollama Connections**: The "Models" section in Admin Settings has been relocated to Admin Settings > "Connections" > Ollama Connections. You can now manage Ollama instances via a dedicated "Manage Ollama" modal from "Connections", streamlining the setup and configuration of Ollama models.
69
+ - **📊 Base Models in Admin Settings**: Admins can now find all base models, both connections or functions, in the "Models" Admin setting. Global model accessibility can be enabled or disabled here. Models are private by default, requiring explicit permission assignment for user access.
70
+ - **📌 Sticky Model Selection for New Chats**: The model chosen from a previous chat now persists when creating a new chat. If you click "New Chat" again from the new chat page, it will revert to your default model.
71
+ - **🎨 Design Refactoring**: Overall design refinements across the platform have been made, providing a more cohesive and polished user experience.
72
+
73
+ ### Removed
74
+
75
+ - **📂 Model List Reordering**: Temporarily removed and will be reintroduced in upcoming user group settings improvements.
76
+ - **⚙️ Default Model Setting**: Removed the ability to set a default model for users, will be reintroduced with user group settings in the future.
77
+
78
+ ## [0.3.35] - 2024-10-26
79
+
80
+ ### Added
81
+
82
+ - **🌐 Translation Update**: Added translation labels in the SearchInput and CreateCollection components and updated Brazilian Portuguese translation (pt-BR)
83
+ - **📁 Robust File Handling**: Enhanced file input handling for chat. If the content extraction fails or is empty, users will now receive a clear warning, preventing silent failures and ensuring you always know what's happening with your uploads.
84
+ - **🌍 New Language Support**: Introduced Hungarian translations and updated French translations, expanding the platform's language accessibility for a more global user base.
85
+
86
+ ### Fixed
87
+
88
+ - **📚 Knowledge Base Loading Issue**: Resolved a critical bug where the Knowledge Base was not loading, ensuring smooth access to your stored documents and improving information retrieval in RAG-enhanced workflows.
89
+ - **🛠️ Tool Parameters Issue**: Fixed an error where tools were not functioning correctly when required parameters were missing, ensuring reliable tool performance and more efficient task completions.
90
+ - **🔗 Merged Response Loss in Multi-Model Chats**: Addressed an issue where responses in multi-model chat workflows were being deleted after follow-up queries, improving consistency and ensuring smoother interactions across models.
91
+
92
+ ## [0.3.34] - 2024-10-26
93
+
94
+ ### Added
95
+
96
+ - **🔧 Feedback Export Enhancements**: Feedback history data can now be exported to JSON, allowing for seamless integration in RLHF processing and further analysis.
97
+ - **🗂️ Embedding Model Lazy Loading**: Search functionality for leaderboard reranking is now more efficient, as embedding models are lazy-loaded only when needed, optimizing performance.
98
+ - **🎨 Rich Text Input Toggle**: Users can now switch back to legacy textarea input for chat if they prefer simpler text input, though rich text is still the default until deprecation.
99
+ - **🛠️ Improved Tool Calling Mechanism**: Enhanced method for parsing and calling tools, improving the reliability and robustness of tool function calls.
100
+ - **🌐 Globalization Enhancements**: Updates to internationalization (i18n) support, further refining multi-language compatibility and accuracy.
101
+
102
+ ### Fixed
103
+
104
+ - **🖥️ Folder Rename Fix for Firefox**: Addressed a persistent issue where users could not rename folders by pressing enter in Firefox, now ensuring seamless folder management across browsers.
105
+ - **🔠 Tiktoken Model Text Splitter Issue**: Resolved an issue where the tiktoken text splitter wasn’t working in Docker installations, restoring full functionality for tokenized text editing.
106
+ - **💼 S3 File Upload Issue**: Fixed a problem affecting S3 file uploads, ensuring smooth operations for those who store files on cloud storage.
107
+ - **🔒 Strict-Transport-Security Crash**: Resolved a crash when setting the Strict-Transport-Security (HSTS) header, improving stability and security enhancements.
108
+ - **🚫 OIDC Boolean Access Fix**: Addressed an issue with boolean values not being accessed correctly during OIDC logins, ensuring login reliability.
109
+ - **⚙️ Rich Text Paste Behavior**: Refined paste behavior in rich text input to make it smoother and more intuitive when pasting various content types.
110
+ - **🔨 Model Exclusion for Arena Fix**: Corrected the filter function that was not properly excluding models from the arena, improving model management.
111
+ - **🏷️ "Tags Generation Prompt" Fix**: Addressed an issue preventing custom "tags generation prompts" from registering properly, ensuring custom prompt work seamlessly.
112
+
113
+ ## [0.3.33] - 2024-10-24
114
+
115
+ ### Added
116
+
117
+ - **🏆 Evaluation Leaderboard**: Easily track your performance through a new leaderboard system where your ratings contribute to a real-time ranking based on the Elo system. Sibling responses (regenerations, many model chats) are required for your ratings to count in the leaderboard. Additionally, you can opt-in to share your feedback history and be part of the community-wide leaderboard. Expect further improvements as we refine the algorithm—help us build the best community leaderboard!
118
+ - **⚔️ Arena Model Evaluation**: Enable blind A/B testing of models directly from Admin Settings > Evaluation for a true side-by-side comparison. Ideal for pinpointing the best model for your needs.
119
+ - **🎯 Topic-Based Leaderboard**: Discover more accurate rankings with experimental topic-based reranking, which adjusts leaderboard standings based on tag similarity in feedback. Get more relevant insights based on specific topics!
120
+ - **📁 Folders Support for Chats**: Organize your chats better by grouping them into folders. Drag and drop chats between folders and export them seamlessly for easy sharing or analysis.
121
+ - **📤 Easy Chat Import via Drag & Drop**: Save time by simply dragging and dropping chat exports (JSON) directly onto the sidebar to import them into your workspace—streamlined, efficient, and intuitive!
122
+ - **📚 Enhanced Knowledge Collection**: Now, you can reference individual files from a knowledge collection—ideal for more precise Retrieval-Augmented Generations (RAG) queries and document analysis.
123
+ - **🏷️ Enhanced Tagging System**: Tags now take up less space! Utilize the new 'tag:' query system to manage, search, and organize your conversations more effectively without cluttering the interface.
124
+ - **🧠 Auto-Tagging for Chats**: Your conversations are now automatically tagged for improved organization, mirroring the efficiency of auto-generated titles.
125
+ - **🔍 Backend Chat Query System**: Chat filtering has become more efficient, now handled through the backend\*\* instead of your browser, improving search performance and accuracy.
126
+ - **🎮 Revamped Playground**: Experience a refreshed and optimized Playground for smoother testing, tweaks, and experimentation of your models and tools.
127
+ - **🧩 Token-Based Text Splitter**: Introducing token-based text splitting (tiktoken), giving you more precise control over how text is processed. Previously, only character-based splitting was available.
128
+ - **🔢 Ollama Batch Embeddings**: Leverage new batch embedding support for improved efficiency and performance with Ollama embedding models.
129
+ - **🔍 Enhanced Add Text Content Modal**: Enjoy a cleaner, more intuitive workflow for adding and curating knowledge content with an upgraded input modal from our Knowledge workspace.
130
+ - **🖋️ Rich Text Input for Chats**: Make your chat inputs more dynamic with support for rich text formatting. Your conversations just got a lot more polished and professional.
131
+ - **⚡ Faster Whisper Model Configurability**: Customize your local faster whisper model directly from the WebUI.
132
+ - **☁️ Experimental S3 Support**: Enable stateless WebUI instances with S3 support, greatly enhancing scalability and balancing heavy workloads.
133
+ - **🔕 Disable Update Toast**: Now you can streamline your workspace even further—choose to disable update notifications for a more focused experience.
134
+ - **🌟 RAG Citation Relevance Percentage**: Easily assess citation accuracy with the addition of relevance percentages in RAG results.
135
+ - **⚙️ Mermaid Copy Button**: Mermaid diagrams now come with a handy copy button, simplifying the extraction and use of diagram contents directly in your workflow.
136
+ - **🎨 UI Redesign**: Major interface redesign that will make navigation smoother, keep your focus where it matters, and ensure a modern look.
137
+
138
+ ### Fixed
139
+
140
+ - **🎙️ Voice Note Mic Stopping Issue**: Fixed the issue where the microphone stayed active after ending a voice note recording, ensuring your audio workflow runs smoothly.
141
+
142
+ ### Removed
143
+
144
+ - **👋 Goodbye Sidebar Tags**: Sidebar tag clutter is gone. We’ve shifted tag buttons to more effective query-based tag filtering for a sleeker, more agile interface.
145
+
146
+ ## [0.3.32] - 2024-10-06
147
+
148
+ ### Added
149
+
150
+ - **🔢 Workspace Enhancements**: Added a display count for models, prompts, tools, and functions in the workspace, providing a clear overview and easier management.
151
+
152
+ ### Fixed
153
+
154
+ - **🖥️ Web and YouTube Attachment Fix**: Resolved an issue where attaching web links and YouTube videos was malfunctioning, ensuring seamless integration and display within chats.
155
+ - **📞 Call Mode Activation on Landing Page**: Fixed a bug where call mode was not operational from the landing page.
156
+
157
+ ### Changed
158
+
159
+ - **🔄 URL Parameter Refinement**: Updated the 'tool_ids' URL parameter to 'tools' or 'tool-ids' for more intuitive and consistent user experience.
160
+ - **🎨 Floating Buttons Styling Update**: Refactored the styling of floating buttons to intelligently adjust to the left side when there isn't enough room on the right, improving interface usability and aesthetic.
161
+ - **🔧 Enhanced Accessibility for Floating Buttons**: Implemented the ability to close floating buttons with the 'Esc' key, making workflow smoother and more efficient for users navigating via keyboard.
162
+ - **🖇️ Updated Information URL**: Information URLs now direct users to a general release page rather than a version-specific URL, ensuring access to the latest and relevant details all in one place.
163
+ - **📦 Library Dependencies Update**: Upgraded dependencies to ensure compatibility and performance optimization for pip installs.
164
+
165
+ ## [0.3.31] - 2024-10-06
166
+
167
+ ### Added
168
+
169
+ - **📚 Knowledge Feature**: Reimagined documents feature, now more performant with a better UI for enhanced organization; includes streamlined API integration for Retrieval-Augmented Generation (RAG). Detailed documentation forthcoming: https://docs.openwebui.com/
170
+ - **🌐 New Landing Page**: Freshly designed landing page; toggle between the new UI and the classic chat UI from Settings > Interface for a personalized experience.
171
+ - **📁 Full Document Retrieval Mode**: Toggle between full document retrieval or traditional snippets by clicking on the file item. This mode enhances document capabilities and supports comprehensive tasks like summarization by utilizing the entire content instead of RAG.
172
+ - **📄 Extracted File Content Display**: View extracted content directly by clicking on the file item, simplifying file analysis.
173
+ - **🎨 Artifacts Feature**: Render web content and SVGs directly in the interface, supporting quick iterations and live changes.
174
+ - **🖊️ Editable Code Blocks**: Supercharged code blocks now allow live editing directly in the LLM response, with live reloads supported by artifacts.
175
+ - **🔧 Code Block Enhancements**: Introduced a floating copy button in code blocks to facilitate easier code copying without scrolling.
176
+ - **🔍 SVG Pan/Zoom**: Enhanced interaction with SVG images, including Mermaid diagrams, via new pan and zoom capabilities.
177
+ - **🔍 Text Select Quick Actions**: New floating buttons appear when text is highlighted in LLM responses, offering deeper interactions like "Ask a Question" or "Explain".
178
+ - **🗃️ Database Pool Configuration**: Enhanced database handling to support scalable user growth.
179
+ - **🔊 Experimental Audio Compression**: Compress audio files to navigate around the 25MB limit for OpenAI's speech-to-text processing.
180
+ - **🔍 Query Embedding**: Adjusted embedding behavior to enhance system performance by not repeating query embedding.
181
+ - **💾 Lazy Load Optimizations**: Implemented lazy loading of large dependencies to minimize initial memory usage, boosting performance.
182
+ - **🍏 Apple Touch Icon Support**: Optimizes the display of icons for web bookmarks on Apple mobile devices.
183
+ - **🔽 Expandable Content Markdown Support**: Introducing 'details', 'summary' tag support for creating expandable content sections in markdown, facilitating cleaner, organized documentation and interactive content display.
184
+
185
+ ### Fixed
186
+
187
+ - **🔘 Action Button Issue**: Resolved a bug where action buttons were not functioning, enhancing UI reliability.
188
+ - **🔄 Multi-Model Chat Loop**: Fixed an infinite loop issue in multi-model chat environments, ensuring smoother chat operations.
189
+ - **📄 Chat PDF/TXT Export Issue**: Resolved problems with exporting chat logs to PDF and TXT formats.
190
+ - **🔊 Call to Text-to-Speech Issues**: Rectified problems with text-to-speech functions to improve audio interactions.
191
+
192
+ ### Changed
193
+
194
+ - **⚙️ Endpoint Renaming**: Renamed 'rag' endpoints to 'retrieval' for clearer function description.
195
+ - **🎨 Styling and Interface Updates**: Multiple refinements across the platform to enhance visual appeal and user interaction.
196
+
197
+ ### Removed
198
+
199
+ - **🗑️ Deprecated 'DOCS_DIR'**: Removed the outdated 'docs_dir' variable in favor of more direct file management solutions, with direct file directory syncing and API uploads for a more integrated experience.
200
+
201
+ ## [0.3.30] - 2024-09-26
202
+
203
+ ### Fixed
204
+
205
+ - **🍞 Update Available Toast Dismissal**: Enhanced user experience by ensuring that once the update available notification is dismissed, it won't reappear for 24 hours.
206
+ - **📋 Ollama /embed Form Data**: Adjusted the integration inaccuracies in the /embed form data to ensure it perfectly matches with Ollama's specifications.
207
+ - **🔧 O1 Max Completion Tokens Issue**: Resolved compatibility issues with OpenAI's o1 models max_completion_tokens param to ensure smooth operation.
208
+ - **🔄 Pip Install Database Issue**: Fixed a critical issue where database changes during pip installations were reverting and not saving chat logs, now ensuring data persistence and reliability in chat operations.
209
+ - **🏷️ Chat Rename Tab Update**: Fixed the functionality to change the web browser's tab title simultaneously when a chat is renamed, keeping tab titles consistent.
210
+
211
+ ## [0.3.29] - 2023-09-25
212
+
213
+ ### Fixed
214
+
215
+ - **🔧 KaTeX Rendering Improvement**: Resolved specific corner cases in KaTeX rendering to enhance the display of complex mathematical notation.
216
+ - **📞 'Call' URL Parameter Fix**: Corrected functionality for 'call' URL search parameter ensuring reliable activation of voice calls through URL triggers.
217
+ - **🔄 Configuration Reset Fix**: Fixed the RESET_CONFIG_ON_START to ensure settings revert to default correctly upon each startup, improving reliability in configuration management.
218
+ - **🌍 Filter Outlet Hook Fix**: Addressed issues in the filter outlet hook, ensuring all filter functions operate as intended.
219
+
220
+ ## [0.3.28] - 2024-09-24
221
+
222
+ ### Fixed
223
+
224
+ - **🔍 Web Search Functionality**: Corrected an issue where the web search option was not functioning properly.
225
+
226
+ ## [0.3.27] - 2024-09-24
227
+
228
+ ### Fixed
229
+
230
+ - **🔄 Periodic Cleanup Error Resolved**: Fixed a critical RuntimeError related to the 'periodic_usage_pool_cleanup' coroutine, ensuring smooth and efficient performance post-pip install, correcting a persisting issue from version 0.3.26.
231
+ - **📊 Enhanced LaTeX Rendering**: Improved rendering for LaTeX content, enhancing clarity and visual presentation in documents and mathematical models.
232
+
233
+ ## [0.3.26] - 2024-09-24
234
+
235
+ ### Fixed
236
+
237
+ - **🔄 Event Loop Error Resolution**: Addressed a critical error where a missing running event loop caused 'periodic_usage_pool_cleanup' to fail with pip installs. This fix ensures smoother and more reliable updates and installations, enhancing overall system stability.
238
+
239
+ ## [0.3.25] - 2024-09-24
240
+
241
+ ### Fixed
242
+
243
+ - **🖼️ Image Generation Functionality**: Resolved an issue where image generation was not functioning, restoring full capability for visual content creation.
244
+ - **⚖️ Rate Response Corrections**: Addressed a problem where rate responses were not working, ensuring reliable feedback mechanisms are operational.
245
+
246
+ ## [0.3.24] - 2024-09-24
247
+
248
+ ### Added
249
+
250
+ - **🚀 Rendering Optimization**: Significantly improved message rendering performance, enhancing user experience and webui responsiveness.
251
+ - **💖 Favorite Response Feature in Chat Overview**: Users can now mark responses as favorite directly from the chat overview, enhancing ease of retrieval and organization of preferred responses.
252
+ - **💬 Create Message Pairs with Shortcut**: Implemented creation of new message pairs using Cmd/Ctrl+Shift+Enter, making conversation editing faster and more intuitive.
253
+ - **🌍 Expanded User Prompt Variables**: Added weekday, timezone, and language information variables to user prompts to match system prompt variables.
254
+ - **🎵 Enhanced Audio Support**: Now includes support for 'audio/x-m4a' files, broadening compatibility with audio content within the platform.
255
+ - **🔏 Model URL Search Parameter**: Added an ability to select a model directly via URL parameters, streamlining navigation and model access.
256
+ - **📄 Enhanced PDF Citations**: PDF citations now open at the associated page, streamlining reference checks and document handling.
257
+ - **🔧Use of Redis in Sockets**: Enhanced socket implementation to fully support Redis, enabling effective stateless instances suitable for scalable load balancing.
258
+ - **🌍 Stream Individual Model Responses**: Allows specific models to have individualized streaming settings, enhancing performance and customization.
259
+ - **🕒 Display Model Hash and Last Modified Timestamp for Ollama Models**: Provides critical model details directly in the Models workspace for enhanced tracking.
260
+ - **❗ Update Info Notification for Admins**: Ensures administrators receive immediate updates upon login, keeping them informed of the latest changes and system statuses.
261
+
262
+ ### Fixed
263
+
264
+ - **🗑️ Temporary File Handling On Windows**: Fixed an issue causing errors when accessing a temporary file being used by another process, Tools & Functions should now work as intended.
265
+ - **🔓 Authentication Toggle Issue**: Resolved the malfunction where setting 'WEBUI_AUTH=False' did not appropriately disable authentication, ensuring that user experience and system security settings function as configured.
266
+ - **🔧 Save As Copy Issue for Many Model Chats**: Resolved an error preventing users from save messages as copies in many model chats.
267
+ - **🔒 Sidebar Closure on Mobile**: Resolved an issue where the mobile sidebar remained open after menu engagement, improving user interface responsivity and comfort.
268
+ - **🛡️ Tooltip XSS Vulnerability**: Resolved a cross-site scripting (XSS) issue within tooltips, ensuring enhanced security and data integrity during user interactions.
269
+
270
+ ### Changed
271
+
272
+ - **↩️ Deprecated Interface Stream Response Settings**: Moved to advanced parameters to streamline interface settings and enhance user clarity.
273
+ - **⚙️ Renamed 'speedRate' to 'playbackRate'**: Standardizes terminology, improving usability and understanding in media settings.
274
+
275
+ ## [0.3.23] - 2024-09-21
276
+
277
+ ### Added
278
+
279
+ - **🚀 WebSocket Redis Support**: Enhanced load balancing capabilities for multiple instance setups, promoting better performance and reliability in WebUI.
280
+ - **🔧 Adjustable Chat Controls**: Introduced width-adjustable chat controls, enabling a personalized and more comfortable user interface.
281
+ - **🌎 i18n Updates**: Improved and updated the Chinese translations.
282
+
283
+ ### Fixed
284
+
285
+ - **🌐 Task Model Unloading Issue**: Modified task handling to use the Ollama /api/chat endpoint instead of OpenAI compatible endpoint, ensuring models stay loaded and ready with custom parameters, thus minimizing delays in task execution.
286
+ - **📝 Title Generation Fix for OpenAI Compatible APIs**: Resolved an issue preventing the generation of titles, enhancing consistency and reliability when using multiple API providers.
287
+ - **🗃️ RAG Duplicate Collection Issue**: Fixed a bug causing repeated processing of the same uploaded file. Now utilizes indexed files to prevent unnecessary duplications, optimizing resource usage.
288
+ - **🖼️ Image Generation Enhancement**: Refactored OpenAI image generation endpoint to be asynchronous, preventing the WebUI from becoming unresponsive during processing, thus enhancing user experience.
289
+ - **🔓 Downgrade Authlib**: Reverted Authlib to version 1.3.1 to address and resolve issues concerning OAuth functionality.
290
+
291
+ ### Changed
292
+
293
+ - **🔍 Improved Message Interaction**: Enhanced the message node interface to allow for easier focus redirection with a simple click, streamlining user interaction.
294
+ - **✨ Styling Refactor**: Updated WebUI styling for a cleaner, more modern look, enhancing user experience across the platform.
295
+
296
+ ## [0.3.22] - 2024-09-19
297
+
298
+ ### Added
299
+
300
+ - **⭐ Chat Overview**: Introducing a node-based interactive messages diagram for improved visualization of conversation flows.
301
+ - **🔗 Multiple Vector DB Support**: Now supports multiple vector databases, including the newly added Milvus support. Community contributions for additional database support are highly encouraged!
302
+ - **📡 Experimental Non-Stream Chat Completion**: Experimental feature allowing the use of OpenAI o1 models, which do not support streaming, ensuring more versatile model deployment.
303
+ - **🔍 Experimental Colbert-AI Reranker Integration**: Added support for "jinaai/jina-colbert-v2" as a reranker, enhancing search relevance and accuracy. Note: it may not function at all on low-spec computers.
304
+ - **🕸️ ENABLE_WEBSOCKET_SUPPORT**: Added environment variable for instances to ignore websocket upgrades, stabilizing connections on platforms with websocket issues.
305
+ - **🔊 Azure Speech Service Integration**: Added support for Azure Speech services for Text-to-Speech (TTS).
306
+ - **🎚️ Customizable Playback Speed**: Playback speed control is now available in Call mode settings, allowing users to adjust audio playback speed to their preferences.
307
+ - **🧠 Enhanced Error Messaging**: System now displays helpful error messages directly to users during chat completion issues.
308
+ - **📂 Save Model as Transparent PNG**: Model profile images are now saved as PNGs, supporting transparency and improving visual integration.
309
+ - **📱 iPhone Compatibility Adjustments**: Added padding to accommodate the iPhone navigation bar, improving UI display on these devices.
310
+ - **🔗 Secure Response Headers**: Implemented security response headers, bolstering web application security.
311
+ - **🔧 Enhanced AUTOMATIC1111 Settings**: Users can now configure 'CFG Scale', 'Sampler', and 'Scheduler' parameters directly in the admin settings, enhancing workflow flexibility without source code modifications.
312
+ - **🌍 i18n Updates**: Enhanced translations for Chinese, Ukrainian, Russian, and French, fostering a better localized experience.
313
+
314
+ ### Fixed
315
+
316
+ - **🛠️ Chat Message Deletion**: Resolved issues with chat message deletion, ensuring a smoother user interaction and system stability.
317
+ - **🔢 Ordered List Numbering**: Fixed the incorrect ordering in lists.
318
+
319
+ ### Changed
320
+
321
+ - **🎨 Transparent Icon Handling**: Allowed model icons to be displayed on transparent backgrounds, improving UI aesthetics.
322
+ - **📝 Improved RAG Template**: Enhanced Retrieval-Augmented Generation template, optimizing context handling and error checking for more precise operation.
323
+
324
+ ## [0.3.21] - 2024-09-08
325
+
326
+ ### Added
327
+
328
+ - **📊 Document Count Display**: Now displays the total number of documents directly within the dashboard.
329
+ - **🚀 Ollama Embed API Endpoint**: Enabled /api/embed endpoint proxy support.
330
+
331
+ ### Fixed
332
+
333
+ - **��� Docker Launch Issue**: Resolved the problem preventing Open-WebUI from launching correctly when using Docker.
334
+
335
+ ### Changed
336
+
337
+ - **🔍 Enhanced Search Prompts**: Improved the search query generation prompts for better accuracy and user interaction, enhancing the overall search experience.
338
+
339
+ ## [0.3.20] - 2024-09-07
340
+
341
+ ### Added
342
+
343
+ - **🌐 Translation Update**: Updated Catalan translations to improve user experience for Catalan speakers.
344
+
345
+ ### Fixed
346
+
347
+ - **📄 PDF Download**: Resolved a configuration issue with fonts directory, ensuring PDFs are now downloaded with the correct formatting.
348
+ - **🛠️ Installation of Tools & Functions Requirements**: Fixed a bug where necessary requirements for tools and functions were not properly installing.
349
+ - **🔗 Inline Image Link Rendering**: Enabled rendering of images directly from links in chat.
350
+ - **📞 Post-Call User Interface Cleanup**: Adjusted UI behavior to automatically close chat controls after a voice call ends, reducing screen clutter.
351
+ - **🎙️ Microphone Deactivation Post-Call**: Addressed an issue where the microphone remained active after calls.
352
+ - **✍️ Markdown Spacing Correction**: Corrected spacing in Markdown rendering, ensuring text appears neatly and as expected.
353
+ - **🔄 Message Re-rendering**: Fixed an issue causing all response messages to re-render with each new message, now improving chat performance.
354
+
355
+ ### Changed
356
+
357
+ - **🌐 Refined Web Search Integration**: Deprecated the Search Query Generation Prompt threshold; introduced a toggle button for "Enable Web Search Query Generation" allowing users to opt-in to using web search more judiciously.
358
+ - **📝 Default Prompt Templates Update**: Emptied environment variable templates for search and title generation now default to the Open WebUI default prompt templates, simplifying configuration efforts.
359
+
360
+ ## [0.3.19] - 2024-09-05
361
+
362
+ ### Added
363
+
364
+ - **🌐 Translation Update**: Improved Chinese translations.
365
+
366
+ ### Fixed
367
+
368
+ - **📂 DATA_DIR Overriding**: Fixed an issue to avoid overriding DATA_DIR, preventing errors when directories are set identically, ensuring smoother operation and data management.
369
+ - **🛠️ Frontmatter Extraction**: Fixed the extraction process for frontmatter in tools and functions.
370
+
371
+ ### Changed
372
+
373
+ - **🎨 UI Styling**: Refined the user interface styling for enhanced visual coherence and user experience.
374
+
375
+ ## [0.3.18] - 2024-09-04
376
+
377
+ ### Added
378
+
379
+ - **🛠️ Direct Database Execution for Tools & Functions**: Enhanced the execution of Python files for tools and functions, now directly loading from the database for a more streamlined backend process.
380
+
381
+ ### Fixed
382
+
383
+ - **🔄 Automatic Rewrite of Import Statements in Tools & Functions**: Tool and function scripts that import 'utils', 'apps', 'main', 'config' will now automatically rename these with 'open_webui.', ensuring compatibility and consistency across different modules.
384
+ - **🎨 Styling Adjustments**: Minor fixes in the visual styling to improve user experience and interface consistency.
385
+
386
+ ## [0.3.17] - 2024-09-04
387
+
388
+ ### Added
389
+
390
+ - **🔄 Import/Export Configuration**: Users can now import and export webui configurations from admin settings > Database, simplifying setup replication across systems.
391
+ - **🌍 Web Search via URL Parameter**: Added support for activating web search directly through URL by setting 'web-search=true'.
392
+ - **🌐 SearchApi Integration**: Added support for SearchApi as an alternative web search provider, enhancing search capabilities within the platform.
393
+ - **🔍 Literal Type Support in Tools**: Tools now support the Literal type.
394
+ - **🌍 Updated Translations**: Improved translations for Chinese, Ukrainian, and Catalan.
395
+
396
+ ### Fixed
397
+
398
+ - **🔧 Pip Install Issue**: Resolved the issue where pip install failed due to missing 'alembic.ini', ensuring smoother installation processes.
399
+ - **🌃 Automatic Theme Update**: Fixed an issue where the color theme did not update dynamically with system changes.
400
+ - **🛠️ User Agent in ComfyUI**: Added default headers in ComfyUI to fix access issues, improving reliability in network communications.
401
+ - **🔄 Missing Chat Completion Response Headers**: Ensured proper return of proxied response headers during chat completion, improving API reliability.
402
+ - **🔗 Websocket Connection Prioritization**: Modified socket.io configuration to prefer websockets and more reliably fallback to polling, enhancing connection stability.
403
+ - **🎭 Accessibility Enhancements**: Added missing ARIA labels for buttons, improving accessibility for visually impaired users.
404
+ - **⚖️ Advanced Parameter**: Fixed an issue ensuring that advanced parameters are correctly applied in all scenarios, ensuring consistent behavior of user-defined settings.
405
+
406
+ ### Changed
407
+
408
+ - **🔁 Namespace Reorganization**: Reorganized all Python files under the 'open_webui' namespace to streamline the project structure and improve maintainability. Tools and functions importing from 'utils' should now use 'open_webui.utils'.
409
+ - **🚧 Dependency Updates**: Updated several backend dependencies like 'aiohttp', 'authlib', 'duckduckgo-search', 'flask-cors', and 'langchain' to their latest versions, enhancing performance and security.
410
+
411
+ ## [0.3.16] - 2024-08-27
412
+
413
+ ### Added
414
+
415
+ - **🚀 Config DB Migration**: Migrated configuration handling from config.json to the database, enabling high-availability setups and load balancing across multiple Open WebUI instances.
416
+ - **🔗 Call Mode Activation via URL**: Added a 'call=true' URL search parameter enabling direct shortcuts to activate call mode, enhancing user interaction on mobile devices.
417
+ - **✨ TTS Content Control**: Added functionality to control how message content is segmented for Text-to-Speech (TTS) generation requests, allowing for more flexible speech output options.
418
+ - **😄 Show Knowledge Search Status**: Enhanced model usage transparency by displaying status when working with knowledge-augmented models, helping users understand the system's state during queries.
419
+ - **👆 Click-to-Copy for Codespan**: Enhanced interactive experience in the WebUI by allowing users to click to copy content from code spans directly.
420
+ - **🚫 API User Blocking via Model Filter**: Introduced the ability to block API users based on customized model filters, enhancing security and control over API access.
421
+ - **🎬 Call Overlay Styling**: Adjusted call overlay styling on large screens to not cover the entire interface, but only the chat control area, for a more unobtrusive interaction experience.
422
+
423
+ ### Fixed
424
+
425
+ - **🔧 LaTeX Rendering Issue**: Addressed an issue that affected the correct rendering of LaTeX.
426
+ - **📁 File Leak Prevention**: Resolved the issue of uploaded files mistakenly being accessible across user chats.
427
+ - **🔧 Pipe Functions with '**files**' Param**: Fixed issues with '**files**' parameter not functioning correctly in pipe functions.
428
+ - **📝 Markdown Processing for RAG**: Fixed issues with processing Markdown in files.
429
+ - **🚫 Duplicate System Prompts**: Fixed bugs causing system prompts to duplicate.
430
+
431
+ ### Changed
432
+
433
+ - **🔋 Wakelock Permission**: Optimized the activation of wakelock to only engage during call mode, conserving device resources and improving battery performance during idle periods.
434
+ - **🔍 Content-Type for Ollama Chats**: Added 'application/x-ndjson' content-type to '/api/chat' endpoint responses to match raw Ollama responses.
435
+ - **✋ Disable Signups Conditionally**: Implemented conditional logic to disable sign-ups when 'ENABLE_LOGIN_FORM' is set to false.
436
+
437
+ ## [0.3.15] - 2024-08-21
438
+
439
+ ### Added
440
+
441
+ - **🔗 Temporary Chat Activation**: Integrated a new URL parameter 'temporary-chat=true' to enable temporary chat sessions directly through the URL.
442
+ - **🌄 ComfyUI Seed Node Support**: Introduced seed node support in ComfyUI for image generation, allowing users to specify node IDs for randomized seed assignment.
443
+
444
+ ### Fixed
445
+
446
+ - **🛠️ Tools and Functions**: Resolved a critical issue where Tools and Functions were not properly functioning, restoring full capability and reliability to these essential features.
447
+ - **🔘 Chat Action Button in Many Model Chat**: Fixed the malfunctioning of chat action buttons in many model chat environments, ensuring a smoother and more responsive user interaction.
448
+ - **⏪ Many Model Chat Compatibility**: Restored backward compatibility for many model chats.
449
+
450
+ ## [0.3.14] - 2024-08-21
451
+
452
+ ### Added
453
+
454
+ - **🛠️ Custom ComfyUI Workflow**: Deprecating several older environment variables, this enhancement introduces a new, customizable workflow for a more tailored user experience.
455
+ - **🔀 Merge Responses in Many Model Chat**: Enhances the dialogue by merging responses from multiple models into a single, coherent reply, improving the interaction quality in many model chats.
456
+ - **✅ Multiple Instances of Same Model in Chats**: Enhanced many model chat to support adding multiple instances of the same model.
457
+ - **🔧 Quick Actions in Model Workspace**: Enhanced Shift key quick actions for hiding/unhiding and deleting models, facilitating a smoother workflow.
458
+ - **🗨️ Markdown Rendering in User Messages**: User messages are now rendered in Markdown, enhancing readability and interaction.
459
+ - **💬 Temporary Chat Feature**: Introduced a temporary chat feature, deprecating the old chat history setting to enhance user interaction flexibility.
460
+ - **🖋️ User Message Editing**: Enhanced the user chat editing feature to allow saving changes without sending, providing more flexibility in message management.
461
+ - **🛡️ Security Enhancements**: Various security improvements implemented across the platform to ensure safer user experiences.
462
+ - **🌍 Updated Translations**: Enhanced translations for Chinese, Ukrainian, and Bahasa Malaysia, improving localization and user comprehension.
463
+
464
+ ### Fixed
465
+
466
+ - **📑 Mermaid Rendering Issue**: Addressed issues with Mermaid chart rendering to ensure clean and clear visual data representation.
467
+ - **🎭 PWA Icon Maskability**: Fixed the Progressive Web App icon to be maskable, ensuring proper display on various device home screens.
468
+ - **🔀 Cloned Model Chat Freezing Issue**: Fixed a bug where cloning many model chats would cause freezing, enhancing stability and responsiveness.
469
+ - **🔍 Generic Error Handling and Refinements**: Various minor fixes and refinements to address previously untracked issues, ensuring smoother operations.
470
+
471
+ ### Changed
472
+
473
+ - **🖼️ Image Generation Refactor**: Overhauled image generation processes for improved efficiency and quality.
474
+ - **🔨 Refactor Tool and Function Calling**: Refactored tool and function calling mechanisms for improved clarity and maintainability.
475
+ - **🌐 Backend Library Updates**: Updated critical backend libraries including SQLAlchemy, uvicorn[standard], faster-whisper, bcrypt, and boto3 for enhanced performance and security.
476
+
477
+ ### Removed
478
+
479
+ - **🚫 Deprecated ComfyUI Environment Variables**: Removed several outdated environment variables related to ComfyUI settings, simplifying configuration management.
480
+
481
+ ## [0.3.13] - 2024-08-14
482
+
483
+ ### Added
484
+
485
+ - **🎨 Enhanced Markdown Rendering**: Significant improvements in rendering markdown, ensuring smooth and reliable display of LaTeX and Mermaid charts, enhancing user experience with more robust visual content.
486
+ - **🔄 Auto-Install Tools & Functions Python Dependencies**: For 'Tools' and 'Functions', Open WebUI now automatically install extra python requirements specified in the frontmatter, streamlining setup processes and customization.
487
+ - **🌀 OAuth Email Claim Customization**: Introduced an 'OAUTH_EMAIL_CLAIM' variable to allow customization of the default "email" claim within OAuth configurations, providing greater flexibility in authentication processes.
488
+ - **📶 Websocket Reconnection**: Enhanced reliability with the capability to automatically reconnect when a websocket is closed, ensuring consistent and stable communication.
489
+ - **🤳 Haptic Feedback on Support Devices**: Android devices now support haptic feedback for an immersive tactile experience during certain interactions.
490
+
491
+ ### Fixed
492
+
493
+ - **🛠️ ComfyUI Performance Improvement**: Addressed an issue causing FastAPI to stall when ComfyUI image generation was active; now runs in a separate thread to prevent UI unresponsiveness.
494
+ - **🔀 Session Handling**: Fixed an issue mandating session_id on client-side to ensure smoother session management and transitions.
495
+ - **🖋️ Minor Bug Fixes and Format Corrections**: Various minor fixes including typo corrections, backend formatting improvements, and test amendments enhancing overall system stability and performance.
496
+
497
+ ### Changed
498
+
499
+ - **🚀 Migration to SvelteKit 2**: Upgraded the underlying framework to SvelteKit version 2, offering enhanced speed, better code structure, and improved deployment capabilities.
500
+ - **🧹 General Cleanup and Refactoring**: Performed broad cleanup and refactoring across the platform, improving code efficiency and maintaining high standards of code health.
501
+ - **🚧 Integration Testing Improvements**: Modified how Cypress integration tests detect chat messages and updated sharing tests for better reliability and accuracy.
502
+ - **📁 Standardized '.safetensors' File Extension**: Renamed the '.sft' file extension to '.safetensors' for ComfyUI workflows, standardizing file formats across the platform.
503
+
504
+ ### Removed
505
+
506
+ - **🗑️ Deprecated Frontend Functions**: Removed frontend functions that were migrated to backend to declutter the codebase and reduce redundancy.
507
+
508
+ ## [0.3.12] - 2024-08-07
509
+
510
+ ### Added
511
+
512
+ - **🔄 Sidebar Infinite Scroll**: Added an infinite scroll feature in the sidebar for more efficient chat navigation, reducing load times and enhancing user experience.
513
+ - **🚀 Enhanced Markdown Rendering**: Support for rendering all code blocks and making images clickable for preview; codespan styling is also enhanced to improve readability and user interaction.
514
+ - **🔒 Admin Shared Chat Visibility**: Admins no longer have default visibility over shared chats when ENABLE_ADMIN_CHAT_ACCESS is set to false, tightening security and privacy settings for users.
515
+ - **🌍 Language Updates**: Added Malay (Bahasa Malaysia) translation and updated Catalan and Traditional Chinese translations to improve accessibility for more users.
516
+
517
+ ### Fixed
518
+
519
+ - **📊 Markdown Rendering Issues**: Resolved issues with markdown rendering to ensure consistent and correct display across components.
520
+ - **🛠️ Styling Issues**: Multiple fixes applied to styling throughout the application, improving the overall visual experience and interface consistency.
521
+ - **🗃️ Modal Handling**: Fixed an issue where modals were not closing correctly in various model chat scenarios, enhancing usability and interface reliability.
522
+ - **📄 Missing OpenAI Usage Information**: Resolved issues where usage statistics for OpenAI services were not being correctly displayed, ensuring users have access to crucial data for managing and monitoring their API consumption.
523
+ - **🔧 Non-Streaming Support for Functions Plugin**: Fixed a functionality issue with the Functions plugin where non-streaming operations were not functioning as intended, restoring full capabilities for async and sync integration within the platform.
524
+ - **🔄 Environment Variable Type Correction (COMFYUI_FLUX_FP8_CLIP)**: Corrected the data type of the 'COMFYUI_FLUX_FP8_CLIP' environment variable from string to boolean, ensuring environment settings apply correctly and enhance configuration management.
525
+
526
+ ### Changed
527
+
528
+ - **🔧 Backend Dependency Updates**: Updated several backend dependencies such as boto3, pypdf, python-pptx, validators, and black, ensuring up-to-date security and performance optimizations.
529
+
530
+ ## [0.3.11] - 2024-08-02
531
+
532
+ ### Added
533
+
534
+ - **📊 Model Information Display**: Added visuals for model selection, including images next to model names for more intuitive navigation.
535
+ - **🗣 ElevenLabs Voice Adaptations**: Voice enhancements including support for ElevenLabs voice ID by name for personalized vocal interactions.
536
+ - **⌨️ Arrow Keys Model Selection**: Users can now use arrow keys for quicker model selection, enhancing accessibility.
537
+ - **🔍 Fuzzy Search in Model Selector**: Enhanced model selector with fuzzy search to locate models swiftly, including descriptions.
538
+ - **🕹️ ComfyUI Flux Image Generation**: Added support for the new Flux image gen model; introduces environment controls like weight precision and CLIP model options in Settings.
539
+ - **💾 Display File Size for Uploads**: Enhanced file interface now displays file size, preparing for upcoming upload restrictions.
540
+ - **🎚️ Advanced Params "Min P"**: Added 'Min P' parameter in the advanced settings for customized model precision control.
541
+ - **🔒 Enhanced OAuth**: Introduced custom redirect URI support for OAuth behind reverse proxies, enabling safer authentication processes.
542
+ - **🖥 Enhanced Latex Rendering**: Adjustments made to latex rendering processes, now accurately detecting and presenting latex inputs from text.
543
+ - **🌐 Internationalization**: Enhanced with new Romanian and updated Vietnamese and Ukrainian translations, helping broaden accessibility for international users.
544
+
545
+ ### Fixed
546
+
547
+ - **🔧 Tags Handling in Document Upload**: Tags are now properly sent to the upload document handler, resolving issues with missing metadata.
548
+ - **🖥️ Sensitive Input Fields**: Corrected browser misinterpretation of secure input fields, preventing misclassification as password fields.
549
+ - **📂 Static Path Resolution in PDF Generation**: Fixed static paths that adjust dynamically to prevent issues across various environments.
550
+
551
+ ### Changed
552
+
553
+ - **🎨 UI/UX Styling Enhancements**: Multiple minor styling updates for a cleaner and more intuitive user interface.
554
+ - **🚧 Refactoring Various Components**: Numerous refactoring changes across styling, file handling, and function simplifications for clarity and performance.
555
+ - **🎛️ User Valves Management**: Moved user valves from settings to direct chat controls for more user-friendly access during interactions.
556
+
557
+ ### Removed
558
+
559
+ - **⚙️ Health Check Logging**: Removed verbose logging from the health checking processes to declutter logs and improve backend performance.
560
+
561
+ ## [0.3.10] - 2024-07-17
562
+
563
+ ### Fixed
564
+
565
+ - **🔄 Improved File Upload**: Addressed the issue where file uploads lacked animation.
566
+ - **💬 Chat Continuity**: Fixed a problem where existing chats were not functioning properly in some instances.
567
+ - **🗂️ Chat File Reset**: Resolved the issue of chat files not resetting for new conversations, now ensuring a clean slate for each chat session.
568
+ - **📁 Document Workspace Uploads**: Corrected the handling of document uploads in the workspace using the Files API.
569
+
570
+ ## [0.3.9] - 2024-07-17
571
+
572
+ ### Added
573
+
574
+ - **📁 Files Chat Controls**: We've reverted to the old file handling behavior where uploaded files are always included. You can now manage files directly within the chat controls section, giving you the ability to remove files as needed.
575
+ - **🔧 "Action" Function Support**: Introducing a new "Action" function to write custom buttons to the message toolbar. This feature enables more interactive messaging, with documentation coming soon.
576
+ - **📜 Citations Handling**: For newly uploaded files in documents workspace, citations will now display the actual filename. Additionally, you can click on these filenames to open the file in a new tab for easier access.
577
+ - **🛠️ Event Emitter and Call Updates**: Enhanced 'event_emitter' to allow message replacement and 'event_call' to support text input for Tools and Functions. Detailed documentation will be provided shortly.
578
+ - **🎨 Styling Refactor**: Various styling updates for a cleaner and more cohesive user interface.
579
+ - **🌐 Enhanced Translations**: Improved translations for Catalan, Ukrainian, and Brazilian Portuguese.
580
+
581
+ ### Fixed
582
+
583
+ - **🔧 Chat Controls Priority**: Resolved an issue where Chat Controls values were being overridden by model information parameters. The priority is now Chat Controls, followed by Global Settings, then Model Settings.
584
+ - **🪲 Debug Logs**: Fixed an issue where debug logs were not being logged properly.
585
+ - **🔑 Automatic1111 Auth Key**: The auth key for Automatic1111 is no longer required.
586
+ - **📝 Title Generation**: Ensured that the title generation runs only once, even when multiple models are in a chat.
587
+ - **✅ Boolean Values in Params**: Added support for boolean values in parameters.
588
+ - **🖼️ Files Overlay Styling**: Fixed the styling issue with the files overlay.
589
+
590
+ ### Changed
591
+
592
+ - **⬆️ Dependency Updates**
593
+ - Upgraded 'pydantic' from version 2.7.1 to 2.8.2.
594
+ - Upgraded 'sqlalchemy' from version 2.0.30 to 2.0.31.
595
+ - Upgraded 'unstructured' from version 0.14.9 to 0.14.10.
596
+ - Upgraded 'chromadb' from version 0.5.3 to 0.5.4.
597
+
598
+ ## [0.3.8] - 2024-07-09
599
+
600
+ ### Added
601
+
602
+ - **💬 Chat Controls**: Easily adjust parameters for each chat session, offering more precise control over your interactions.
603
+ - **📌 Pinned Chats**: Support for pinned chats, allowing you to keep important conversations easily accessible.
604
+ - **📄 Apache Tika Integration**: Added support for using Apache Tika as a document loader, enhancing document processing capabilities.
605
+ - **🛠️ Custom Environment for OpenID Claims**: Allows setting custom claims for OpenID, providing more flexibility in user authentication.
606
+ - **🔧 Enhanced Tools & Functions API**: Introduced 'event_emitter' and 'event_call', now you can also add citations for better documentation and tracking. Detailed documentation will be provided on our documentation website.
607
+ - **↔️ Sideways Scrolling in Settings**: Settings tabs container now supports horizontal scrolling for easier navigation.
608
+ - **🌑 Darker OLED Theme**: Includes a new, darker OLED theme and improved styling for the light theme, enhancing visual appeal.
609
+ - **🌐 Language Updates**: Updated translations for Indonesian, German, French, and Catalan languages, expanding accessibility.
610
+
611
+ ### Fixed
612
+
613
+ - **⏰ OpenAI Streaming Timeout**: Resolved issues with OpenAI streaming response using the 'AIOHTTP_CLIENT_TIMEOUT' setting, ensuring reliable performance.
614
+ - **💡 User Valves**: Fixed malfunctioning user valves, ensuring proper functionality.
615
+ - **🔄 Collapsible Components**: Addressed issues with collapsible components not working, restoring expected behavior.
616
+
617
+ ### Changed
618
+
619
+ - **🗃️ Database Backend**: Switched from Peewee to SQLAlchemy for improved concurrency support, enhancing database performance.
620
+ - **⬆️ ChromaDB Update**: Upgraded to version 0.5.3. Ensure your remote ChromaDB instance matches this version.
621
+ - **🔤 Primary Font Styling**: Updated primary font to Archivo for better visual consistency.
622
+ - **🔄 Font Change for Windows**: Replaced Arimo with Inter font for Windows users, improving readability.
623
+ - **🚀 Lazy Loading**: Implemented lazy loading for 'faster_whisper' and 'sentence_transformers' to reduce startup memory usage.
624
+ - **📋 Task Generation Payload**: Task generations now include only the "task" field in the body instead of "title".
625
+
626
+ ## [0.3.7] - 2024-06-29
627
+
628
+ ### Added
629
+
630
+ - **🌐 Enhanced Internationalization (i18n)**: Newly introduced Indonesian translation, and updated translations for Turkish, Chinese, and Catalan languages to improve user accessibility.
631
+
632
+ ### Fixed
633
+
634
+ - **🕵️‍♂️ Browser Language Detection**: Corrected the issue where the application was not properly detecting and adapting to the browser's language settings.
635
+ - **🔐 OIDC Admin Role Assignment**: Fixed a bug where the admin role was not being assigned to the first user who signed up via OpenID Connect (OIDC).
636
+ - **💬 Chat/Completions Endpoint**: Resolved an issue where the chat/completions endpoint was non-functional when the stream option was set to False.
637
+ - **🚫 'WEBUI_AUTH' Configuration**: Addressed the problem where setting 'WEBUI_AUTH' to False was not being applied correctly.
638
+
639
+ ### Changed
640
+
641
+ - **📦 Dependency Update**: Upgraded 'authlib' from version 1.3.0 to 1.3.1 to ensure better security and performance enhancements.
642
+
643
+ ## [0.3.6] - 2024-06-27
644
+
645
+ ### Added
646
+
647
+ - **✨ "Functions" Feature**: You can now utilize "Functions" like filters (middleware) and pipe (model) functions directly within the WebUI. While largely compatible with Pipelines, these native functions can be executed easily within Open WebUI. Example use cases for filter functions include usage monitoring, real-time translation, moderation, and automemory. For pipe functions, the scope ranges from Cohere and Anthropic integration directly within Open WebUI, enabling "Valves" for per-user OpenAI API key usage, and much more. If you encounter issues, SAFE_MODE has been introduced.
648
+ - **📁 Files API**: Compatible with OpenAI, this feature allows for custom Retrieval-Augmented Generation (RAG) in conjunction with the Filter Function. More examples will be shared on our community platform and official documentation website.
649
+ - **🛠️ Tool Enhancements**: Tools now support citations and "Valves". Documentation will be available shortly.
650
+ - **🔗 Iframe Support via Files API**: Enables rendering HTML directly into your chat interface using functions and tools. Use cases include playing games like DOOM and Snake, displaying a weather applet, and implementing Anthropic "artifacts"-like features. Stay tuned for updates on our community platform and documentation.
651
+ - **🔒 Experimental OAuth Support**: New experimental OAuth support. Check our documentation for more details.
652
+ - **🖼️ Custom Background Support**: Set a custom background from Settings > Interface to personalize your experience.
653
+ - **🔑 AUTOMATIC1111_API_AUTH Support**: Enhanced security for the AUTOMATIC1111 API.
654
+ - **🎨 Code Highlight Optimization**: Improved code highlighting features.
655
+ - **🎙️ Voice Interruption Feature**: Reintroduced and now toggleable from Settings > Interface.
656
+ - **💤 Wakelock API**: Now in use to prevent screen dimming during important tasks.
657
+ - **🔐 API Key Privacy**: All API keys are now hidden by default for better security.
658
+ - **🔍 New Web Search Provider**: Added jina_search as a new option.
659
+ - **🌐 Enhanced Internationalization (i18n)**: Improved Korean translation and updated Chinese and Ukrainian translations.
660
+
661
+ ### Fixed
662
+
663
+ - **🔧 Conversation Mode Issue**: Fixed the issue where Conversation Mode remained active after being removed from settings.
664
+ - **📏 Scroll Button Obstruction**: Resolved the issue where the scrollToBottom button container obstructed clicks on buttons beneath it.
665
+
666
+ ### Changed
667
+
668
+ - **⏲️ AIOHTTP_CLIENT_TIMEOUT**: Now set to 'None' by default for improved configuration flexibility.
669
+ - **📞 Voice Call Enhancements**: Improved by skipping code blocks and expressions during calls.
670
+ - **🚫 Error Message Handling**: Disabled the continuation of operations with error messages.
671
+ - **🗂️ Playground Relocation**: Moved the Playground from the workspace to the user menu for better user experience.
672
+
673
+ ## [0.3.5] - 2024-06-16
674
+
675
+ ### Added
676
+
677
+ - **📞 Enhanced Voice Call**: Text-to-speech (TTS) callback now operates in real-time for each sentence, reducing latency by not waiting for full completion.
678
+ - **👆 Tap to Interrupt**: During a call, you can now stop the assistant from speaking by simply tapping, instead of using voice. This resolves the issue of the speaker's voice being mistakenly registered as input.
679
+ - **😊 Emoji Call**: Toggle this feature on from the Settings > Interface, allowing LLMs to express emotions using emojis during voice calls for a more dynamic interaction.
680
+ - **🖱️ Quick Archive/Delete**: Use the Shift key + mouseover on the chat list to swiftly archive or delete items.
681
+ - **📝 Markdown Support in Model Descriptions**: You can now format model descriptions with markdown, enabling bold text, links, etc.
682
+ - **🧠 Editable Memories**: Adds the capability to modify memories.
683
+ - **📋 Admin Panel Sorting**: Introduces the ability to sort users/chats within the admin panel.
684
+ - **🌑 Dark Mode for Quick Selectors**: Dark mode now available for chat quick selectors (prompts, models, documents).
685
+ - **🔧 Advanced Parameters**: Adds 'num_keep' and 'num_batch' to advanced parameters for customization.
686
+ - **📅 Dynamic System Prompts**: New variables '{{CURRENT_DATETIME}}', '{{CURRENT_TIME}}', '{{USER_LOCATION}}' added for system prompts. Ensure '{{USER_LOCATION}}' is toggled on from Settings > Interface.
687
+ - **🌐 Tavily Web Search**: Includes Tavily as a web search provider option.
688
+ - **🖊️ Federated Auth Usernames**: Ability to set user names for federated authentication.
689
+ - **🔗 Auto Clean URLs**: When adding connection URLs, trailing slashes are now automatically removed.
690
+ - **🌐 Enhanced Translations**: Improved Chinese and Swedish translations.
691
+
692
+ ### Fixed
693
+
694
+ - **⏳ AIOHTTP_CLIENT_TIMEOUT**: Introduced a new environment variable 'AIOHTTP_CLIENT_TIMEOUT' for requests to Ollama lasting longer than 5 minutes. Default is 300 seconds; set to blank ('') for no timeout.
695
+ - **❌ Message Delete Freeze**: Resolved an issue where message deletion would sometimes cause the web UI to freeze.
696
+
697
+ ## [0.3.4] - 2024-06-12
698
+
699
+ ### Fixed
700
+
701
+ - **🔒 Mixed Content with HTTPS Issue**: Resolved a problem where mixed content (HTTP and HTTPS) was causing security warnings and blocking resources on HTTPS sites.
702
+ - **🔍 Web Search Issue**: Addressed the problem where web search functionality was not working correctly. The 'ENABLE_RAG_LOCAL_WEB_FETCH' option has been reintroduced to restore proper web searching capabilities.
703
+ - **💾 RAG Template Not Being Saved**: Fixed an issue where the RAG template was not being saved correctly, ensuring your custom templates are now preserved as expected.
704
+
705
+ ## [0.3.3] - 2024-06-12
706
+
707
+ ### Added
708
+
709
+ - **🛠️ Native Python Function Calling**: Introducing native Python function calling within Open WebUI. We’ve also included a built-in code editor to seamlessly develop and integrate function code within the 'Tools' workspace. With this, you can significantly enhance your LLM’s capabilities by creating custom RAG pipelines, web search tools, and even agent-like features such as sending Discord messages.
710
+ - **🌐 DuckDuckGo Integration**: Added DuckDuckGo as a web search provider, giving you more search options.
711
+ - **🌏 Enhanced Translations**: Improved translations for Vietnamese and Chinese languages, making the interface more accessible.
712
+
713
+ ### Fixed
714
+
715
+ - **🔗 Web Search URL Error Handling**: Fixed the issue where a single URL error would disrupt the data loading process in Web Search mode. Now, such errors will be handled gracefully to ensure uninterrupted data loading.
716
+ - **🖥️ Frontend Responsiveness**: Resolved the problem where the frontend would stop responding if the backend encounters an error while downloading a model. Improved error handling to maintain frontend stability.
717
+ - **🔧 Dependency Issues in pip**: Fixed issues related to pip installations, ensuring all dependencies are correctly managed to prevent installation errors.
718
+
719
+ ## [0.3.2] - 2024-06-10
720
+
721
+ ### Added
722
+
723
+ - **🔍 Web Search Query Status**: The web search query will now persist in the results section to aid in easier debugging and tracking of search queries.
724
+ - **🌐 New Web Search Provider**: We have added Serply as a new option for web search providers, giving you more choices for your search needs.
725
+ - **🌏 Improved Translations**: We've enhanced translations for Chinese and Portuguese.
726
+
727
+ ### Fixed
728
+
729
+ - **🎤 Audio File Upload Issue**: The bug that prevented audio files from being uploaded in chat input has been fixed, ensuring smooth communication.
730
+ - **💬 Message Input Handling**: Improved the handling of message inputs by instantly clearing images and text after sending, along with immediate visual indications when a response message is loading, enhancing user feedback.
731
+ - **⚙️ Parameter Registration and Validation**: Fixed the issue where parameters were not registering in certain cases and addressed the problem where users were unable to save due to invalid input errors.
732
+
733
+ ## [0.3.1] - 2024-06-09
734
+
735
+ ### Fixed
736
+
737
+ - **💬 Chat Functionality**: Resolved the issue where chat functionality was not working for specific models.
738
+
739
+ ## [0.3.0] - 2024-06-09
740
+
741
+ ### Added
742
+
743
+ - **📚 Knowledge Support for Models**: Attach documents directly to models from the models workspace, enhancing the information available to each model.
744
+ - **🎙️ Hands-Free Voice Call Feature**: Initiate voice calls without needing to use your hands, making interactions more seamless.
745
+ - **📹 Video Call Feature**: Enable video calls with supported vision models like Llava and GPT-4o, adding a visual dimension to your communications.
746
+ - **🎛️ Enhanced UI for Voice Recording**: Improved user interface for the voice recording feature, making it more intuitive and user-friendly.
747
+ - **🌐 External STT Support**: Now support for external Speech-To-Text services, providing more flexibility in choosing your STT provider.
748
+ - **⚙️ Unified Settings**: Consolidated settings including document settings under a new admin settings section for easier management.
749
+ - **🌑 Dark Mode Splash Screen**: A new splash screen for dark mode, ensuring a consistent and visually appealing experience for dark mode users.
750
+ - **📥 Upload Pipeline**: Directly upload pipelines from the admin settings > pipelines section, streamlining the pipeline management process.
751
+ - **🌍 Improved Language Support**: Enhanced support for Chinese and Ukrainian languages, better catering to a global user base.
752
+
753
+ ### Fixed
754
+
755
+ - **🛠️ Playground Issue**: Fixed the playground not functioning properly, ensuring a smoother user experience.
756
+ - **🔥 Temperature Parameter Issue**: Corrected the issue where the temperature value '0' was not being passed correctly.
757
+ - **📝 Prompt Input Clearing**: Resolved prompt input textarea not being cleared right away, ensuring a clean slate for new inputs.
758
+ - **✨ Various UI Styling Issues**: Fixed numerous user interface styling problems for a more cohesive look.
759
+ - **👥 Active Users Display**: Fixed active users showing active sessions instead of actual users, now reflecting accurate user activity.
760
+ - **🌐 Community Platform Compatibility**: The Community Platform is back online and fully compatible with Open WebUI.
761
+
762
+ ### Changed
763
+
764
+ - **📝 RAG Implementation**: Updated the RAG (Retrieval-Augmented Generation) implementation to use a system prompt for context, instead of overriding the user's prompt.
765
+ - **🔄 Settings Relocation**: Moved Models, Connections, Audio, and Images settings to the admin settings for better organization.
766
+ - **✍️ Improved Title Generation**: Enhanced the default prompt for title generation, yielding better results.
767
+ - **🔧 Backend Task Management**: Tasks like title generation and search query generation are now managed on the backend side and controlled only by the admin.
768
+ - **🔍 Editable Search Query Prompt**: You can now edit the search query generation prompt, offering more control over how queries are generated.
769
+ - **📏 Prompt Length Threshold**: Set the prompt length threshold for search query generation from the admin settings, giving more customization options.
770
+ - **📣 Settings Consolidation**: Merged the Banners admin setting with the Interface admin setting for a more streamlined settings area.
771
+
772
+ ## [0.2.5] - 2024-06-05
773
+
774
+ ### Added
775
+
776
+ - **👥 Active Users Indicator**: Now you can see how many people are currently active and what they are running. This helps you gauge when performance might slow down due to a high number of users.
777
+ - **🗂️ Create Ollama Modelfile**: The option to create a modelfile for Ollama has been reintroduced in the Settings > Models section, making it easier to manage your models.
778
+ - **⚙️ Default Model Setting**: Added an option to set the default model from Settings > Interface. This feature is now easily accessible, especially convenient for mobile users as it was previously hidden.
779
+ - **🌐 Enhanced Translations**: We've improved the Chinese translations and added support for Turkmen and Norwegian languages to make the interface more accessible globally.
780
+
781
+ ### Fixed
782
+
783
+ - **📱 Mobile View Improvements**: The UI now uses dvh (dynamic viewport height) instead of vh (viewport height), providing a better and more responsive experience for mobile users.
784
+
785
+ ## [0.2.4] - 2024-06-03
786
+
787
+ ### Added
788
+
789
+ - **👤 Improved Account Pending Page**: The account pending page now displays admin details by default to avoid confusion. You can disable this feature in the admin settings if needed.
790
+ - **🌐 HTTP Proxy Support**: We have enabled the use of the 'http_proxy' environment variable in OpenAI and Ollama API calls, making it easier to configure network settings.
791
+ - **❓ Quick Access to Documentation**: You can now easily access Open WebUI documents via a question mark button located at the bottom right corner of the screen (available on larger screens like PCs).
792
+ - **🌍 Enhanced Translation**: Improvements have been made to translations.
793
+
794
+ ### Fixed
795
+
796
+ - **🔍 SearxNG Web Search**: Fixed the issue where the SearxNG web search functionality was not working properly.
797
+
798
+ ## [0.2.3] - 2024-06-03
799
+
800
+ ### Added
801
+
802
+ - **📁 Export Chat as JSON**: You can now export individual chats as JSON files from the navbar menu by navigating to 'Download > Export Chat'. This makes sharing specific conversations easier.
803
+ - **✏️ Edit Titles with Double Click**: Double-click on titles to rename them quickly and efficiently.
804
+ - **🧩 Batch Multiple Embeddings**: Introduced 'RAG_EMBEDDING_OPENAI_BATCH_SIZE' to process multiple embeddings in a batch, enhancing performance for large datasets.
805
+ - **🌍 Improved Translations**: Enhanced the translation quality across various languages for a better user experience.
806
+
807
+ ### Fixed
808
+
809
+ - **🛠️ Modelfile Migration Script**: Fixed an issue where the modelfile migration script would fail if an invalid modelfile was encountered.
810
+ - **💬 Zhuyin Input Method on Mac**: Resolved an issue where using the Zhuyin input method in the Web UI on a Mac caused text to send immediately upon pressing the enter key, leading to incorrect input.
811
+ - **🔊 Local TTS Voice Selection**: Fixed the issue where the selected local Text-to-Speech (TTS) voice was not being displayed in settings.
812
+
813
+ ## [0.2.2] - 2024-06-02
814
+
815
+ ### Added
816
+
817
+ - **🌊 Mermaid Rendering Support**: We've included support for Mermaid rendering. This allows you to create beautiful diagrams and flowcharts directly within Open WebUI.
818
+ - **🔄 New Environment Variable 'RESET_CONFIG_ON_START'**: Introducing a new environment variable: 'RESET_CONFIG_ON_START'. Set this variable to reset your configuration settings upon starting the application, making it easier to revert to default settings.
819
+
820
+ ### Fixed
821
+
822
+ - **🔧 Pipelines Filter Issue**: We've addressed an issue with the pipelines where filters were not functioning as expected.
823
+
824
+ ## [0.2.1] - 2024-06-02
825
+
826
+ ### Added
827
+
828
+ - **🖱️ Single Model Export Button**: Easily export models with just one click using the new single model export button.
829
+ - **🖥️ Advanced Parameters Support**: Added support for 'num_thread', 'use_mmap', and 'use_mlock' parameters for Ollama.
830
+ - **🌐 Improved Vietnamese Translation**: Enhanced Vietnamese language support for a better user experience for our Vietnamese-speaking community.
831
+
832
+ ### Fixed
833
+
834
+ - **🔧 OpenAI URL API Save Issue**: Corrected a problem preventing the saving of OpenAI URL API settings.
835
+ - **🚫 Display Issue with Disabled Ollama API**: Fixed the display bug causing models to appear in settings when the Ollama API was disabled.
836
+
837
+ ### Changed
838
+
839
+ - **💡 Versioning Update**: As a reminder from our previous update, version 0.2.y will focus primarily on bug fixes, while major updates will be designated as 0.x from now on for better version tracking.
840
+
841
+ ## [0.2.0] - 2024-06-01
842
+
843
+ ### Added
844
+
845
+ - **🔧 Pipelines Support**: Open WebUI now includes a plugin framework for enhanced customization and functionality (https://github.com/open-webui/pipelines). Easily add custom logic and integrate Python libraries, from AI agents to home automation APIs.
846
+ - **🔗 Function Calling via Pipelines**: Integrate function calling seamlessly through Pipelines.
847
+ - **⚖️ User Rate Limiting via Pipelines**: Implement user-specific rate limits to manage API usage efficiently.
848
+ - **📊 Usage Monitoring with Langfuse**: Track and analyze usage statistics with Langfuse integration through Pipelines.
849
+ - **🕒 Conversation Turn Limits**: Set limits on conversation turns to manage interactions better through Pipelines.
850
+ - **🛡️ Toxic Message Filtering**: Automatically filter out toxic messages to maintain a safe environment using Pipelines.
851
+ - **🔍 Web Search Support**: Introducing built-in web search capabilities via RAG API, allowing users to search using SearXNG, Google Programmatic Search Engine, Brave Search, serpstack, and serper. Activate it effortlessly by adding necessary variables from Document settings > Web Params.
852
+ - **🗂️ Models Workspace**: Create and manage model presets for both Ollama/OpenAI API. Note: The old Modelfiles workspace is deprecated.
853
+ - **🛠️ Model Builder Feature**: Build and edit all models with persistent builder mode.
854
+ - **🏷️ Model Tagging Support**: Organize models with tagging features in the models workspace.
855
+ - **📋 Model Ordering Support**: Effortlessly organize models by dragging and dropping them into the desired positions within the models workspace.
856
+ - **📈 OpenAI Generation Stats**: Access detailed generation statistics for OpenAI models.
857
+ - **📅 System Prompt Variables**: New variables added: '{{CURRENT_DATE}}' and '{{USER_NAME}}' for dynamic prompts.
858
+ - **📢 Global Banner Support**: Manage global banners from admin settings > banners.
859
+ - **🗃️ Enhanced Archived Chats Modal**: Search and export archived chats easily.
860
+ - **📂 Archive All Button**: Quickly archive all chats from settings > chats.
861
+ - **🌐 Improved Translations**: Added and improved translations for French, Croatian, Cebuano, and Vietnamese.
862
+
863
+ ### Fixed
864
+
865
+ - **🔍 Archived Chats Visibility**: Resolved issue with archived chats not showing in the admin panel.
866
+ - **💬 Message Styling**: Fixed styling issues affecting message appearance.
867
+ - **🔗 Shared Chat Responses**: Corrected the issue where shared chat response messages were not readonly.
868
+ - **🖥️ UI Enhancement**: Fixed the scrollbar overlapping issue with the message box in the user interface.
869
+
870
+ ### Changed
871
+
872
+ - **💾 User Settings Storage**: User settings are now saved on the backend, ensuring consistency across all devices.
873
+ - **📡 Unified API Requests**: The API request for getting models is now unified to '/api/models' for easier usage.
874
+ - **🔄 Versioning Update**: Our versioning will now follow the format 0.x for major updates and 0.x.y for patches.
875
+ - **📦 Export All Chats (All Users)**: Moved this functionality to the Admin Panel settings for better organization and accessibility.
876
+
877
+ ### Removed
878
+
879
+ - **🚫 Bundled LiteLLM Support Deprecated**: Migrate your LiteLLM config.yaml to a self-hosted LiteLLM instance. LiteLLM can still be added via OpenAI Connections. Download the LiteLLM config.yaml from admin settings > database > export LiteLLM config.yaml.
880
+
881
+ ## [0.1.125] - 2024-05-19
882
+
883
+ ### Added
884
+
885
+ - **🔄 Updated UI**: Chat interface revamped with chat bubbles. Easily switch back to the old style via settings > interface > chat bubble UI.
886
+ - **📂 Enhanced Sidebar UI**: Model files, documents, prompts, and playground merged into Workspace for streamlined access.
887
+ - **🚀 Improved Many Model Interaction**: All responses now displayed simultaneously for a smoother experience.
888
+ - **🐍 Python Code Execution**: Execute Python code locally in the browser with libraries like 'requests', 'beautifulsoup4', 'numpy', 'pandas', 'seaborn', 'matplotlib', 'scikit-learn', 'scipy', 'regex'.
889
+ - **🧠 Experimental Memory Feature**: Manually input personal information you want LLMs to remember via settings > personalization > memory.
890
+ - **💾 Persistent Settings**: Settings now saved as config.json for convenience.
891
+ - **🩺 Health Check Endpoint**: Added for Docker deployment.
892
+ - **↕️ RTL Support**: Toggle chat direction via settings > interface > chat direction.
893
+ - **🖥️ PowerPoint Support**: RAG pipeline now supports PowerPoint documents.
894
+ - **🌐 Language Updates**: Ukrainian, Turkish, Arabic, Chinese, Serbian, Vietnamese updated; Punjabi added.
895
+
896
+ ### Changed
897
+
898
+ - **👤 Shared Chat Update**: Shared chat now includes creator user information.
899
+
900
+ ## [0.1.124] - 2024-05-08
901
+
902
+ ### Added
903
+
904
+ - **🖼️ Improved Chat Sidebar**: Now conveniently displays time ranges and organizes chats by today, yesterday, and more.
905
+ - **📜 Citations in RAG Feature**: Easily track the context fed to the LLM with added citations in the RAG feature.
906
+ - **🔒 Auth Disable Option**: Introducing the ability to disable authentication. Set 'WEBUI_AUTH' to False to disable authentication. Note: Only applicable for fresh installations without existing users.
907
+ - **📹 Enhanced YouTube RAG Pipeline**: Now supports non-English videos for an enriched experience.
908
+ - **🔊 Specify OpenAI TTS Models**: Customize your TTS experience by specifying OpenAI TTS models.
909
+ - **🔧 Additional Environment Variables**: Discover more environment variables in our comprehensive documentation at Open WebUI Documentation (https://docs.openwebui.com).
910
+ - **🌐 Language Support**: Arabic, Finnish, and Hindi added; Improved support for German, Vietnamese, and Chinese.
911
+
912
+ ### Fixed
913
+
914
+ - **🛠️ Model Selector Styling**: Addressed styling issues for improved user experience.
915
+ - **⚠️ Warning Messages**: Resolved backend warning messages.
916
+
917
+ ### Changed
918
+
919
+ - **📝 Title Generation**: Limited output to 50 tokens.
920
+ - **📦 Helm Charts**: Removed Helm charts, now available in a separate repository (https://github.com/open-webui/helm-charts).
921
+
922
+ ## [0.1.123] - 2024-05-02
923
+
924
+ ### Added
925
+
926
+ - **🎨 New Landing Page Design**: Refreshed design for a more modern look and optimized use of screen space.
927
+ - **📹 Youtube RAG Pipeline**: Introduces dedicated RAG pipeline for Youtube videos, enabling interaction with video transcriptions directly.
928
+ - **🔧 Enhanced Admin Panel**: Streamlined user management with options to add users directly or in bulk via CSV import.
929
+ - **👥 '@' Model Integration**: Easily switch to specific models during conversations; old collaborative chat feature phased out.
930
+ - **🌐 Language Enhancements**: Swedish translation added, plus improvements to German, Spanish, and the addition of Doge translation.
931
+
932
+ ### Fixed
933
+
934
+ - **🗑️ Delete Chat Shortcut**: Addressed issue where shortcut wasn't functioning.
935
+ - **🖼️ Modal Closing Bug**: Resolved unexpected closure of modal when dragging from within.
936
+ - **✏️ Edit Button Styling**: Fixed styling inconsistency with edit buttons.
937
+ - **🌐 Image Generation Compatibility Issue**: Rectified image generation compatibility issue with third-party APIs.
938
+ - **📱 iOS PWA Icon Fix**: Corrected iOS PWA home screen icon shape.
939
+ - **🔍 Scroll Gesture Bug**: Adjusted gesture sensitivity to prevent accidental activation when scrolling through code on mobile; now requires scrolling from the leftmost side to open the sidebar.
940
+
941
+ ### Changed
942
+
943
+ - **🔄 Unlimited Context Length**: Advanced settings now allow unlimited max context length (previously limited to 16000).
944
+ - **👑 Super Admin Assignment**: The first signup is automatically assigned a super admin role, unchangeable by other admins.
945
+ - **🛡️ Admin User Restrictions**: User action buttons from the admin panel are now disabled for users with admin roles.
946
+ - **🔝 Default Model Selector**: Set as default model option now exclusively available on the landing page.
947
+
948
+ ## [0.1.122] - 2024-04-27
949
+
950
+ ### Added
951
+
952
+ - **🌟 Enhanced RAG Pipeline**: Now with hybrid searching via 'BM25', reranking powered by 'CrossEncoder', and configurable relevance score thresholds.
953
+ - **🛢️ External Database Support**: Seamlessly connect to custom SQLite or Postgres databases using the 'DATABASE_URL' environment variable.
954
+ - **🌐 Remote ChromaDB Support**: Introducing the capability to connect to remote ChromaDB servers.
955
+ - **👨‍💼 Improved Admin Panel**: Admins can now conveniently check users' chat lists and last active status directly from the admin panel.
956
+ - **🎨 Splash Screen**: Introducing a loading splash screen for a smoother user experience.
957
+ - **🌍 Language Support Expansion**: Added support for Bangla (bn-BD), along with enhancements to Chinese, Spanish, and Ukrainian translations.
958
+ - **💻 Improved LaTeX Rendering Performance**: Enjoy faster rendering times for LaTeX equations.
959
+ - **🔧 More Environment Variables**: Explore additional environment variables in our documentation (https://docs.openwebui.com), including the 'ENABLE_LITELLM' option to manage memory usage.
960
+
961
+ ### Fixed
962
+
963
+ - **🔧 Ollama Compatibility**: Resolved errors occurring when Ollama server version isn't an integer, such as SHA builds or RCs.
964
+ - **🐛 Various OpenAI API Issues**: Addressed several issues related to the OpenAI API.
965
+ - **🛑 Stop Sequence Issue**: Fixed the problem where the stop sequence with a backslash '\' was not functioning.
966
+ - **🔤 Font Fallback**: Corrected font fallback issue.
967
+
968
+ ### Changed
969
+
970
+ - **⌨️ Prompt Input Behavior on Mobile**: Enter key prompt submission disabled on mobile devices for improved user experience.
971
+
972
+ ## [0.1.121] - 2024-04-24
973
+
974
+ ### Fixed
975
+
976
+ - **🔧 Translation Issues**: Addressed various translation discrepancies.
977
+ - **🔒 LiteLLM Security Fix**: Updated LiteLLM version to resolve a security vulnerability.
978
+ - **🖥️ HTML Tag Display**: Rectified the issue where the '< br >' tag wasn't displaying correctly.
979
+ - **🔗 WebSocket Connection**: Resolved the failure of WebSocket connection under HTTPS security for ComfyUI server.
980
+ - **📜 FileReader Optimization**: Implemented FileReader initialization per image in multi-file drag & drop to ensure reusability.
981
+ - **🏷️ Tag Display**: Corrected tag display inconsistencies.
982
+ - **📦 Archived Chat Styling**: Fixed styling issues in archived chat.
983
+ - **🔖 Safari Copy Button Bug**: Addressed the bug where the copy button failed to copy links in Safari.
984
+
985
+ ## [0.1.120] - 2024-04-20
986
+
987
+ ### Added
988
+
989
+ - **📦 Archive Chat Feature**: Easily archive chats with a new sidebar button, and access archived chats via the profile button > archived chats.
990
+ - **🔊 Configurable Text-to-Speech Endpoint**: Customize your Text-to-Speech experience with configurable OpenAI endpoints.
991
+ - **🛠️ Improved Error Handling**: Enhanced error message handling for connection failures.
992
+ - **⌨️ Enhanced Shortcut**: When editing messages, use ctrl/cmd+enter to save and submit, and esc to close.
993
+ - **🌐 Language Support**: Added support for Georgian and enhanced translations for Portuguese and Vietnamese.
994
+
995
+ ### Fixed
996
+
997
+ - **🔧 Model Selector**: Resolved issue where default model selection was not saving.
998
+ - **🔗 Share Link Copy Button**: Fixed bug where the copy button wasn't copying links in Safari.
999
+ - **🎨 Light Theme Styling**: Addressed styling issue with the light theme.
1000
+
1001
+ ## [0.1.119] - 2024-04-16
1002
+
1003
+ ### Added
1004
+
1005
+ - **🌟 Enhanced RAG Embedding Support**: Ollama, and OpenAI models can now be used for RAG embedding model.
1006
+ - **🔄 Seamless Integration**: Copy 'ollama run <model name>' directly from Ollama page to easily select and pull models.
1007
+ - **🏷️ Tagging Feature**: Add tags to chats directly via the sidebar chat menu.
1008
+ - **📱 Mobile Accessibility**: Swipe left and right on mobile to effortlessly open and close the sidebar.
1009
+ - **🔍 Improved Navigation**: Admin panel now supports pagination for user list.
1010
+ - **🌍 Additional Language Support**: Added Polish language support.
1011
+
1012
+ ### Fixed
1013
+
1014
+ - **🌍 Language Enhancements**: Vietnamese and Spanish translations have been improved.
1015
+ - **🔧 Helm Fixes**: Resolved issues with Helm trailing slash and manifest.json.
1016
+
1017
+ ### Changed
1018
+
1019
+ - **🐳 Docker Optimization**: Updated docker image build process to utilize 'uv' for significantly faster builds compared to 'pip3'.
1020
+
1021
+ ## [0.1.118] - 2024-04-10
1022
+
1023
+ ### Added
1024
+
1025
+ - **🦙 Ollama and CUDA Images**: Added support for ':ollama' and ':cuda' tagged images.
1026
+ - **👍 Enhanced Response Rating**: Now you can annotate your ratings for better feedback.
1027
+ - **👤 User Initials Profile Photo**: User initials are now the default profile photo.
1028
+ - **🔍 Update RAG Embedding Model**: Customize RAG embedding model directly in document settings.
1029
+ - **🌍 Additional Language Support**: Added Turkish language support.
1030
+
1031
+ ### Fixed
1032
+
1033
+ - **🔒 Share Chat Permission**: Resolved issue with chat sharing permissions.
1034
+ - **🛠 Modal Close**: Modals can now be closed using the Esc key.
1035
+
1036
+ ### Changed
1037
+
1038
+ - **🎨 Admin Panel Styling**: Refreshed styling for the admin panel.
1039
+ - **🐳 Docker Image Build**: Updated docker image build process for improved efficiency.
1040
+
1041
+ ## [0.1.117] - 2024-04-03
1042
+
1043
+ ### Added
1044
+
1045
+ - 🗨️ **Local Chat Sharing**: Share chat links seamlessly between users.
1046
+ - 🔑 **API Key Generation Support**: Generate secret keys to leverage Open WebUI with OpenAI libraries.
1047
+ - 📄 **Chat Download as PDF**: Easily download chats in PDF format.
1048
+ - 📝 **Improved Logging**: Enhancements to logging functionality.
1049
+ - 📧 **Trusted Email Authentication**: Authenticate using a trusted email header.
1050
+
1051
+ ### Fixed
1052
+
1053
+ - 🌷 **Enhanced Dutch Translation**: Improved translation for Dutch users.
1054
+ - ⚪ **White Theme Styling**: Resolved styling issue with the white theme.
1055
+ - 📜 **LaTeX Chat Screen Overflow**: Fixed screen overflow issue with LaTeX rendering.
1056
+ - 🔒 **Security Patches**: Applied necessary security patches.
1057
+
1058
+ ## [0.1.116] - 2024-03-31
1059
+
1060
+ ### Added
1061
+
1062
+ - **🔄 Enhanced UI**: Model selector now conveniently located in the navbar, enabling seamless switching between multiple models during conversations.
1063
+ - **🔍 Improved Model Selector**: Directly pull a model from the selector/Models now display detailed information for better understanding.
1064
+ - **💬 Webhook Support**: Now compatible with Google Chat and Microsoft Teams.
1065
+ - **🌐 Localization**: Korean translation (I18n) now available.
1066
+ - **🌑 Dark Theme**: OLED dark theme introduced for reduced strain during prolonged usage.
1067
+ - **🏷️ Tag Autocomplete**: Dropdown feature added for effortless chat tagging.
1068
+
1069
+ ### Fixed
1070
+
1071
+ - **🔽 Auto-Scrolling**: Addressed OpenAI auto-scrolling issue.
1072
+ - **🏷️ Tag Validation**: Implemented tag validation to prevent empty string tags.
1073
+ - **🚫 Model Whitelisting**: Resolved LiteLLM model whitelisting issue.
1074
+ - **✅ Spelling**: Corrected various spelling issues for improved readability.
1075
+
1076
+ ## [0.1.115] - 2024-03-24
1077
+
1078
+ ### Added
1079
+
1080
+ - **🔍 Custom Model Selector**: Easily find and select custom models with the new search filter feature.
1081
+ - **🛑 Cancel Model Download**: Added the ability to cancel model downloads.
1082
+ - **🎨 Image Generation ComfyUI**: Image generation now supports ComfyUI.
1083
+ - **🌟 Updated Light Theme**: Updated the light theme for a fresh look.
1084
+ - **🌍 Additional Language Support**: Now supporting Bulgarian, Italian, Portuguese, Japanese, and Dutch.
1085
+
1086
+ ### Fixed
1087
+
1088
+ - **🔧 Fixed Broken Experimental GGUF Upload**: Resolved issues with experimental GGUF upload functionality.
1089
+
1090
+ ### Changed
1091
+
1092
+ - **🔄 Vector Storage Reset Button**: Moved the reset vector storage button to document settings.
1093
+
1094
+ ## [0.1.114] - 2024-03-20
1095
+
1096
+ ### Added
1097
+
1098
+ - **🔗 Webhook Integration**: Now you can subscribe to new user sign-up events via webhook. Simply navigate to the admin panel > admin settings > webhook URL.
1099
+ - **🛡️ Enhanced Model Filtering**: Alongside Ollama, OpenAI proxy model whitelisting, we've added model filtering functionality for LiteLLM proxy.
1100
+ - **🌍 Expanded Language Support**: Spanish, Catalan, and Vietnamese languages are now available, with improvements made to others.
1101
+
1102
+ ### Fixed
1103
+
1104
+ - **🔧 Input Field Spelling**: Resolved issue with spelling mistakes in input fields.
1105
+ - **🖊️ Light Mode Styling**: Fixed styling issue with light mode in document adding.
1106
+
1107
+ ### Changed
1108
+
1109
+ - **🔄 Language Sorting**: Languages are now sorted alphabetically by their code for improved organization.
1110
+
1111
+ ## [0.1.113] - 2024-03-18
1112
+
1113
+ ### Added
1114
+
1115
+ - 🌍 **Localization**: You can now change the UI language in Settings > General. We support Ukrainian, German, Farsi (Persian), Traditional and Simplified Chinese and French translations. You can help us to translate the UI into your language! More info in our [CONTRIBUTION.md](https://github.com/open-webui/open-webui/blob/main/docs/CONTRIBUTING.md#-translations-and-internationalization).
1116
+ - 🎨 **System-wide Theme**: Introducing a new system-wide theme for enhanced visual experience.
1117
+
1118
+ ### Fixed
1119
+
1120
+ - 🌑 **Dark Background on Select Fields**: Improved readability by adding a dark background to select fields, addressing issues on certain browsers/devices.
1121
+ - **Multiple OPENAI_API_BASE_URLS Issue**: Resolved issue where multiple base URLs caused conflicts when one wasn't functioning.
1122
+ - **RAG Encoding Issue**: Fixed encoding problem in RAG.
1123
+ - **npm Audit Fix**: Addressed npm audit findings.
1124
+ - **Reduced Scroll Threshold**: Improved auto-scroll experience by reducing the scroll threshold from 50px to 5px.
1125
+
1126
+ ### Changed
1127
+
1128
+ - 🔄 **Sidebar UI Update**: Updated sidebar UI to feature a chat menu dropdown, replacing two icons for improved navigation.
1129
+
1130
+ ## [0.1.112] - 2024-03-15
1131
+
1132
+ ### Fixed
1133
+
1134
+ - 🗨️ Resolved chat malfunction after image generation.
1135
+ - 🎨 Fixed various RAG issues.
1136
+ - 🧪 Rectified experimental broken GGUF upload logic.
1137
+
1138
+ ## [0.1.111] - 2024-03-10
1139
+
1140
+ ### Added
1141
+
1142
+ - 🛡️ **Model Whitelisting**: Admins now have the ability to whitelist models for users with the 'user' role.
1143
+ - 🔄 **Update All Models**: Added a convenient button to update all models at once.
1144
+ - 📄 **Toggle PDF OCR**: Users can now toggle PDF OCR option for improved parsing performance.
1145
+ - 🎨 **DALL-E Integration**: Introduced DALL-E integration for image generation alongside automatic1111.
1146
+ - 🛠️ **RAG API Refactoring**: Refactored RAG logic and exposed its API, with additional documentation to follow.
1147
+
1148
+ ### Fixed
1149
+
1150
+ - 🔒 **Max Token Settings**: Added max token settings for anthropic/claude-3-sonnet-20240229 (Issue #1094).
1151
+ - 🔧 **Misalignment Issue**: Corrected misalignment of Edit and Delete Icons when Chat Title is Empty (Issue #1104).
1152
+ - 🔄 **Context Loss Fix**: Resolved RAG losing context on model response regeneration with Groq models via API key (Issue #1105).
1153
+ - 📁 **File Handling Bug**: Addressed File Not Found Notification when Dropping a Conversation Element (Issue #1098).
1154
+ - 🖱️ **Dragged File Styling**: Fixed dragged file layover styling issue.
1155
+
1156
+ ## [0.1.110] - 2024-03-06
1157
+
1158
+ ### Added
1159
+
1160
+ - **🌐 Multiple OpenAI Servers Support**: Enjoy seamless integration with multiple OpenAI-compatible APIs, now supported natively.
1161
+
1162
+ ### Fixed
1163
+
1164
+ - **🔍 OCR Issue**: Resolved PDF parsing issue caused by OCR malfunction.
1165
+ - **🚫 RAG Issue**: Fixed the RAG functionality, ensuring it operates smoothly.
1166
+ - **📄 "Add Docs" Model Button**: Addressed the non-functional behavior of the "Add Docs" model button.
1167
+
1168
+ ## [0.1.109] - 2024-03-06
1169
+
1170
+ ### Added
1171
+
1172
+ - **🔄 Multiple Ollama Servers Support**: Enjoy enhanced scalability and performance with support for multiple Ollama servers in a single WebUI. Load balancing features are now available, providing improved efficiency (#788, #278).
1173
+ - **🔧 Support for Claude 3 and Gemini**: Responding to user requests, we've expanded our toolset to include Claude 3 and Gemini, offering a wider range of functionalities within our platform (#1064).
1174
+ - **🔍 OCR Functionality for PDF Loader**: We've augmented our PDF loader with Optical Character Recognition (OCR) capabilities. Now, extract text from scanned documents and images within PDFs, broadening the scope of content processing (#1050).
1175
+
1176
+ ### Fixed
1177
+
1178
+ - **🛠️ RAG Collection**: Implemented a dynamic mechanism to recreate RAG collections, ensuring users have up-to-date and accurate data (#1031).
1179
+ - **📝 User Agent Headers**: Fixed issue of RAG web requests being sent with empty user_agent headers, reducing rejections from certain websites. Realistic headers are now utilized for these requests (#1024).
1180
+ - **⏹️ Playground Cancel Functionality**: Introducing a new "Cancel" option for stopping Ollama generation in the Playground, enhancing user control and usability (#1006).
1181
+ - **🔤 Typographical Error in 'ASSISTANT' Field**: Corrected a typographical error in the 'ASSISTANT' field within the GGUF model upload template for accuracy and consistency (#1061).
1182
+
1183
+ ### Changed
1184
+
1185
+ - **🔄 Refactored Message Deletion Logic**: Streamlined message deletion process for improved efficiency and user experience, simplifying interactions within the platform (#1004).
1186
+ - **⚠️ Deprecation of `OLLAMA_API_BASE_URL`**: Deprecated `OLLAMA_API_BASE_URL` environment variable; recommend using `OLLAMA_BASE_URL` instead. Refer to our documentation for further details.
1187
+
1188
+ ## [0.1.108] - 2024-03-02
1189
+
1190
+ ### Added
1191
+
1192
+ - **🎮 Playground Feature (Beta)**: Explore the full potential of the raw API through an intuitive UI with our new playground feature, accessible to admins. Simply click on the bottom name area of the sidebar to access it. The playground feature offers two modes text completion (notebook) and chat completion. As it's in beta, please report any issues you encounter.
1193
+ - **🛠️ Direct Database Download for Admins**: Admins can now download the database directly from the WebUI via the admin settings.
1194
+ - **🎨 Additional RAG Settings**: Customize your RAG process with the ability to edit the TOP K value. Navigate to Documents > Settings > General to make changes.
1195
+ - **🖥️ UI Improvements**: Tooltips now available in the input area and sidebar handle. More tooltips will be added across other parts of the UI.
1196
+
1197
+ ### Fixed
1198
+
1199
+ - Resolved input autofocus issue on mobile when the sidebar is open, making it easier to use.
1200
+ - Corrected numbered list display issue in Safari (#963).
1201
+ - Restricted user ability to delete chats without proper permissions (#993).
1202
+
1203
+ ### Changed
1204
+
1205
+ - **Simplified Ollama Settings**: Ollama settings now don't require the `/api` suffix. You can now utilize the Ollama base URL directly, e.g., `http://localhost:11434`. Also, an `OLLAMA_BASE_URL` environment variable has been added.
1206
+ - **Database Renaming**: Starting from this release, `ollama.db` will be automatically renamed to `webui.db`.
1207
+
1208
+ ## [0.1.107] - 2024-03-01
1209
+
1210
+ ### Added
1211
+
1212
+ - **🚀 Makefile and LLM Update Script**: Included Makefile and a script for LLM updates in the repository.
1213
+
1214
+ ### Fixed
1215
+
1216
+ - Corrected issue where links in the settings modal didn't appear clickable (#960).
1217
+ - Fixed problem with web UI port not taking effect due to incorrect environment variable name in run-compose.sh (#996).
1218
+ - Enhanced user experience by displaying chat in browser title and enabling automatic scrolling to the bottom (#992).
1219
+
1220
+ ### Changed
1221
+
1222
+ - Upgraded toast library from `svelte-french-toast` to `svelte-sonner` for a more polished UI.
1223
+ - Enhanced accessibility with the addition of dark mode on the authentication page.
1224
+
1225
+ ## [0.1.106] - 2024-02-27
1226
+
1227
+ ### Added
1228
+
1229
+ - **🎯 Auto-focus Feature**: The input area now automatically focuses when initiating or opening a chat conversation.
1230
+
1231
+ ### Fixed
1232
+
1233
+ - Corrected typo from "HuggingFace" to "Hugging Face" (Issue #924).
1234
+ - Resolved bug causing errors in chat completion API calls to OpenAI due to missing "num_ctx" parameter (Issue #927).
1235
+ - Fixed issues preventing text editing, selection, and cursor retention in the input field (Issue #940).
1236
+ - Fixed a bug where defining an OpenAI-compatible API server using 'OPENAI_API_BASE_URL' containing 'openai' string resulted in hiding models not containing 'gpt' string from the model menu. (Issue #930)
1237
+
1238
+ ## [0.1.105] - 2024-02-25
1239
+
1240
+ ### Added
1241
+
1242
+ - **📄 Document Selection**: Now you can select and delete multiple documents at once for easier management.
1243
+
1244
+ ### Changed
1245
+
1246
+ - **🏷️ Document Pre-tagging**: Simply click the "+" button at the top, enter tag names in the popup window, or select from a list of existing tags. Then, upload files with the added tags for streamlined organization.
1247
+
1248
+ ## [0.1.104] - 2024-02-25
1249
+
1250
+ ### Added
1251
+
1252
+ - **🔄 Check for Updates**: Keep your system current by checking for updates conveniently located in Settings > About.
1253
+ - **🗑️ Automatic Tag Deletion**: Unused tags on the sidebar will now be deleted automatically with just a click.
1254
+
1255
+ ### Changed
1256
+
1257
+ - **🎨 Modernized Styling**: Enjoy a refreshed look with updated styling for a more contemporary experience.
1258
+
1259
+ ## [0.1.103] - 2024-02-25
1260
+
1261
+ ### Added
1262
+
1263
+ - **🔗 Built-in LiteLLM Proxy**: Now includes LiteLLM proxy within Open WebUI for enhanced functionality.
1264
+
1265
+ - Easily integrate existing LiteLLM configurations using `-v /path/to/config.yaml:/app/backend/data/litellm/config.yaml` flag.
1266
+ - When utilizing Docker container to run Open WebUI, ensure connections to localhost use `host.docker.internal`.
1267
+
1268
+ - **🖼️ Image Generation Enhancements**: Introducing Advanced Settings with Image Preview Feature.
1269
+ - Customize image generation by setting the number of steps; defaults to A1111 value.
1270
+
1271
+ ### Fixed
1272
+
1273
+ - Resolved issue with RAG scan halting document loading upon encountering unsupported MIME types or exceptions (Issue #866).
1274
+
1275
+ ### Changed
1276
+
1277
+ - Ollama is no longer required to run Open WebUI.
1278
+ - Access our comprehensive documentation at [Open WebUI Documentation](https://docs.openwebui.com/).
1279
+
1280
+ ## [0.1.102] - 2024-02-22
1281
+
1282
+ ### Added
1283
+
1284
+ - **🖼️ Image Generation**: Generate Images using the AUTOMATIC1111/stable-diffusion-webui API. You can set this up in Settings > Images.
1285
+ - **📝 Change title generation prompt**: Change the prompt used to generate titles for your chats. You can set this up in the Settings > Interface.
1286
+ - **🤖 Change embedding model**: Change the embedding model used to generate embeddings for your chats in the Dockerfile. Use any sentence transformer model from huggingface.co.
1287
+ - **📢 CHANGELOG.md/Popup**: This popup will show you the latest changes.
1288
+
1289
+ ## [0.1.101] - 2024-02-22
1290
+
1291
+ ### Fixed
1292
+
1293
+ - LaTex output formatting issue (#828)
1294
+
1295
+ ### Changed
1296
+
1297
+ - Instead of having the previous 1.0.0-alpha.101, we switched to semantic versioning as a way to respect global conventions.
CODE_OF_CONDUCT.md ADDED
@@ -0,0 +1,77 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Contributor Covenant Code of Conduct
2
+
3
+ ## Our Pledge
4
+
5
+ We as members, contributors, and leaders pledge to make participation in our
6
+ community a harassment-free experience for everyone, regardless of age, body
7
+ size, visible or invisible disability, ethnicity, sex characteristics, gender
8
+ identity and expression, level of experience, education, socio-economic status,
9
+ nationality, personal appearance, race, religion, or sexual identity
10
+ and orientation.
11
+
12
+ We pledge to act and interact in ways that contribute to an open, welcoming, diverse, inclusive, and healthy community.
13
+
14
+ ## Our Standards
15
+
16
+ Examples of behavior that contribute to a positive environment for our community include:
17
+
18
+ - Demonstrating empathy and kindness toward other people
19
+ - Being respectful of differing opinions, viewpoints, and experiences
20
+ - Giving and gracefully accepting constructive feedback
21
+ - Accepting responsibility and apologizing to those affected by our mistakes, and learning from the experience
22
+ - Focusing on what is best not just for us as individuals, but for the overall community
23
+
24
+ Examples of unacceptable behavior include:
25
+
26
+ - The use of sexualized language or imagery, and sexual attention or advances of any kind
27
+ - Trolling, insulting or derogatory comments, and personal or political attacks
28
+ - Public or private harassment
29
+ - Publishing others' private information, such as a physical or email address, without their explicit permission
30
+ - **Spamming of any kind**
31
+ - Aggressive sales tactics targeting our community members are strictly prohibited. You can mention your product if it's relevant to the discussion, but under no circumstances should you push it forcefully
32
+ - Other conduct which could reasonably be considered inappropriate in a professional setting
33
+
34
+ ## Enforcement Responsibilities
35
+
36
+ Community leaders are responsible for clarifying and enforcing our standards of acceptable behavior and will take appropriate and fair corrective action in response to any behavior that they deem inappropriate, threatening, offensive, or harmful.
37
+
38
+ ## Scope
39
+
40
+ This Code of Conduct applies within all community spaces and also applies when an individual is officially representing the community in public spaces. Examples of representing our community include using an official e-mail address, posting via an official social media account, or acting as an appointed representative at an online or offline event.
41
+
42
+ ## Enforcement
43
+
44
+ Instances of abusive, harassing, spamming, or otherwise unacceptable behavior may be reported to the community leaders responsible for enforcement at [email protected]. All complaints will be reviewed and investigated promptly and fairly.
45
+
46
+ All community leaders are obligated to respect the privacy and security of the reporter of any incident.
47
+
48
+ ## Enforcement Guidelines
49
+
50
+ Community leaders will follow these Community Impact Guidelines in determining the consequences for any action they deem in violation of this Code of Conduct:
51
+
52
+ ### 1. Temporary Ban
53
+
54
+ **Community Impact**: Any violation of community standards, including but not limited to inappropriate language, unprofessional behavior, harassment, or spamming.
55
+
56
+ **Consequence**: A temporary ban from any sort of interaction or public communication with the community for a specified period of time. No public or private interaction with the people involved, including unsolicited interaction with those enforcing the Code of Conduct, is allowed during this period. Violating these terms may lead to a permanent ban.
57
+
58
+ ### 2. Permanent Ban
59
+
60
+ **Community Impact**: Repeated or severe violations of community standards, including sustained inappropriate behavior, harassment of an individual, or aggression toward or disparagement of classes of individuals.
61
+
62
+ **Consequence**: A permanent ban from any sort of public interaction within the community.
63
+
64
+ ## Attribution
65
+
66
+ This Code of Conduct is adapted from the [Contributor Covenant][homepage],
67
+ version 2.0, available at
68
+ https://www.contributor-covenant.org/version/2/0/code_of_conduct.html.
69
+
70
+ Community Impact Guidelines were inspired by [Mozilla's code of conduct
71
+ enforcement ladder](https://github.com/mozilla/diversity).
72
+
73
+ [homepage]: https://www.contributor-covenant.org
74
+
75
+ For answers to common questions about this code of conduct, see the FAQ at
76
+ https://www.contributor-covenant.org/faq. Translations are available at
77
+ https://www.contributor-covenant.org/translations.
Caddyfile.localhost ADDED
@@ -0,0 +1,64 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Run with
2
+ # caddy run --envfile ./example.env --config ./Caddyfile.localhost
3
+ #
4
+ # This is configured for
5
+ # - Automatic HTTPS (even for localhost)
6
+ # - Reverse Proxying to Ollama API Base URL (http://localhost:11434/api)
7
+ # - CORS
8
+ # - HTTP Basic Auth API Tokens (uncomment basicauth section)
9
+
10
+
11
+ # CORS Preflight (OPTIONS) + Request (GET, POST, PATCH, PUT, DELETE)
12
+ (cors-api) {
13
+ @match-cors-api-preflight method OPTIONS
14
+ handle @match-cors-api-preflight {
15
+ header {
16
+ Access-Control-Allow-Origin "{http.request.header.origin}"
17
+ Access-Control-Allow-Methods "GET, POST, PUT, PATCH, DELETE, OPTIONS"
18
+ Access-Control-Allow-Headers "Origin, Accept, Authorization, Content-Type, X-Requested-With"
19
+ Access-Control-Allow-Credentials "true"
20
+ Access-Control-Max-Age "3600"
21
+ defer
22
+ }
23
+ respond "" 204
24
+ }
25
+
26
+ @match-cors-api-request {
27
+ not {
28
+ header Origin "{http.request.scheme}://{http.request.host}"
29
+ }
30
+ header Origin "{http.request.header.origin}"
31
+ }
32
+ handle @match-cors-api-request {
33
+ header {
34
+ Access-Control-Allow-Origin "{http.request.header.origin}"
35
+ Access-Control-Allow-Methods "GET, POST, PUT, PATCH, DELETE, OPTIONS"
36
+ Access-Control-Allow-Headers "Origin, Accept, Authorization, Content-Type, X-Requested-With"
37
+ Access-Control-Allow-Credentials "true"
38
+ Access-Control-Max-Age "3600"
39
+ defer
40
+ }
41
+ }
42
+ }
43
+
44
+ # replace localhost with example.com or whatever
45
+ localhost {
46
+ ## HTTP Basic Auth
47
+ ## (uncomment to enable)
48
+ # basicauth {
49
+ # # see .example.env for how to generate tokens
50
+ # {env.OLLAMA_API_ID} {env.OLLAMA_API_TOKEN_DIGEST}
51
+ # }
52
+
53
+ handle /api/* {
54
+ # Comment to disable CORS
55
+ import cors-api
56
+
57
+ reverse_proxy localhost:11434
58
+ }
59
+
60
+ # Same-Origin Static Web Server
61
+ file_server {
62
+ root ./build/
63
+ }
64
+ }
Dockerfile ADDED
@@ -0,0 +1,176 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # syntax=docker/dockerfile:1
2
+ # Initialize device type args
3
+ # use build args in the docker build command with --build-arg="BUILDARG=true"
4
+ ARG USE_CUDA=false
5
+ ARG USE_OLLAMA=false
6
+ # Tested with cu117 for CUDA 11 and cu121 for CUDA 12 (default)
7
+ ARG USE_CUDA_VER=cu121
8
+ # any sentence transformer model; models to use can be found at https://huggingface.co/models?library=sentence-transformers
9
+ # Leaderboard: https://huggingface.co/spaces/mteb/leaderboard
10
+ # for better performance and multilangauge support use "intfloat/multilingual-e5-large" (~2.5GB) or "intfloat/multilingual-e5-base" (~1.5GB)
11
+ # IMPORTANT: If you change the embedding model (sentence-transformers/all-MiniLM-L6-v2) and vice versa, you aren't able to use RAG Chat with your previous documents loaded in the WebUI! You need to re-embed them.
12
+ ARG USE_EMBEDDING_MODEL=sentence-transformers/all-MiniLM-L6-v2
13
+ ARG USE_RERANKING_MODEL=""
14
+
15
+ # Tiktoken encoding name; models to use can be found at https://huggingface.co/models?library=tiktoken
16
+ ARG USE_TIKTOKEN_ENCODING_NAME="cl100k_base"
17
+
18
+ ARG BUILD_HASH=dev-build
19
+ # Override at your own risk - non-root configurations are untested
20
+ ARG UID=0
21
+ ARG GID=0
22
+
23
+ ######## WebUI frontend ########
24
+ FROM --platform=$BUILDPLATFORM node:22-alpine3.20 AS build
25
+ ARG BUILD_HASH
26
+
27
+ WORKDIR /app
28
+
29
+ COPY package.json package-lock.json ./
30
+ RUN npm ci
31
+
32
+ COPY . .
33
+ ENV APP_BUILD_HASH=${BUILD_HASH}
34
+ RUN npm run build
35
+
36
+ ######## WebUI backend ########
37
+ FROM python:3.11-slim-bookworm AS base
38
+
39
+ # Use args
40
+ ARG USE_CUDA
41
+ ARG USE_OLLAMA
42
+ ARG USE_CUDA_VER
43
+ ARG USE_EMBEDDING_MODEL
44
+ ARG USE_RERANKING_MODEL
45
+ ARG UID
46
+ ARG GID
47
+
48
+ ## Basis ##
49
+ ENV ENV=prod \
50
+ PORT=8080 \
51
+ # pass build args to the build
52
+ USE_OLLAMA_DOCKER=${USE_OLLAMA} \
53
+ USE_CUDA_DOCKER=${USE_CUDA} \
54
+ USE_CUDA_DOCKER_VER=${USE_CUDA_VER} \
55
+ USE_EMBEDDING_MODEL_DOCKER=${USE_EMBEDDING_MODEL} \
56
+ USE_RERANKING_MODEL_DOCKER=${USE_RERANKING_MODEL}
57
+
58
+ ## Basis URL Config ##
59
+ ENV OLLAMA_BASE_URL="/ollama" \
60
+ OPENAI_API_BASE_URL=""
61
+
62
+ ## API Key and Security Config ##
63
+ ENV OPENAI_API_KEY="" \
64
+ WEBUI_SECRET_KEY="" \
65
+ SCARF_NO_ANALYTICS=true \
66
+ DO_NOT_TRACK=true \
67
+ ANONYMIZED_TELEMETRY=false
68
+
69
+ #### Other models #########################################################
70
+ ## whisper TTS model settings ##
71
+ ENV WHISPER_MODEL="base" \
72
+ WHISPER_MODEL_DIR="/app/backend/data/cache/whisper/models"
73
+
74
+ ## RAG Embedding model settings ##
75
+ ENV RAG_EMBEDDING_MODEL="$USE_EMBEDDING_MODEL_DOCKER" \
76
+ RAG_RERANKING_MODEL="$USE_RERANKING_MODEL_DOCKER" \
77
+ SENTENCE_TRANSFORMERS_HOME="/app/backend/data/cache/embedding/models"
78
+
79
+ ## Tiktoken model settings ##
80
+ ENV TIKTOKEN_ENCODING_NAME="cl100k_base" \
81
+ TIKTOKEN_CACHE_DIR="/app/backend/data/cache/tiktoken"
82
+
83
+ ## Hugging Face download cache ##
84
+ ENV HF_HOME="/app/backend/data/cache/embedding/models"
85
+
86
+ ## Torch Extensions ##
87
+ # ENV TORCH_EXTENSIONS_DIR="/.cache/torch_extensions"
88
+
89
+ #### Other models ##########################################################
90
+
91
+ WORKDIR /app/backend
92
+
93
+ ENV HOME=/root
94
+ # Create user and group if not root
95
+ RUN if [ $UID -ne 0 ]; then \
96
+ if [ $GID -ne 0 ]; then \
97
+ addgroup --gid $GID app; \
98
+ fi; \
99
+ adduser --uid $UID --gid $GID --home $HOME --disabled-password --no-create-home app; \
100
+ fi
101
+
102
+ RUN mkdir -p $HOME/.cache/chroma
103
+ RUN echo -n 00000000-0000-0000-0000-000000000000 > $HOME/.cache/chroma/telemetry_user_id
104
+
105
+ # Make sure the user has access to the app and root directory
106
+ RUN chown -R $UID:$GID /app $HOME
107
+
108
+ RUN if [ "$USE_OLLAMA" = "true" ]; then \
109
+ apt-get update && \
110
+ # Install pandoc and netcat
111
+ apt-get install -y --no-install-recommends git build-essential pandoc netcat-openbsd curl && \
112
+ apt-get install -y --no-install-recommends gcc python3-dev && \
113
+ # for RAG OCR
114
+ apt-get install -y --no-install-recommends ffmpeg libsm6 libxext6 && \
115
+ # install helper tools
116
+ apt-get install -y --no-install-recommends curl jq && \
117
+ # install ollama
118
+ curl -fsSL https://ollama.com/install.sh | sh && \
119
+ # cleanup
120
+ rm -rf /var/lib/apt/lists/*; \
121
+ else \
122
+ apt-get update && \
123
+ # Install pandoc, netcat and gcc
124
+ apt-get install -y --no-install-recommends git build-essential pandoc gcc netcat-openbsd curl jq && \
125
+ apt-get install -y --no-install-recommends gcc python3-dev && \
126
+ # for RAG OCR
127
+ apt-get install -y --no-install-recommends ffmpeg libsm6 libxext6 && \
128
+ # cleanup
129
+ rm -rf /var/lib/apt/lists/*; \
130
+ fi
131
+
132
+ # install python dependencies
133
+ COPY --chown=$UID:$GID ./backend/requirements.txt ./requirements.txt
134
+
135
+ RUN pip3 install uv && \
136
+ if [ "$USE_CUDA" = "true" ]; then \
137
+ # If you use CUDA the whisper and embedding model will be downloaded on first use
138
+ pip3 install torch torchvision torchaudio --index-url https://download.pytorch.org/whl/$USE_CUDA_DOCKER_VER --no-cache-dir && \
139
+ uv pip install --system -r requirements.txt --no-cache-dir && \
140
+ python -c "import os; from sentence_transformers import SentenceTransformer; SentenceTransformer(os.environ['RAG_EMBEDDING_MODEL'], device='cpu')" && \
141
+ python -c "import os; from faster_whisper import WhisperModel; WhisperModel(os.environ['WHISPER_MODEL'], device='cpu', compute_type='int8', download_root=os.environ['WHISPER_MODEL_DIR'])"; \
142
+ python -c "import os; import tiktoken; tiktoken.get_encoding(os.environ['TIKTOKEN_ENCODING_NAME'])"; \
143
+ else \
144
+ pip3 install torch torchvision torchaudio --index-url https://download.pytorch.org/whl/cpu --no-cache-dir && \
145
+ uv pip install --system -r requirements.txt --no-cache-dir && \
146
+ python -c "import os; from sentence_transformers import SentenceTransformer; SentenceTransformer(os.environ['RAG_EMBEDDING_MODEL'], device='cpu')" && \
147
+ python -c "import os; from faster_whisper import WhisperModel; WhisperModel(os.environ['WHISPER_MODEL'], device='cpu', compute_type='int8', download_root=os.environ['WHISPER_MODEL_DIR'])"; \
148
+ python -c "import os; import tiktoken; tiktoken.get_encoding(os.environ['TIKTOKEN_ENCODING_NAME'])"; \
149
+ fi; \
150
+ chown -R $UID:$GID /app/backend/data/
151
+
152
+
153
+
154
+ # copy embedding weight from build
155
+ # RUN mkdir -p /root/.cache/chroma/onnx_models/all-MiniLM-L6-v2
156
+ # COPY --from=build /app/onnx /root/.cache/chroma/onnx_models/all-MiniLM-L6-v2/onnx
157
+
158
+ # copy built frontend files
159
+ COPY --chown=$UID:$GID --from=build /app/build /app/build
160
+ COPY --chown=$UID:$GID --from=build /app/CHANGELOG.md /app/CHANGELOG.md
161
+ COPY --chown=$UID:$GID --from=build /app/package.json /app/package.json
162
+
163
+ # copy backend files
164
+ COPY --chown=$UID:$GID ./backend .
165
+
166
+ EXPOSE 8080
167
+
168
+ HEALTHCHECK CMD curl --silent --fail http://localhost:${PORT:-8080}/health | jq -ne 'input.status == true' || exit 1
169
+
170
+ USER $UID:$GID
171
+
172
+ ARG BUILD_HASH
173
+ ENV WEBUI_BUILD_VERSION=${BUILD_HASH}
174
+ ENV DOCKER=true
175
+
176
+ CMD [ "bash", "start.sh"]
INSTALLATION.md ADDED
@@ -0,0 +1,35 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ### Installing Both Ollama and Open WebUI Using Kustomize
2
+
3
+ For cpu-only pod
4
+
5
+ ```bash
6
+ kubectl apply -f ./kubernetes/manifest/base
7
+ ```
8
+
9
+ For gpu-enabled pod
10
+
11
+ ```bash
12
+ kubectl apply -k ./kubernetes/manifest
13
+ ```
14
+
15
+ ### Installing Both Ollama and Open WebUI Using Helm
16
+
17
+ Package Helm file first
18
+
19
+ ```bash
20
+ helm package ./kubernetes/helm/
21
+ ```
22
+
23
+ For cpu-only pod
24
+
25
+ ```bash
26
+ helm install ollama-webui ./ollama-webui-*.tgz
27
+ ```
28
+
29
+ For gpu-enabled pod
30
+
31
+ ```bash
32
+ helm install ollama-webui ./ollama-webui-*.tgz --set ollama.resources.limits.nvidia.com/gpu="1"
33
+ ```
34
+
35
+ Check the `kubernetes/helm/values.yaml` file to know which parameters are available for customization
LICENSE ADDED
@@ -0,0 +1,21 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ MIT License
2
+
3
+ Copyright (c) 2023 Timothy Jaeryang Baek
4
+
5
+ Permission is hereby granted, free of charge, to any person obtaining a copy
6
+ of this software and associated documentation files (the "Software"), to deal
7
+ in the Software without restriction, including without limitation the rights
8
+ to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
9
+ copies of the Software, and to permit persons to whom the Software is
10
+ furnished to do so, subject to the following conditions:
11
+
12
+ The above copyright notice and this permission notice shall be included in all
13
+ copies or substantial portions of the Software.
14
+
15
+ THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16
+ IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17
+ FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
18
+ AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19
+ LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20
+ OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
21
+ SOFTWARE.
Makefile ADDED
@@ -0,0 +1,33 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+ ifneq ($(shell which docker-compose 2>/dev/null),)
3
+ DOCKER_COMPOSE := docker-compose
4
+ else
5
+ DOCKER_COMPOSE := docker compose
6
+ endif
7
+
8
+ install:
9
+ $(DOCKER_COMPOSE) up -d
10
+
11
+ remove:
12
+ @chmod +x confirm_remove.sh
13
+ @./confirm_remove.sh
14
+
15
+ start:
16
+ $(DOCKER_COMPOSE) start
17
+ startAndBuild:
18
+ $(DOCKER_COMPOSE) up -d --build
19
+
20
+ stop:
21
+ $(DOCKER_COMPOSE) stop
22
+
23
+ update:
24
+ # Calls the LLM update script
25
+ chmod +x update_ollama_models.sh
26
+ @./update_ollama_models.sh
27
+ @git pull
28
+ $(DOCKER_COMPOSE) down
29
+ # Make sure the ollama-webui container is stopped before rebuilding
30
+ @docker stop open-webui || true
31
+ $(DOCKER_COMPOSE) up --build -d
32
+ $(DOCKER_COMPOSE) start
33
+
README.md ADDED
@@ -0,0 +1,221 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ title: Open WebUI
3
+ emoji: 🐳
4
+ colorFrom: purple
5
+ colorTo: gray
6
+ sdk: docker
7
+ app_port: 8080
8
+ ---
9
+ # Open WebUI 👋
10
+
11
+ ![GitHub stars](https://img.shields.io/github/stars/open-webui/open-webui?style=social)
12
+ ![GitHub forks](https://img.shields.io/github/forks/open-webui/open-webui?style=social)
13
+ ![GitHub watchers](https://img.shields.io/github/watchers/open-webui/open-webui?style=social)
14
+ ![GitHub repo size](https://img.shields.io/github/repo-size/open-webui/open-webui)
15
+ ![GitHub language count](https://img.shields.io/github/languages/count/open-webui/open-webui)
16
+ ![GitHub top language](https://img.shields.io/github/languages/top/open-webui/open-webui)
17
+ ![GitHub last commit](https://img.shields.io/github/last-commit/open-webui/open-webui?color=red)
18
+ ![Hits](https://hits.seeyoufarm.com/api/count/incr/badge.svg?url=https%3A%2F%2Fgithub.com%2Follama-webui%2Follama-wbui&count_bg=%2379C83D&title_bg=%23555555&icon=&icon_color=%23E7E7E7&title=hits&edge_flat=false)
19
+ [![Discord](https://img.shields.io/badge/Discord-Open_WebUI-blue?logo=discord&logoColor=white)](https://discord.gg/5rJgQTnV4s)
20
+ [![](https://img.shields.io/static/v1?label=Sponsor&message=%E2%9D%A4&logo=GitHub&color=%23fe8e86)](https://github.com/sponsors/tjbck)
21
+
22
+ Open WebUI is an [extensible](https://github.com/open-webui/pipelines), feature-rich, and user-friendly self-hosted WebUI designed to operate entirely offline. It supports various LLM runners, including Ollama and OpenAI-compatible APIs. For more information, be sure to check out our [Open WebUI Documentation](https://docs.openwebui.com/).
23
+
24
+ ![Open WebUI Demo](./demo.gif)
25
+
26
+ ## Key Features of Open WebUI ⭐
27
+
28
+ - 🚀 **Effortless Setup**: Install seamlessly using Docker or Kubernetes (kubectl, kustomize or helm) for a hassle-free experience with support for both `:ollama` and `:cuda` tagged images.
29
+
30
+ - 🤝 **Ollama/OpenAI API Integration**: Effortlessly integrate OpenAI-compatible APIs for versatile conversations alongside Ollama models. Customize the OpenAI API URL to link with **LMStudio, GroqCloud, Mistral, OpenRouter, and more**.
31
+
32
+ - 🛡️ **Granular Permissions and User Groups**: By allowing administrators to create detailed user roles and permissions, we ensure a secure user environment. This granularity not only enhances security but also allows for customized user experiences, fostering a sense of ownership and responsibility amongst users.
33
+
34
+ - 📱 **Responsive Design**: Enjoy a seamless experience across Desktop PC, Laptop, and Mobile devices.
35
+
36
+ - 📱 **Progressive Web App (PWA) for Mobile**: Enjoy a native app-like experience on your mobile device with our PWA, providing offline access on localhost and a seamless user interface.
37
+
38
+ - ✒️🔢 **Full Markdown and LaTeX Support**: Elevate your LLM experience with comprehensive Markdown and LaTeX capabilities for enriched interaction.
39
+
40
+ - 🎤📹 **Hands-Free Voice/Video Call**: Experience seamless communication with integrated hands-free voice and video call features, allowing for a more dynamic and interactive chat environment.
41
+
42
+ - 🛠️ **Model Builder**: Easily create Ollama models via the Web UI. Create and add custom characters/agents, customize chat elements, and import models effortlessly through [Open WebUI Community](https://openwebui.com/) integration.
43
+
44
+ - 🐍 **Native Python Function Calling Tool**: Enhance your LLMs with built-in code editor support in the tools workspace. Bring Your Own Function (BYOF) by simply adding your pure Python functions, enabling seamless integration with LLMs.
45
+
46
+ - 📚 **Local RAG Integration**: Dive into the future of chat interactions with groundbreaking Retrieval Augmented Generation (RAG) support. This feature seamlessly integrates document interactions into your chat experience. You can load documents directly into the chat or add files to your document library, effortlessly accessing them using the `#` command before a query.
47
+
48
+ - 🔍 **Web Search for RAG**: Perform web searches using providers like `SearXNG`, `Google PSE`, `Brave Search`, `serpstack`, `serper`, `Serply`, `DuckDuckGo`, `TavilySearch`, `SearchApi` and `Bing` and inject the results directly into your chat experience.
49
+
50
+ - 🌐 **Web Browsing Capability**: Seamlessly integrate websites into your chat experience using the `#` command followed by a URL. This feature allows you to incorporate web content directly into your conversations, enhancing the richness and depth of your interactions.
51
+
52
+ - 🎨 **Image Generation Integration**: Seamlessly incorporate image generation capabilities using options such as AUTOMATIC1111 API or ComfyUI (local), and OpenAI's DALL-E (external), enriching your chat experience with dynamic visual content.
53
+
54
+ - ⚙️ **Many Models Conversations**: Effortlessly engage with various models simultaneously, harnessing their unique strengths for optimal responses. Enhance your experience by leveraging a diverse set of models in parallel.
55
+
56
+ - 🔐 **Role-Based Access Control (RBAC)**: Ensure secure access with restricted permissions; only authorized individuals can access your Ollama, and exclusive model creation/pulling rights are reserved for administrators.
57
+
58
+ - 🌐🌍 **Multilingual Support**: Experience Open WebUI in your preferred language with our internationalization (i18n) support. Join us in expanding our supported languages! We're actively seeking contributors!
59
+
60
+ - 🧩 **Pipelines, Open WebUI Plugin Support**: Seamlessly integrate custom logic and Python libraries into Open WebUI using [Pipelines Plugin Framework](https://github.com/open-webui/pipelines). Launch your Pipelines instance, set the OpenAI URL to the Pipelines URL, and explore endless possibilities. [Examples](https://github.com/open-webui/pipelines/tree/main/examples) include **Function Calling**, User **Rate Limiting** to control access, **Usage Monitoring** with tools like Langfuse, **Live Translation with LibreTranslate** for multilingual support, **Toxic Message Filtering** and much more.
61
+
62
+ - 🌟 **Continuous Updates**: We are committed to improving Open WebUI with regular updates, fixes, and new features.
63
+
64
+ Want to learn more about Open WebUI's features? Check out our [Open WebUI documentation](https://docs.openwebui.com/features) for a comprehensive overview!
65
+
66
+ ## 🔗 Also Check Out Open WebUI Community!
67
+
68
+ Don't forget to explore our sibling project, [Open WebUI Community](https://openwebui.com/), where you can discover, download, and explore customized Modelfiles. Open WebUI Community offers a wide range of exciting possibilities for enhancing your chat interactions with Open WebUI! 🚀
69
+
70
+ ## How to Install 🚀
71
+
72
+ ### Installation via Python pip 🐍
73
+
74
+ Open WebUI can be installed using pip, the Python package installer. Before proceeding, ensure you're using **Python 3.11** to avoid compatibility issues.
75
+
76
+ 1. **Install Open WebUI**:
77
+ Open your terminal and run the following command to install Open WebUI:
78
+
79
+ ```bash
80
+ pip install open-webui
81
+ ```
82
+
83
+ 2. **Running Open WebUI**:
84
+ After installation, you can start Open WebUI by executing:
85
+
86
+ ```bash
87
+ open-webui serve
88
+ ```
89
+
90
+ This will start the Open WebUI server, which you can access at [http://localhost:8080](http://localhost:8080)
91
+
92
+ ### Quick Start with Docker 🐳
93
+
94
+ > [!NOTE]
95
+ > Please note that for certain Docker environments, additional configurations might be needed. If you encounter any connection issues, our detailed guide on [Open WebUI Documentation](https://docs.openwebui.com/) is ready to assist you.
96
+
97
+ > [!WARNING]
98
+ > When using Docker to install Open WebUI, make sure to include the `-v open-webui:/app/backend/data` in your Docker command. This step is crucial as it ensures your database is properly mounted and prevents any loss of data.
99
+
100
+ > [!TIP]
101
+ > If you wish to utilize Open WebUI with Ollama included or CUDA acceleration, we recommend utilizing our official images tagged with either `:cuda` or `:ollama`. To enable CUDA, you must install the [Nvidia CUDA container toolkit](https://docs.nvidia.com/dgx/nvidia-container-runtime-upgrade/) on your Linux/WSL system.
102
+
103
+ ### Installation with Default Configuration
104
+
105
+ - **If Ollama is on your computer**, use this command:
106
+
107
+ ```bash
108
+ docker run -d -p 3000:8080 --add-host=host.docker.internal:host-gateway -v open-webui:/app/backend/data --name open-webui --restart always ghcr.io/open-webui/open-webui:main
109
+ ```
110
+
111
+ - **If Ollama is on a Different Server**, use this command:
112
+
113
+ To connect to Ollama on another server, change the `OLLAMA_BASE_URL` to the server's URL:
114
+
115
+ ```bash
116
+ docker run -d -p 3000:8080 -e OLLAMA_BASE_URL=https://example.com -v open-webui:/app/backend/data --name open-webui --restart always ghcr.io/open-webui/open-webui:main
117
+ ```
118
+
119
+ - **To run Open WebUI with Nvidia GPU support**, use this command:
120
+
121
+ ```bash
122
+ docker run -d -p 3000:8080 --gpus all --add-host=host.docker.internal:host-gateway -v open-webui:/app/backend/data --name open-webui --restart always ghcr.io/open-webui/open-webui:cuda
123
+ ```
124
+
125
+ ### Installation for OpenAI API Usage Only
126
+
127
+ - **If you're only using OpenAI API**, use this command:
128
+
129
+ ```bash
130
+ docker run -d -p 3000:8080 -e OPENAI_API_KEY=your_secret_key -v open-webui:/app/backend/data --name open-webui --restart always ghcr.io/open-webui/open-webui:main
131
+ ```
132
+
133
+ ### Installing Open WebUI with Bundled Ollama Support
134
+
135
+ This installation method uses a single container image that bundles Open WebUI with Ollama, allowing for a streamlined setup via a single command. Choose the appropriate command based on your hardware setup:
136
+
137
+ - **With GPU Support**:
138
+ Utilize GPU resources by running the following command:
139
+
140
+ ```bash
141
+ docker run -d -p 3000:8080 --gpus=all -v ollama:/root/.ollama -v open-webui:/app/backend/data --name open-webui --restart always ghcr.io/open-webui/open-webui:ollama
142
+ ```
143
+
144
+ - **For CPU Only**:
145
+ If you're not using a GPU, use this command instead:
146
+
147
+ ```bash
148
+ docker run -d -p 3000:8080 -v ollama:/root/.ollama -v open-webui:/app/backend/data --name open-webui --restart always ghcr.io/open-webui/open-webui:ollama
149
+ ```
150
+
151
+ Both commands facilitate a built-in, hassle-free installation of both Open WebUI and Ollama, ensuring that you can get everything up and running swiftly.
152
+
153
+ After installation, you can access Open WebUI at [http://localhost:3000](http://localhost:3000). Enjoy! 😄
154
+
155
+ ### Other Installation Methods
156
+
157
+ We offer various installation alternatives, including non-Docker native installation methods, Docker Compose, Kustomize, and Helm. Visit our [Open WebUI Documentation](https://docs.openwebui.com/getting-started/) or join our [Discord community](https://discord.gg/5rJgQTnV4s) for comprehensive guidance.
158
+
159
+ ### Troubleshooting
160
+
161
+ Encountering connection issues? Our [Open WebUI Documentation](https://docs.openwebui.com/troubleshooting/) has got you covered. For further assistance and to join our vibrant community, visit the [Open WebUI Discord](https://discord.gg/5rJgQTnV4s).
162
+
163
+ #### Open WebUI: Server Connection Error
164
+
165
+ If you're experiencing connection issues, it’s often due to the WebUI docker container not being able to reach the Ollama server at 127.0.0.1:11434 (host.docker.internal:11434) inside the container . Use the `--network=host` flag in your docker command to resolve this. Note that the port changes from 3000 to 8080, resulting in the link: `http://localhost:8080`.
166
+
167
+ **Example Docker Command**:
168
+
169
+ ```bash
170
+ docker run -d --network=host -v open-webui:/app/backend/data -e OLLAMA_BASE_URL=http://127.0.0.1:11434 --name open-webui --restart always ghcr.io/open-webui/open-webui:main
171
+ ```
172
+
173
+ ### Keeping Your Docker Installation Up-to-Date
174
+
175
+ In case you want to update your local Docker installation to the latest version, you can do it with [Watchtower](https://containrrr.dev/watchtower/):
176
+
177
+ ```bash
178
+ docker run --rm --volume /var/run/docker.sock:/var/run/docker.sock containrrr/watchtower --run-once open-webui
179
+ ```
180
+
181
+ In the last part of the command, replace `open-webui` with your container name if it is different.
182
+
183
+ Check our Migration Guide available in our [Open WebUI Documentation](https://docs.openwebui.com/tutorials/migration/).
184
+
185
+ ### Using the Dev Branch 🌙
186
+
187
+ > [!WARNING]
188
+ > The `:dev` branch contains the latest unstable features and changes. Use it at your own risk as it may have bugs or incomplete features.
189
+
190
+ If you want to try out the latest bleeding-edge features and are okay with occasional instability, you can use the `:dev` tag like this:
191
+
192
+ ```bash
193
+ docker run -d -p 3000:8080 -v open-webui:/app/backend/data --name open-webui --add-host=host.docker.internal:host-gateway --restart always ghcr.io/open-webui/open-webui:dev
194
+ ```
195
+
196
+ ## What's Next? 🌟
197
+
198
+ Discover upcoming features on our roadmap in the [Open WebUI Documentation](https://docs.openwebui.com/roadmap/).
199
+
200
+ ## License 📜
201
+
202
+ This project is licensed under the [MIT License](LICENSE) - see the [LICENSE](LICENSE) file for details. 📄
203
+
204
+ ## Support 💬
205
+
206
+ If you have any questions, suggestions, or need assistance, please open an issue or join our
207
+ [Open WebUI Discord community](https://discord.gg/5rJgQTnV4s) to connect with us! 🤝
208
+
209
+ ## Star History
210
+
211
+ <a href="https://star-history.com/#open-webui/open-webui&Date">
212
+ <picture>
213
+ <source media="(prefers-color-scheme: dark)" srcset="https://api.star-history.com/svg?repos=open-webui/open-webui&type=Date&theme=dark" />
214
+ <source media="(prefers-color-scheme: light)" srcset="https://api.star-history.com/svg?repos=open-webui/open-webui&type=Date" />
215
+ <img alt="Star History Chart" src="https://api.star-history.com/svg?repos=open-webui/open-webui&type=Date" />
216
+ </picture>
217
+ </a>
218
+
219
+ ---
220
+
221
+ Created by [Timothy Jaeryang Baek](https://github.com/tjbck) - Let's make Open WebUI even more amazing together! 💪
TROUBLESHOOTING.md ADDED
@@ -0,0 +1,36 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Open WebUI Troubleshooting Guide
2
+
3
+ ## Understanding the Open WebUI Architecture
4
+
5
+ The Open WebUI system is designed to streamline interactions between the client (your browser) and the Ollama API. At the heart of this design is a backend reverse proxy, enhancing security and resolving CORS issues.
6
+
7
+ - **How it Works**: The Open WebUI is designed to interact with the Ollama API through a specific route. When a request is made from the WebUI to Ollama, it is not directly sent to the Ollama API. Initially, the request is sent to the Open WebUI backend via `/ollama` route. From there, the backend is responsible for forwarding the request to the Ollama API. This forwarding is accomplished by using the route specified in the `OLLAMA_BASE_URL` environment variable. Therefore, a request made to `/ollama` in the WebUI is effectively the same as making a request to `OLLAMA_BASE_URL` in the backend. For instance, a request to `/ollama/api/tags` in the WebUI is equivalent to `OLLAMA_BASE_URL/api/tags` in the backend.
8
+
9
+ - **Security Benefits**: This design prevents direct exposure of the Ollama API to the frontend, safeguarding against potential CORS (Cross-Origin Resource Sharing) issues and unauthorized access. Requiring authentication to access the Ollama API further enhances this security layer.
10
+
11
+ ## Open WebUI: Server Connection Error
12
+
13
+ If you're experiencing connection issues, it’s often due to the WebUI docker container not being able to reach the Ollama server at 127.0.0.1:11434 (host.docker.internal:11434) inside the container . Use the `--network=host` flag in your docker command to resolve this. Note that the port changes from 3000 to 8080, resulting in the link: `http://localhost:8080`.
14
+
15
+ **Example Docker Command**:
16
+
17
+ ```bash
18
+ docker run -d --network=host -v open-webui:/app/backend/data -e OLLAMA_BASE_URL=http://127.0.0.1:11434 --name open-webui --restart always ghcr.io/open-webui/open-webui:main
19
+ ```
20
+
21
+ ### Error on Slow Responses for Ollama
22
+
23
+ Open WebUI has a default timeout of 5 minutes for Ollama to finish generating the response. If needed, this can be adjusted via the environment variable AIOHTTP_CLIENT_TIMEOUT, which sets the timeout in seconds.
24
+
25
+ ### General Connection Errors
26
+
27
+ **Ensure Ollama Version is Up-to-Date**: Always start by checking that you have the latest version of Ollama. Visit [Ollama's official site](https://ollama.com/) for the latest updates.
28
+
29
+ **Troubleshooting Steps**:
30
+
31
+ 1. **Verify Ollama URL Format**:
32
+ - When running the Web UI container, ensure the `OLLAMA_BASE_URL` is correctly set. (e.g., `http://192.168.1.1:11434` for different host setups).
33
+ - In the Open WebUI, navigate to "Settings" > "General".
34
+ - Confirm that the Ollama Server URL is correctly set to `[OLLAMA URL]` (e.g., `http://localhost:11434`).
35
+
36
+ By following these enhanced troubleshooting steps, connection issues should be effectively resolved. For further assistance or queries, feel free to reach out to us on our community Discord.
backend/.dockerignore ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ __pycache__
2
+ .env
3
+ _old
4
+ uploads
5
+ .ipynb_checkpoints
6
+ *.db
7
+ _test
8
+ !/data
9
+ /data/*
10
+ !/data/litellm
11
+ /data/litellm/*
12
+ !data/litellm/config.yaml
13
+
14
+ !data/config.json
backend/.gitignore ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ __pycache__
2
+ .env
3
+ _old
4
+ uploads
5
+ .ipynb_checkpoints
6
+ *.db
7
+ _test
8
+ Pipfile
9
+ !/data
10
+ /data/*
11
+ /open_webui/data/*
12
+ .webui_secret_key
backend/dev.sh ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ PORT="${PORT:-8080}"
2
+ uvicorn open_webui.main:app --port $PORT --host 0.0.0.0 --forwarded-allow-ips '*' --reload
backend/open_webui/__init__.py ADDED
@@ -0,0 +1,77 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import base64
2
+ import os
3
+ import random
4
+ from pathlib import Path
5
+
6
+ import typer
7
+ import uvicorn
8
+
9
+ app = typer.Typer()
10
+
11
+ KEY_FILE = Path.cwd() / ".webui_secret_key"
12
+
13
+
14
+ @app.command()
15
+ def serve(
16
+ host: str = "0.0.0.0",
17
+ port: int = 8080,
18
+ ):
19
+ os.environ["FROM_INIT_PY"] = "true"
20
+ if os.getenv("WEBUI_SECRET_KEY") is None:
21
+ typer.echo(
22
+ "Loading WEBUI_SECRET_KEY from file, not provided as an environment variable."
23
+ )
24
+ if not KEY_FILE.exists():
25
+ typer.echo(f"Generating a new secret key and saving it to {KEY_FILE}")
26
+ KEY_FILE.write_bytes(base64.b64encode(random.randbytes(12)))
27
+ typer.echo(f"Loading WEBUI_SECRET_KEY from {KEY_FILE}")
28
+ os.environ["WEBUI_SECRET_KEY"] = KEY_FILE.read_text()
29
+
30
+ if os.getenv("USE_CUDA_DOCKER", "false") == "true":
31
+ typer.echo(
32
+ "CUDA is enabled, appending LD_LIBRARY_PATH to include torch/cudnn & cublas libraries."
33
+ )
34
+ LD_LIBRARY_PATH = os.getenv("LD_LIBRARY_PATH", "").split(":")
35
+ os.environ["LD_LIBRARY_PATH"] = ":".join(
36
+ LD_LIBRARY_PATH
37
+ + [
38
+ "/usr/local/lib/python3.11/site-packages/torch/lib",
39
+ "/usr/local/lib/python3.11/site-packages/nvidia/cudnn/lib",
40
+ ]
41
+ )
42
+ try:
43
+ import torch
44
+
45
+ assert torch.cuda.is_available(), "CUDA not available"
46
+ typer.echo("CUDA seems to be working")
47
+ except Exception as e:
48
+ typer.echo(
49
+ "Error when testing CUDA but USE_CUDA_DOCKER is true. "
50
+ "Resetting USE_CUDA_DOCKER to false and removing "
51
+ f"LD_LIBRARY_PATH modifications: {e}"
52
+ )
53
+ os.environ["USE_CUDA_DOCKER"] = "false"
54
+ os.environ["LD_LIBRARY_PATH"] = ":".join(LD_LIBRARY_PATH)
55
+
56
+ import open_webui.main # we need set environment variables before importing main
57
+
58
+ uvicorn.run(open_webui.main.app, host=host, port=port, forwarded_allow_ips="*")
59
+
60
+
61
+ @app.command()
62
+ def dev(
63
+ host: str = "0.0.0.0",
64
+ port: int = 8080,
65
+ reload: bool = True,
66
+ ):
67
+ uvicorn.run(
68
+ "open_webui.main:app",
69
+ host=host,
70
+ port=port,
71
+ reload=reload,
72
+ forwarded_allow_ips="*",
73
+ )
74
+
75
+
76
+ if __name__ == "__main__":
77
+ app()
backend/open_webui/alembic.ini ADDED
@@ -0,0 +1,114 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # A generic, single database configuration.
2
+
3
+ [alembic]
4
+ # path to migration scripts
5
+ script_location = migrations
6
+
7
+ # template used to generate migration file names; The default value is %%(rev)s_%%(slug)s
8
+ # Uncomment the line below if you want the files to be prepended with date and time
9
+ # file_template = %%(year)d_%%(month).2d_%%(day).2d_%%(hour).2d%%(minute).2d-%%(rev)s_%%(slug)s
10
+
11
+ # sys.path path, will be prepended to sys.path if present.
12
+ # defaults to the current working directory.
13
+ prepend_sys_path = .
14
+
15
+ # timezone to use when rendering the date within the migration file
16
+ # as well as the filename.
17
+ # If specified, requires the python>=3.9 or backports.zoneinfo library.
18
+ # Any required deps can installed by adding `alembic[tz]` to the pip requirements
19
+ # string value is passed to ZoneInfo()
20
+ # leave blank for localtime
21
+ # timezone =
22
+
23
+ # max length of characters to apply to the
24
+ # "slug" field
25
+ # truncate_slug_length = 40
26
+
27
+ # set to 'true' to run the environment during
28
+ # the 'revision' command, regardless of autogenerate
29
+ # revision_environment = false
30
+
31
+ # set to 'true' to allow .pyc and .pyo files without
32
+ # a source .py file to be detected as revisions in the
33
+ # versions/ directory
34
+ # sourceless = false
35
+
36
+ # version location specification; This defaults
37
+ # to migrations/versions. When using multiple version
38
+ # directories, initial revisions must be specified with --version-path.
39
+ # The path separator used here should be the separator specified by "version_path_separator" below.
40
+ # version_locations = %(here)s/bar:%(here)s/bat:migrations/versions
41
+
42
+ # version path separator; As mentioned above, this is the character used to split
43
+ # version_locations. The default within new alembic.ini files is "os", which uses os.pathsep.
44
+ # If this key is omitted entirely, it falls back to the legacy behavior of splitting on spaces and/or commas.
45
+ # Valid values for version_path_separator are:
46
+ #
47
+ # version_path_separator = :
48
+ # version_path_separator = ;
49
+ # version_path_separator = space
50
+ version_path_separator = os # Use os.pathsep. Default configuration used for new projects.
51
+
52
+ # set to 'true' to search source files recursively
53
+ # in each "version_locations" directory
54
+ # new in Alembic version 1.10
55
+ # recursive_version_locations = false
56
+
57
+ # the output encoding used when revision files
58
+ # are written from script.py.mako
59
+ # output_encoding = utf-8
60
+
61
+ # sqlalchemy.url = REPLACE_WITH_DATABASE_URL
62
+
63
+
64
+ [post_write_hooks]
65
+ # post_write_hooks defines scripts or Python functions that are run
66
+ # on newly generated revision scripts. See the documentation for further
67
+ # detail and examples
68
+
69
+ # format using "black" - use the console_scripts runner, against the "black" entrypoint
70
+ # hooks = black
71
+ # black.type = console_scripts
72
+ # black.entrypoint = black
73
+ # black.options = -l 79 REVISION_SCRIPT_FILENAME
74
+
75
+ # lint with attempts to fix using "ruff" - use the exec runner, execute a binary
76
+ # hooks = ruff
77
+ # ruff.type = exec
78
+ # ruff.executable = %(here)s/.venv/bin/ruff
79
+ # ruff.options = --fix REVISION_SCRIPT_FILENAME
80
+
81
+ # Logging configuration
82
+ [loggers]
83
+ keys = root,sqlalchemy,alembic
84
+
85
+ [handlers]
86
+ keys = console
87
+
88
+ [formatters]
89
+ keys = generic
90
+
91
+ [logger_root]
92
+ level = WARN
93
+ handlers = console
94
+ qualname =
95
+
96
+ [logger_sqlalchemy]
97
+ level = WARN
98
+ handlers =
99
+ qualname = sqlalchemy.engine
100
+
101
+ [logger_alembic]
102
+ level = INFO
103
+ handlers =
104
+ qualname = alembic
105
+
106
+ [handler_console]
107
+ class = StreamHandler
108
+ args = (sys.stderr,)
109
+ level = NOTSET
110
+ formatter = generic
111
+
112
+ [formatter_generic]
113
+ format = %(levelname)-5.5s [%(name)s] %(message)s
114
+ datefmt = %H:%M:%S
backend/open_webui/apps/audio/main.py ADDED
@@ -0,0 +1,713 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import hashlib
2
+ import json
3
+ import logging
4
+ import os
5
+ import uuid
6
+ from functools import lru_cache
7
+ from pathlib import Path
8
+ from pydub import AudioSegment
9
+ from pydub.silence import split_on_silence
10
+
11
+ import requests
12
+ from open_webui.config import (
13
+ AUDIO_STT_ENGINE,
14
+ AUDIO_STT_MODEL,
15
+ AUDIO_STT_OPENAI_API_BASE_URL,
16
+ AUDIO_STT_OPENAI_API_KEY,
17
+ AUDIO_TTS_API_KEY,
18
+ AUDIO_TTS_ENGINE,
19
+ AUDIO_TTS_MODEL,
20
+ AUDIO_TTS_OPENAI_API_BASE_URL,
21
+ AUDIO_TTS_OPENAI_API_KEY,
22
+ AUDIO_TTS_SPLIT_ON,
23
+ AUDIO_TTS_VOICE,
24
+ AUDIO_TTS_AZURE_SPEECH_REGION,
25
+ AUDIO_TTS_AZURE_SPEECH_OUTPUT_FORMAT,
26
+ CACHE_DIR,
27
+ CORS_ALLOW_ORIGIN,
28
+ WHISPER_MODEL,
29
+ WHISPER_MODEL_AUTO_UPDATE,
30
+ WHISPER_MODEL_DIR,
31
+ AppConfig,
32
+ )
33
+
34
+ from open_webui.constants import ERROR_MESSAGES
35
+ from open_webui.env import (
36
+ ENV,
37
+ SRC_LOG_LEVELS,
38
+ DEVICE_TYPE,
39
+ ENABLE_FORWARD_USER_INFO_HEADERS,
40
+ )
41
+
42
+ from fastapi import Depends, FastAPI, File, HTTPException, Request, UploadFile, status
43
+ from fastapi.middleware.cors import CORSMiddleware
44
+ from fastapi.responses import FileResponse
45
+ from pydantic import BaseModel
46
+ from open_webui.utils.utils import get_admin_user, get_verified_user
47
+
48
+ # Constants
49
+ MAX_FILE_SIZE_MB = 25
50
+ MAX_FILE_SIZE = MAX_FILE_SIZE_MB * 1024 * 1024 # Convert MB to bytes
51
+
52
+
53
+ log = logging.getLogger(__name__)
54
+ log.setLevel(SRC_LOG_LEVELS["AUDIO"])
55
+
56
+ app = FastAPI(
57
+ docs_url="/docs" if ENV == "dev" else None,
58
+ openapi_url="/openapi.json" if ENV == "dev" else None,
59
+ redoc_url=None,
60
+ )
61
+
62
+ app.add_middleware(
63
+ CORSMiddleware,
64
+ allow_origins=CORS_ALLOW_ORIGIN,
65
+ allow_credentials=True,
66
+ allow_methods=["*"],
67
+ allow_headers=["*"],
68
+ )
69
+
70
+ app.state.config = AppConfig()
71
+
72
+ app.state.config.STT_OPENAI_API_BASE_URL = AUDIO_STT_OPENAI_API_BASE_URL
73
+ app.state.config.STT_OPENAI_API_KEY = AUDIO_STT_OPENAI_API_KEY
74
+ app.state.config.STT_ENGINE = AUDIO_STT_ENGINE
75
+ app.state.config.STT_MODEL = AUDIO_STT_MODEL
76
+
77
+ app.state.config.WHISPER_MODEL = WHISPER_MODEL
78
+ app.state.faster_whisper_model = None
79
+
80
+ app.state.config.TTS_OPENAI_API_BASE_URL = AUDIO_TTS_OPENAI_API_BASE_URL
81
+ app.state.config.TTS_OPENAI_API_KEY = AUDIO_TTS_OPENAI_API_KEY
82
+ app.state.config.TTS_ENGINE = AUDIO_TTS_ENGINE
83
+ app.state.config.TTS_MODEL = AUDIO_TTS_MODEL
84
+ app.state.config.TTS_VOICE = AUDIO_TTS_VOICE
85
+ app.state.config.TTS_API_KEY = AUDIO_TTS_API_KEY
86
+ app.state.config.TTS_SPLIT_ON = AUDIO_TTS_SPLIT_ON
87
+
88
+
89
+ app.state.speech_synthesiser = None
90
+ app.state.speech_speaker_embeddings_dataset = None
91
+
92
+ app.state.config.TTS_AZURE_SPEECH_REGION = AUDIO_TTS_AZURE_SPEECH_REGION
93
+ app.state.config.TTS_AZURE_SPEECH_OUTPUT_FORMAT = AUDIO_TTS_AZURE_SPEECH_OUTPUT_FORMAT
94
+
95
+ # setting device type for whisper model
96
+ whisper_device_type = DEVICE_TYPE if DEVICE_TYPE and DEVICE_TYPE == "cuda" else "cpu"
97
+ log.info(f"whisper_device_type: {whisper_device_type}")
98
+
99
+ SPEECH_CACHE_DIR = Path(CACHE_DIR).joinpath("./audio/speech/")
100
+ SPEECH_CACHE_DIR.mkdir(parents=True, exist_ok=True)
101
+
102
+
103
+ def set_faster_whisper_model(model: str, auto_update: bool = False):
104
+ if model and app.state.config.STT_ENGINE == "":
105
+ from faster_whisper import WhisperModel
106
+
107
+ faster_whisper_kwargs = {
108
+ "model_size_or_path": model,
109
+ "device": whisper_device_type,
110
+ "compute_type": "int8",
111
+ "download_root": WHISPER_MODEL_DIR,
112
+ "local_files_only": not auto_update,
113
+ }
114
+
115
+ try:
116
+ app.state.faster_whisper_model = WhisperModel(**faster_whisper_kwargs)
117
+ except Exception:
118
+ log.warning(
119
+ "WhisperModel initialization failed, attempting download with local_files_only=False"
120
+ )
121
+ faster_whisper_kwargs["local_files_only"] = False
122
+ app.state.faster_whisper_model = WhisperModel(**faster_whisper_kwargs)
123
+
124
+ else:
125
+ app.state.faster_whisper_model = None
126
+
127
+
128
+ class TTSConfigForm(BaseModel):
129
+ OPENAI_API_BASE_URL: str
130
+ OPENAI_API_KEY: str
131
+ API_KEY: str
132
+ ENGINE: str
133
+ MODEL: str
134
+ VOICE: str
135
+ SPLIT_ON: str
136
+ AZURE_SPEECH_REGION: str
137
+ AZURE_SPEECH_OUTPUT_FORMAT: str
138
+
139
+
140
+ class STTConfigForm(BaseModel):
141
+ OPENAI_API_BASE_URL: str
142
+ OPENAI_API_KEY: str
143
+ ENGINE: str
144
+ MODEL: str
145
+ WHISPER_MODEL: str
146
+
147
+
148
+ class AudioConfigUpdateForm(BaseModel):
149
+ tts: TTSConfigForm
150
+ stt: STTConfigForm
151
+
152
+
153
+ from pydub import AudioSegment
154
+ from pydub.utils import mediainfo
155
+
156
+
157
+ def is_mp4_audio(file_path):
158
+ """Check if the given file is an MP4 audio file."""
159
+ if not os.path.isfile(file_path):
160
+ print(f"File not found: {file_path}")
161
+ return False
162
+
163
+ info = mediainfo(file_path)
164
+ if (
165
+ info.get("codec_name") == "aac"
166
+ and info.get("codec_type") == "audio"
167
+ and info.get("codec_tag_string") == "mp4a"
168
+ ):
169
+ return True
170
+ return False
171
+
172
+
173
+ def convert_mp4_to_wav(file_path, output_path):
174
+ """Convert MP4 audio file to WAV format."""
175
+ audio = AudioSegment.from_file(file_path, format="mp4")
176
+ audio.export(output_path, format="wav")
177
+ print(f"Converted {file_path} to {output_path}")
178
+
179
+
180
+ @app.get("/config")
181
+ async def get_audio_config(user=Depends(get_admin_user)):
182
+ return {
183
+ "tts": {
184
+ "OPENAI_API_BASE_URL": app.state.config.TTS_OPENAI_API_BASE_URL,
185
+ "OPENAI_API_KEY": app.state.config.TTS_OPENAI_API_KEY,
186
+ "API_KEY": app.state.config.TTS_API_KEY,
187
+ "ENGINE": app.state.config.TTS_ENGINE,
188
+ "MODEL": app.state.config.TTS_MODEL,
189
+ "VOICE": app.state.config.TTS_VOICE,
190
+ "SPLIT_ON": app.state.config.TTS_SPLIT_ON,
191
+ "AZURE_SPEECH_REGION": app.state.config.TTS_AZURE_SPEECH_REGION,
192
+ "AZURE_SPEECH_OUTPUT_FORMAT": app.state.config.TTS_AZURE_SPEECH_OUTPUT_FORMAT,
193
+ },
194
+ "stt": {
195
+ "OPENAI_API_BASE_URL": app.state.config.STT_OPENAI_API_BASE_URL,
196
+ "OPENAI_API_KEY": app.state.config.STT_OPENAI_API_KEY,
197
+ "ENGINE": app.state.config.STT_ENGINE,
198
+ "MODEL": app.state.config.STT_MODEL,
199
+ "WHISPER_MODEL": app.state.config.WHISPER_MODEL,
200
+ },
201
+ }
202
+
203
+
204
+ @app.post("/config/update")
205
+ async def update_audio_config(
206
+ form_data: AudioConfigUpdateForm, user=Depends(get_admin_user)
207
+ ):
208
+ app.state.config.TTS_OPENAI_API_BASE_URL = form_data.tts.OPENAI_API_BASE_URL
209
+ app.state.config.TTS_OPENAI_API_KEY = form_data.tts.OPENAI_API_KEY
210
+ app.state.config.TTS_API_KEY = form_data.tts.API_KEY
211
+ app.state.config.TTS_ENGINE = form_data.tts.ENGINE
212
+ app.state.config.TTS_MODEL = form_data.tts.MODEL
213
+ app.state.config.TTS_VOICE = form_data.tts.VOICE
214
+ app.state.config.TTS_SPLIT_ON = form_data.tts.SPLIT_ON
215
+ app.state.config.TTS_AZURE_SPEECH_REGION = form_data.tts.AZURE_SPEECH_REGION
216
+ app.state.config.TTS_AZURE_SPEECH_OUTPUT_FORMAT = (
217
+ form_data.tts.AZURE_SPEECH_OUTPUT_FORMAT
218
+ )
219
+
220
+ app.state.config.STT_OPENAI_API_BASE_URL = form_data.stt.OPENAI_API_BASE_URL
221
+ app.state.config.STT_OPENAI_API_KEY = form_data.stt.OPENAI_API_KEY
222
+ app.state.config.STT_ENGINE = form_data.stt.ENGINE
223
+ app.state.config.STT_MODEL = form_data.stt.MODEL
224
+ app.state.config.WHISPER_MODEL = form_data.stt.WHISPER_MODEL
225
+ set_faster_whisper_model(form_data.stt.WHISPER_MODEL, WHISPER_MODEL_AUTO_UPDATE)
226
+
227
+ return {
228
+ "tts": {
229
+ "OPENAI_API_BASE_URL": app.state.config.TTS_OPENAI_API_BASE_URL,
230
+ "OPENAI_API_KEY": app.state.config.TTS_OPENAI_API_KEY,
231
+ "API_KEY": app.state.config.TTS_API_KEY,
232
+ "ENGINE": app.state.config.TTS_ENGINE,
233
+ "MODEL": app.state.config.TTS_MODEL,
234
+ "VOICE": app.state.config.TTS_VOICE,
235
+ "SPLIT_ON": app.state.config.TTS_SPLIT_ON,
236
+ "AZURE_SPEECH_REGION": app.state.config.TTS_AZURE_SPEECH_REGION,
237
+ "AZURE_SPEECH_OUTPUT_FORMAT": app.state.config.TTS_AZURE_SPEECH_OUTPUT_FORMAT,
238
+ },
239
+ "stt": {
240
+ "OPENAI_API_BASE_URL": app.state.config.STT_OPENAI_API_BASE_URL,
241
+ "OPENAI_API_KEY": app.state.config.STT_OPENAI_API_KEY,
242
+ "ENGINE": app.state.config.STT_ENGINE,
243
+ "MODEL": app.state.config.STT_MODEL,
244
+ "WHISPER_MODEL": app.state.config.WHISPER_MODEL,
245
+ },
246
+ }
247
+
248
+
249
+ def load_speech_pipeline():
250
+ from transformers import pipeline
251
+ from datasets import load_dataset
252
+
253
+ if app.state.speech_synthesiser is None:
254
+ app.state.speech_synthesiser = pipeline(
255
+ "text-to-speech", "microsoft/speecht5_tts"
256
+ )
257
+
258
+ if app.state.speech_speaker_embeddings_dataset is None:
259
+ app.state.speech_speaker_embeddings_dataset = load_dataset(
260
+ "Matthijs/cmu-arctic-xvectors", split="validation"
261
+ )
262
+
263
+
264
+ @app.post("/speech")
265
+ async def speech(request: Request, user=Depends(get_verified_user)):
266
+ body = await request.body()
267
+ name = hashlib.sha256(body).hexdigest()
268
+
269
+ file_path = SPEECH_CACHE_DIR.joinpath(f"{name}.mp3")
270
+ file_body_path = SPEECH_CACHE_DIR.joinpath(f"{name}.json")
271
+
272
+ # Check if the file already exists in the cache
273
+ if file_path.is_file():
274
+ return FileResponse(file_path)
275
+
276
+ if app.state.config.TTS_ENGINE == "openai":
277
+ headers = {}
278
+ headers["Authorization"] = f"Bearer {app.state.config.TTS_OPENAI_API_KEY}"
279
+ headers["Content-Type"] = "application/json"
280
+
281
+ if ENABLE_FORWARD_USER_INFO_HEADERS:
282
+ headers["X-OpenWebUI-User-Name"] = user.name
283
+ headers["X-OpenWebUI-User-Id"] = user.id
284
+ headers["X-OpenWebUI-User-Email"] = user.email
285
+ headers["X-OpenWebUI-User-Role"] = user.role
286
+
287
+ try:
288
+ body = body.decode("utf-8")
289
+ body = json.loads(body)
290
+ body["model"] = app.state.config.TTS_MODEL
291
+ body = json.dumps(body).encode("utf-8")
292
+ except Exception:
293
+ pass
294
+
295
+ r = None
296
+ try:
297
+ r = requests.post(
298
+ url=f"{app.state.config.TTS_OPENAI_API_BASE_URL}/audio/speech",
299
+ data=body,
300
+ headers=headers,
301
+ stream=True,
302
+ )
303
+
304
+ r.raise_for_status()
305
+
306
+ # Save the streaming content to a file
307
+ with open(file_path, "wb") as f:
308
+ for chunk in r.iter_content(chunk_size=8192):
309
+ f.write(chunk)
310
+
311
+ with open(file_body_path, "w") as f:
312
+ json.dump(json.loads(body.decode("utf-8")), f)
313
+
314
+ # Return the saved file
315
+ return FileResponse(file_path)
316
+
317
+ except Exception as e:
318
+ log.exception(e)
319
+ error_detail = "Open WebUI: Server Connection Error"
320
+ if r is not None:
321
+ try:
322
+ res = r.json()
323
+ if "error" in res:
324
+ error_detail = f"External: {res['error']['message']}"
325
+ except Exception:
326
+ error_detail = f"External: {e}"
327
+
328
+ raise HTTPException(
329
+ status_code=r.status_code if r != None else 500,
330
+ detail=error_detail,
331
+ )
332
+
333
+ elif app.state.config.TTS_ENGINE == "elevenlabs":
334
+ payload = None
335
+ try:
336
+ payload = json.loads(body.decode("utf-8"))
337
+ except Exception as e:
338
+ log.exception(e)
339
+ raise HTTPException(status_code=400, detail="Invalid JSON payload")
340
+
341
+ voice_id = payload.get("voice", "")
342
+
343
+ if voice_id not in get_available_voices():
344
+ raise HTTPException(
345
+ status_code=400,
346
+ detail="Invalid voice id",
347
+ )
348
+
349
+ url = f"https://api.elevenlabs.io/v1/text-to-speech/{voice_id}"
350
+
351
+ headers = {
352
+ "Accept": "audio/mpeg",
353
+ "Content-Type": "application/json",
354
+ "xi-api-key": app.state.config.TTS_API_KEY,
355
+ }
356
+
357
+ data = {
358
+ "text": payload["input"],
359
+ "model_id": app.state.config.TTS_MODEL,
360
+ "voice_settings": {"stability": 0.5, "similarity_boost": 0.5},
361
+ }
362
+
363
+ try:
364
+ r = requests.post(url, json=data, headers=headers)
365
+
366
+ r.raise_for_status()
367
+
368
+ # Save the streaming content to a file
369
+ with open(file_path, "wb") as f:
370
+ for chunk in r.iter_content(chunk_size=8192):
371
+ f.write(chunk)
372
+
373
+ with open(file_body_path, "w") as f:
374
+ json.dump(json.loads(body.decode("utf-8")), f)
375
+
376
+ # Return the saved file
377
+ return FileResponse(file_path)
378
+
379
+ except Exception as e:
380
+ log.exception(e)
381
+ error_detail = "Open WebUI: Server Connection Error"
382
+ if r is not None:
383
+ try:
384
+ res = r.json()
385
+ if "error" in res:
386
+ error_detail = f"External: {res['error']['message']}"
387
+ except Exception:
388
+ error_detail = f"External: {e}"
389
+
390
+ raise HTTPException(
391
+ status_code=r.status_code if r != None else 500,
392
+ detail=error_detail,
393
+ )
394
+
395
+ elif app.state.config.TTS_ENGINE == "azure":
396
+ payload = None
397
+ try:
398
+ payload = json.loads(body.decode("utf-8"))
399
+ except Exception as e:
400
+ log.exception(e)
401
+ raise HTTPException(status_code=400, detail="Invalid JSON payload")
402
+
403
+ region = app.state.config.TTS_AZURE_SPEECH_REGION
404
+ language = app.state.config.TTS_VOICE
405
+ locale = "-".join(app.state.config.TTS_VOICE.split("-")[:1])
406
+ output_format = app.state.config.TTS_AZURE_SPEECH_OUTPUT_FORMAT
407
+ url = f"https://{region}.tts.speech.microsoft.com/cognitiveservices/v1"
408
+
409
+ headers = {
410
+ "Ocp-Apim-Subscription-Key": app.state.config.TTS_API_KEY,
411
+ "Content-Type": "application/ssml+xml",
412
+ "X-Microsoft-OutputFormat": output_format,
413
+ }
414
+
415
+ data = f"""<speak version="1.0" xmlns="http://www.w3.org/2001/10/synthesis" xml:lang="{locale}">
416
+ <voice name="{language}">{payload["input"]}</voice>
417
+ </speak>"""
418
+
419
+ response = requests.post(url, headers=headers, data=data)
420
+
421
+ if response.status_code == 200:
422
+ with open(file_path, "wb") as f:
423
+ f.write(response.content)
424
+ return FileResponse(file_path)
425
+ else:
426
+ log.error(f"Error synthesizing speech - {response.reason}")
427
+ raise HTTPException(
428
+ status_code=500, detail=f"Error synthesizing speech - {response.reason}"
429
+ )
430
+ elif app.state.config.TTS_ENGINE == "transformers":
431
+ payload = None
432
+ try:
433
+ payload = json.loads(body.decode("utf-8"))
434
+ except Exception as e:
435
+ log.exception(e)
436
+ raise HTTPException(status_code=400, detail="Invalid JSON payload")
437
+
438
+ import torch
439
+ import soundfile as sf
440
+
441
+ load_speech_pipeline()
442
+
443
+ embeddings_dataset = app.state.speech_speaker_embeddings_dataset
444
+
445
+ speaker_index = 6799
446
+ try:
447
+ speaker_index = embeddings_dataset["filename"].index(
448
+ app.state.config.TTS_MODEL
449
+ )
450
+ except Exception:
451
+ pass
452
+
453
+ speaker_embedding = torch.tensor(
454
+ embeddings_dataset[speaker_index]["xvector"]
455
+ ).unsqueeze(0)
456
+
457
+ speech = app.state.speech_synthesiser(
458
+ payload["input"],
459
+ forward_params={"speaker_embeddings": speaker_embedding},
460
+ )
461
+
462
+ sf.write(file_path, speech["audio"], samplerate=speech["sampling_rate"])
463
+ with open(file_body_path, "w") as f:
464
+ json.dump(json.loads(body.decode("utf-8")), f)
465
+
466
+ return FileResponse(file_path)
467
+
468
+
469
+ def transcribe(file_path):
470
+ print("transcribe", file_path)
471
+ filename = os.path.basename(file_path)
472
+ file_dir = os.path.dirname(file_path)
473
+ id = filename.split(".")[0]
474
+
475
+ if app.state.config.STT_ENGINE == "":
476
+ if app.state.faster_whisper_model is None:
477
+ set_faster_whisper_model(app.state.config.WHISPER_MODEL)
478
+
479
+ model = app.state.faster_whisper_model
480
+ segments, info = model.transcribe(file_path, beam_size=5)
481
+ log.info(
482
+ "Detected language '%s' with probability %f"
483
+ % (info.language, info.language_probability)
484
+ )
485
+
486
+ transcript = "".join([segment.text for segment in list(segments)])
487
+ data = {"text": transcript.strip()}
488
+
489
+ # save the transcript to a json file
490
+ transcript_file = f"{file_dir}/{id}.json"
491
+ with open(transcript_file, "w") as f:
492
+ json.dump(data, f)
493
+
494
+ log.debug(data)
495
+ return data
496
+ elif app.state.config.STT_ENGINE == "openai":
497
+ if is_mp4_audio(file_path):
498
+ print("is_mp4_audio")
499
+ os.rename(file_path, file_path.replace(".wav", ".mp4"))
500
+ # Convert MP4 audio file to WAV format
501
+ convert_mp4_to_wav(file_path.replace(".wav", ".mp4"), file_path)
502
+
503
+ headers = {"Authorization": f"Bearer {app.state.config.STT_OPENAI_API_KEY}"}
504
+
505
+ files = {"file": (filename, open(file_path, "rb"))}
506
+ data = {"model": app.state.config.STT_MODEL}
507
+
508
+ log.debug(files, data)
509
+
510
+ r = None
511
+ try:
512
+ r = requests.post(
513
+ url=f"{app.state.config.STT_OPENAI_API_BASE_URL}/audio/transcriptions",
514
+ headers=headers,
515
+ files=files,
516
+ data=data,
517
+ )
518
+
519
+ r.raise_for_status()
520
+
521
+ data = r.json()
522
+
523
+ # save the transcript to a json file
524
+ transcript_file = f"{file_dir}/{id}.json"
525
+ with open(transcript_file, "w") as f:
526
+ json.dump(data, f)
527
+
528
+ print(data)
529
+ return data
530
+ except Exception as e:
531
+ log.exception(e)
532
+ error_detail = "Open WebUI: Server Connection Error"
533
+ if r is not None:
534
+ try:
535
+ res = r.json()
536
+ if "error" in res:
537
+ error_detail = f"External: {res['error']['message']}"
538
+ except Exception:
539
+ error_detail = f"External: {e}"
540
+
541
+ raise Exception(error_detail)
542
+
543
+
544
+ @app.post("/transcriptions")
545
+ def transcription(
546
+ file: UploadFile = File(...),
547
+ user=Depends(get_verified_user),
548
+ ):
549
+ log.info(f"file.content_type: {file.content_type}")
550
+
551
+ if file.content_type not in ["audio/mpeg", "audio/wav", "audio/ogg", "audio/x-m4a"]:
552
+ raise HTTPException(
553
+ status_code=status.HTTP_400_BAD_REQUEST,
554
+ detail=ERROR_MESSAGES.FILE_NOT_SUPPORTED,
555
+ )
556
+
557
+ try:
558
+ ext = file.filename.split(".")[-1]
559
+ id = uuid.uuid4()
560
+
561
+ filename = f"{id}.{ext}"
562
+ contents = file.file.read()
563
+
564
+ file_dir = f"{CACHE_DIR}/audio/transcriptions"
565
+ os.makedirs(file_dir, exist_ok=True)
566
+ file_path = f"{file_dir}/{filename}"
567
+
568
+ with open(file_path, "wb") as f:
569
+ f.write(contents)
570
+
571
+ try:
572
+ if os.path.getsize(file_path) > MAX_FILE_SIZE: # file is bigger than 25MB
573
+ log.debug(f"File size is larger than {MAX_FILE_SIZE_MB}MB")
574
+ audio = AudioSegment.from_file(file_path)
575
+ audio = audio.set_frame_rate(16000).set_channels(1) # Compress audio
576
+ compressed_path = f"{file_dir}/{id}_compressed.opus"
577
+ audio.export(compressed_path, format="opus", bitrate="32k")
578
+ log.debug(f"Compressed audio to {compressed_path}")
579
+ file_path = compressed_path
580
+
581
+ if (
582
+ os.path.getsize(file_path) > MAX_FILE_SIZE
583
+ ): # Still larger than 25MB after compression
584
+ log.debug(
585
+ f"Compressed file size is still larger than {MAX_FILE_SIZE_MB}MB: {os.path.getsize(file_path)}"
586
+ )
587
+ raise HTTPException(
588
+ status_code=status.HTTP_400_BAD_REQUEST,
589
+ detail=ERROR_MESSAGES.FILE_TOO_LARGE(
590
+ size=f"{MAX_FILE_SIZE_MB}MB"
591
+ ),
592
+ )
593
+
594
+ data = transcribe(file_path)
595
+ else:
596
+ data = transcribe(file_path)
597
+
598
+ file_path = file_path.split("/")[-1]
599
+ return {**data, "filename": file_path}
600
+ except Exception as e:
601
+ log.exception(e)
602
+ raise HTTPException(
603
+ status_code=status.HTTP_400_BAD_REQUEST,
604
+ detail=ERROR_MESSAGES.DEFAULT(e),
605
+ )
606
+
607
+ except Exception as e:
608
+ log.exception(e)
609
+
610
+ raise HTTPException(
611
+ status_code=status.HTTP_400_BAD_REQUEST,
612
+ detail=ERROR_MESSAGES.DEFAULT(e),
613
+ )
614
+
615
+
616
+ def get_available_models() -> list[dict]:
617
+ if app.state.config.TTS_ENGINE == "openai":
618
+ return [{"id": "tts-1"}, {"id": "tts-1-hd"}]
619
+ elif app.state.config.TTS_ENGINE == "elevenlabs":
620
+ headers = {
621
+ "xi-api-key": app.state.config.TTS_API_KEY,
622
+ "Content-Type": "application/json",
623
+ }
624
+
625
+ try:
626
+ response = requests.get(
627
+ "https://api.elevenlabs.io/v1/models", headers=headers, timeout=5
628
+ )
629
+ response.raise_for_status()
630
+ models = response.json()
631
+ return [
632
+ {"name": model["name"], "id": model["model_id"]} for model in models
633
+ ]
634
+ except requests.RequestException as e:
635
+ log.error(f"Error fetching voices: {str(e)}")
636
+ return []
637
+
638
+
639
+ @app.get("/models")
640
+ async def get_models(user=Depends(get_verified_user)):
641
+ return {"models": get_available_models()}
642
+
643
+
644
+ def get_available_voices() -> dict:
645
+ """Returns {voice_id: voice_name} dict"""
646
+ ret = {}
647
+ if app.state.config.TTS_ENGINE == "openai":
648
+ ret = {
649
+ "alloy": "alloy",
650
+ "echo": "echo",
651
+ "fable": "fable",
652
+ "onyx": "onyx",
653
+ "nova": "nova",
654
+ "shimmer": "shimmer",
655
+ }
656
+ elif app.state.config.TTS_ENGINE == "elevenlabs":
657
+ try:
658
+ ret = get_elevenlabs_voices()
659
+ except Exception:
660
+ # Avoided @lru_cache with exception
661
+ pass
662
+ elif app.state.config.TTS_ENGINE == "azure":
663
+ try:
664
+ region = app.state.config.TTS_AZURE_SPEECH_REGION
665
+ url = f"https://{region}.tts.speech.microsoft.com/cognitiveservices/voices/list"
666
+ headers = {"Ocp-Apim-Subscription-Key": app.state.config.TTS_API_KEY}
667
+
668
+ response = requests.get(url, headers=headers)
669
+ response.raise_for_status()
670
+ voices = response.json()
671
+ for voice in voices:
672
+ ret[voice["ShortName"]] = (
673
+ f"{voice['DisplayName']} ({voice['ShortName']})"
674
+ )
675
+ except requests.RequestException as e:
676
+ log.error(f"Error fetching voices: {str(e)}")
677
+
678
+ return ret
679
+
680
+
681
+ @lru_cache
682
+ def get_elevenlabs_voices() -> dict:
683
+ """
684
+ Note, set the following in your .env file to use Elevenlabs:
685
+ AUDIO_TTS_ENGINE=elevenlabs
686
+ AUDIO_TTS_API_KEY=sk_... # Your Elevenlabs API key
687
+ AUDIO_TTS_VOICE=EXAVITQu4vr4xnSDxMaL # From https://api.elevenlabs.io/v1/voices
688
+ AUDIO_TTS_MODEL=eleven_multilingual_v2
689
+ """
690
+ headers = {
691
+ "xi-api-key": app.state.config.TTS_API_KEY,
692
+ "Content-Type": "application/json",
693
+ }
694
+ try:
695
+ # TODO: Add retries
696
+ response = requests.get("https://api.elevenlabs.io/v1/voices", headers=headers)
697
+ response.raise_for_status()
698
+ voices_data = response.json()
699
+
700
+ voices = {}
701
+ for voice in voices_data.get("voices", []):
702
+ voices[voice["voice_id"]] = voice["name"]
703
+ except requests.RequestException as e:
704
+ # Avoid @lru_cache with exception
705
+ log.error(f"Error fetching voices: {str(e)}")
706
+ raise RuntimeError(f"Error fetching voices: {str(e)}")
707
+
708
+ return voices
709
+
710
+
711
+ @app.get("/voices")
712
+ async def get_voices(user=Depends(get_verified_user)):
713
+ return {"voices": [{"id": k, "name": v} for k, v in get_available_voices().items()]}
backend/open_webui/apps/images/main.py ADDED
@@ -0,0 +1,609 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import asyncio
2
+ import base64
3
+ import json
4
+ import logging
5
+ import mimetypes
6
+ import re
7
+ import uuid
8
+ from pathlib import Path
9
+ from typing import Optional
10
+
11
+ import requests
12
+ from open_webui.apps.images.utils.comfyui import (
13
+ ComfyUIGenerateImageForm,
14
+ ComfyUIWorkflow,
15
+ comfyui_generate_image,
16
+ )
17
+ from open_webui.config import (
18
+ AUTOMATIC1111_API_AUTH,
19
+ AUTOMATIC1111_BASE_URL,
20
+ AUTOMATIC1111_CFG_SCALE,
21
+ AUTOMATIC1111_SAMPLER,
22
+ AUTOMATIC1111_SCHEDULER,
23
+ CACHE_DIR,
24
+ COMFYUI_BASE_URL,
25
+ COMFYUI_WORKFLOW,
26
+ COMFYUI_WORKFLOW_NODES,
27
+ CORS_ALLOW_ORIGIN,
28
+ ENABLE_IMAGE_GENERATION,
29
+ IMAGE_GENERATION_ENGINE,
30
+ IMAGE_GENERATION_MODEL,
31
+ IMAGE_SIZE,
32
+ IMAGE_STEPS,
33
+ IMAGES_OPENAI_API_BASE_URL,
34
+ IMAGES_OPENAI_API_KEY,
35
+ AppConfig,
36
+ )
37
+ from open_webui.constants import ERROR_MESSAGES
38
+ from open_webui.env import ENV, SRC_LOG_LEVELS, ENABLE_FORWARD_USER_INFO_HEADERS
39
+
40
+ from fastapi import Depends, FastAPI, HTTPException, Request
41
+ from fastapi.middleware.cors import CORSMiddleware
42
+ from pydantic import BaseModel
43
+ from open_webui.utils.utils import get_admin_user, get_verified_user
44
+
45
+ log = logging.getLogger(__name__)
46
+ log.setLevel(SRC_LOG_LEVELS["IMAGES"])
47
+
48
+ IMAGE_CACHE_DIR = Path(CACHE_DIR).joinpath("./image/generations/")
49
+ IMAGE_CACHE_DIR.mkdir(parents=True, exist_ok=True)
50
+
51
+ app = FastAPI(
52
+ docs_url="/docs" if ENV == "dev" else None,
53
+ openapi_url="/openapi.json" if ENV == "dev" else None,
54
+ redoc_url=None,
55
+ )
56
+
57
+ app.add_middleware(
58
+ CORSMiddleware,
59
+ allow_origins=CORS_ALLOW_ORIGIN,
60
+ allow_credentials=True,
61
+ allow_methods=["*"],
62
+ allow_headers=["*"],
63
+ )
64
+
65
+ app.state.config = AppConfig()
66
+
67
+ app.state.config.ENGINE = IMAGE_GENERATION_ENGINE
68
+ app.state.config.ENABLED = ENABLE_IMAGE_GENERATION
69
+
70
+ app.state.config.OPENAI_API_BASE_URL = IMAGES_OPENAI_API_BASE_URL
71
+ app.state.config.OPENAI_API_KEY = IMAGES_OPENAI_API_KEY
72
+
73
+ app.state.config.MODEL = IMAGE_GENERATION_MODEL
74
+
75
+ app.state.config.AUTOMATIC1111_BASE_URL = AUTOMATIC1111_BASE_URL
76
+ app.state.config.AUTOMATIC1111_API_AUTH = AUTOMATIC1111_API_AUTH
77
+ app.state.config.AUTOMATIC1111_CFG_SCALE = AUTOMATIC1111_CFG_SCALE
78
+ app.state.config.AUTOMATIC1111_SAMPLER = AUTOMATIC1111_SAMPLER
79
+ app.state.config.AUTOMATIC1111_SCHEDULER = AUTOMATIC1111_SCHEDULER
80
+ app.state.config.COMFYUI_BASE_URL = COMFYUI_BASE_URL
81
+ app.state.config.COMFYUI_WORKFLOW = COMFYUI_WORKFLOW
82
+ app.state.config.COMFYUI_WORKFLOW_NODES = COMFYUI_WORKFLOW_NODES
83
+
84
+ app.state.config.IMAGE_SIZE = IMAGE_SIZE
85
+ app.state.config.IMAGE_STEPS = IMAGE_STEPS
86
+
87
+
88
+ @app.get("/config")
89
+ async def get_config(request: Request, user=Depends(get_admin_user)):
90
+ return {
91
+ "enabled": app.state.config.ENABLED,
92
+ "engine": app.state.config.ENGINE,
93
+ "openai": {
94
+ "OPENAI_API_BASE_URL": app.state.config.OPENAI_API_BASE_URL,
95
+ "OPENAI_API_KEY": app.state.config.OPENAI_API_KEY,
96
+ },
97
+ "automatic1111": {
98
+ "AUTOMATIC1111_BASE_URL": app.state.config.AUTOMATIC1111_BASE_URL,
99
+ "AUTOMATIC1111_API_AUTH": app.state.config.AUTOMATIC1111_API_AUTH,
100
+ "AUTOMATIC1111_CFG_SCALE": app.state.config.AUTOMATIC1111_CFG_SCALE,
101
+ "AUTOMATIC1111_SAMPLER": app.state.config.AUTOMATIC1111_SAMPLER,
102
+ "AUTOMATIC1111_SCHEDULER": app.state.config.AUTOMATIC1111_SCHEDULER,
103
+ },
104
+ "comfyui": {
105
+ "COMFYUI_BASE_URL": app.state.config.COMFYUI_BASE_URL,
106
+ "COMFYUI_WORKFLOW": app.state.config.COMFYUI_WORKFLOW,
107
+ "COMFYUI_WORKFLOW_NODES": app.state.config.COMFYUI_WORKFLOW_NODES,
108
+ },
109
+ }
110
+
111
+
112
+ class OpenAIConfigForm(BaseModel):
113
+ OPENAI_API_BASE_URL: str
114
+ OPENAI_API_KEY: str
115
+
116
+
117
+ class Automatic1111ConfigForm(BaseModel):
118
+ AUTOMATIC1111_BASE_URL: str
119
+ AUTOMATIC1111_API_AUTH: str
120
+ AUTOMATIC1111_CFG_SCALE: Optional[str]
121
+ AUTOMATIC1111_SAMPLER: Optional[str]
122
+ AUTOMATIC1111_SCHEDULER: Optional[str]
123
+
124
+
125
+ class ComfyUIConfigForm(BaseModel):
126
+ COMFYUI_BASE_URL: str
127
+ COMFYUI_WORKFLOW: str
128
+ COMFYUI_WORKFLOW_NODES: list[dict]
129
+
130
+
131
+ class ConfigForm(BaseModel):
132
+ enabled: bool
133
+ engine: str
134
+ openai: OpenAIConfigForm
135
+ automatic1111: Automatic1111ConfigForm
136
+ comfyui: ComfyUIConfigForm
137
+
138
+
139
+ @app.post("/config/update")
140
+ async def update_config(form_data: ConfigForm, user=Depends(get_admin_user)):
141
+ app.state.config.ENGINE = form_data.engine
142
+ app.state.config.ENABLED = form_data.enabled
143
+
144
+ app.state.config.OPENAI_API_BASE_URL = form_data.openai.OPENAI_API_BASE_URL
145
+ app.state.config.OPENAI_API_KEY = form_data.openai.OPENAI_API_KEY
146
+
147
+ app.state.config.AUTOMATIC1111_BASE_URL = (
148
+ form_data.automatic1111.AUTOMATIC1111_BASE_URL
149
+ )
150
+ app.state.config.AUTOMATIC1111_API_AUTH = (
151
+ form_data.automatic1111.AUTOMATIC1111_API_AUTH
152
+ )
153
+
154
+ app.state.config.AUTOMATIC1111_CFG_SCALE = (
155
+ float(form_data.automatic1111.AUTOMATIC1111_CFG_SCALE)
156
+ if form_data.automatic1111.AUTOMATIC1111_CFG_SCALE
157
+ else None
158
+ )
159
+ app.state.config.AUTOMATIC1111_SAMPLER = (
160
+ form_data.automatic1111.AUTOMATIC1111_SAMPLER
161
+ if form_data.automatic1111.AUTOMATIC1111_SAMPLER
162
+ else None
163
+ )
164
+ app.state.config.AUTOMATIC1111_SCHEDULER = (
165
+ form_data.automatic1111.AUTOMATIC1111_SCHEDULER
166
+ if form_data.automatic1111.AUTOMATIC1111_SCHEDULER
167
+ else None
168
+ )
169
+
170
+ app.state.config.COMFYUI_BASE_URL = form_data.comfyui.COMFYUI_BASE_URL.strip("/")
171
+ app.state.config.COMFYUI_WORKFLOW = form_data.comfyui.COMFYUI_WORKFLOW
172
+ app.state.config.COMFYUI_WORKFLOW_NODES = form_data.comfyui.COMFYUI_WORKFLOW_NODES
173
+
174
+ return {
175
+ "enabled": app.state.config.ENABLED,
176
+ "engine": app.state.config.ENGINE,
177
+ "openai": {
178
+ "OPENAI_API_BASE_URL": app.state.config.OPENAI_API_BASE_URL,
179
+ "OPENAI_API_KEY": app.state.config.OPENAI_API_KEY,
180
+ },
181
+ "automatic1111": {
182
+ "AUTOMATIC1111_BASE_URL": app.state.config.AUTOMATIC1111_BASE_URL,
183
+ "AUTOMATIC1111_API_AUTH": app.state.config.AUTOMATIC1111_API_AUTH,
184
+ "AUTOMATIC1111_CFG_SCALE": app.state.config.AUTOMATIC1111_CFG_SCALE,
185
+ "AUTOMATIC1111_SAMPLER": app.state.config.AUTOMATIC1111_SAMPLER,
186
+ "AUTOMATIC1111_SCHEDULER": app.state.config.AUTOMATIC1111_SCHEDULER,
187
+ },
188
+ "comfyui": {
189
+ "COMFYUI_BASE_URL": app.state.config.COMFYUI_BASE_URL,
190
+ "COMFYUI_WORKFLOW": app.state.config.COMFYUI_WORKFLOW,
191
+ "COMFYUI_WORKFLOW_NODES": app.state.config.COMFYUI_WORKFLOW_NODES,
192
+ },
193
+ }
194
+
195
+
196
+ def get_automatic1111_api_auth():
197
+ if app.state.config.AUTOMATIC1111_API_AUTH is None:
198
+ return ""
199
+ else:
200
+ auth1111_byte_string = app.state.config.AUTOMATIC1111_API_AUTH.encode("utf-8")
201
+ auth1111_base64_encoded_bytes = base64.b64encode(auth1111_byte_string)
202
+ auth1111_base64_encoded_string = auth1111_base64_encoded_bytes.decode("utf-8")
203
+ return f"Basic {auth1111_base64_encoded_string}"
204
+
205
+
206
+ @app.get("/config/url/verify")
207
+ async def verify_url(user=Depends(get_admin_user)):
208
+ if app.state.config.ENGINE == "automatic1111":
209
+ try:
210
+ r = requests.get(
211
+ url=f"{app.state.config.AUTOMATIC1111_BASE_URL}/sdapi/v1/options",
212
+ headers={"authorization": get_automatic1111_api_auth()},
213
+ )
214
+ r.raise_for_status()
215
+ return True
216
+ except Exception:
217
+ app.state.config.ENABLED = False
218
+ raise HTTPException(status_code=400, detail=ERROR_MESSAGES.INVALID_URL)
219
+ elif app.state.config.ENGINE == "comfyui":
220
+ try:
221
+ r = requests.get(url=f"{app.state.config.COMFYUI_BASE_URL}/object_info")
222
+ r.raise_for_status()
223
+ return True
224
+ except Exception:
225
+ app.state.config.ENABLED = False
226
+ raise HTTPException(status_code=400, detail=ERROR_MESSAGES.INVALID_URL)
227
+ else:
228
+ return True
229
+
230
+
231
+ def set_image_model(model: str):
232
+ log.info(f"Setting image model to {model}")
233
+ app.state.config.MODEL = model
234
+ if app.state.config.ENGINE in ["", "automatic1111"]:
235
+ api_auth = get_automatic1111_api_auth()
236
+ r = requests.get(
237
+ url=f"{app.state.config.AUTOMATIC1111_BASE_URL}/sdapi/v1/options",
238
+ headers={"authorization": api_auth},
239
+ )
240
+ options = r.json()
241
+ if model != options["sd_model_checkpoint"]:
242
+ options["sd_model_checkpoint"] = model
243
+ r = requests.post(
244
+ url=f"{app.state.config.AUTOMATIC1111_BASE_URL}/sdapi/v1/options",
245
+ json=options,
246
+ headers={"authorization": api_auth},
247
+ )
248
+ return app.state.config.MODEL
249
+
250
+
251
+ def get_image_model():
252
+ if app.state.config.ENGINE == "openai":
253
+ return app.state.config.MODEL if app.state.config.MODEL else "dall-e-2"
254
+ elif app.state.config.ENGINE == "comfyui":
255
+ return app.state.config.MODEL if app.state.config.MODEL else ""
256
+ elif app.state.config.ENGINE == "automatic1111" or app.state.config.ENGINE == "":
257
+ try:
258
+ r = requests.get(
259
+ url=f"{app.state.config.AUTOMATIC1111_BASE_URL}/sdapi/v1/options",
260
+ headers={"authorization": get_automatic1111_api_auth()},
261
+ )
262
+ options = r.json()
263
+ return options["sd_model_checkpoint"]
264
+ except Exception as e:
265
+ app.state.config.ENABLED = False
266
+ raise HTTPException(status_code=400, detail=ERROR_MESSAGES.DEFAULT(e))
267
+
268
+
269
+ class ImageConfigForm(BaseModel):
270
+ MODEL: str
271
+ IMAGE_SIZE: str
272
+ IMAGE_STEPS: int
273
+
274
+
275
+ @app.get("/image/config")
276
+ async def get_image_config(user=Depends(get_admin_user)):
277
+ return {
278
+ "MODEL": app.state.config.MODEL,
279
+ "IMAGE_SIZE": app.state.config.IMAGE_SIZE,
280
+ "IMAGE_STEPS": app.state.config.IMAGE_STEPS,
281
+ }
282
+
283
+
284
+ @app.post("/image/config/update")
285
+ async def update_image_config(form_data: ImageConfigForm, user=Depends(get_admin_user)):
286
+
287
+ set_image_model(form_data.MODEL)
288
+
289
+ pattern = r"^\d+x\d+$"
290
+ if re.match(pattern, form_data.IMAGE_SIZE):
291
+ app.state.config.IMAGE_SIZE = form_data.IMAGE_SIZE
292
+ else:
293
+ raise HTTPException(
294
+ status_code=400,
295
+ detail=ERROR_MESSAGES.INCORRECT_FORMAT(" (e.g., 512x512)."),
296
+ )
297
+
298
+ if form_data.IMAGE_STEPS >= 0:
299
+ app.state.config.IMAGE_STEPS = form_data.IMAGE_STEPS
300
+ else:
301
+ raise HTTPException(
302
+ status_code=400,
303
+ detail=ERROR_MESSAGES.INCORRECT_FORMAT(" (e.g., 50)."),
304
+ )
305
+
306
+ return {
307
+ "MODEL": app.state.config.MODEL,
308
+ "IMAGE_SIZE": app.state.config.IMAGE_SIZE,
309
+ "IMAGE_STEPS": app.state.config.IMAGE_STEPS,
310
+ }
311
+
312
+
313
+ @app.get("/models")
314
+ def get_models(user=Depends(get_verified_user)):
315
+ try:
316
+ if app.state.config.ENGINE == "openai":
317
+ return [
318
+ {"id": "dall-e-2", "name": "DALL·E 2"},
319
+ {"id": "dall-e-3", "name": "DALL·E 3"},
320
+ ]
321
+ elif app.state.config.ENGINE == "comfyui":
322
+ # TODO - get models from comfyui
323
+ r = requests.get(url=f"{app.state.config.COMFYUI_BASE_URL}/object_info")
324
+ info = r.json()
325
+
326
+ workflow = json.loads(app.state.config.COMFYUI_WORKFLOW)
327
+ model_node_id = None
328
+
329
+ for node in app.state.config.COMFYUI_WORKFLOW_NODES:
330
+ if node["type"] == "model":
331
+ if node["node_ids"]:
332
+ model_node_id = node["node_ids"][0]
333
+ break
334
+
335
+ if model_node_id:
336
+ model_list_key = None
337
+
338
+ print(workflow[model_node_id]["class_type"])
339
+ for key in info[workflow[model_node_id]["class_type"]]["input"][
340
+ "required"
341
+ ]:
342
+ if "_name" in key:
343
+ model_list_key = key
344
+ break
345
+
346
+ if model_list_key:
347
+ return list(
348
+ map(
349
+ lambda model: {"id": model, "name": model},
350
+ info[workflow[model_node_id]["class_type"]]["input"][
351
+ "required"
352
+ ][model_list_key][0],
353
+ )
354
+ )
355
+ else:
356
+ return list(
357
+ map(
358
+ lambda model: {"id": model, "name": model},
359
+ info["CheckpointLoaderSimple"]["input"]["required"][
360
+ "ckpt_name"
361
+ ][0],
362
+ )
363
+ )
364
+ elif (
365
+ app.state.config.ENGINE == "automatic1111" or app.state.config.ENGINE == ""
366
+ ):
367
+ r = requests.get(
368
+ url=f"{app.state.config.AUTOMATIC1111_BASE_URL}/sdapi/v1/sd-models",
369
+ headers={"authorization": get_automatic1111_api_auth()},
370
+ )
371
+ models = r.json()
372
+ return list(
373
+ map(
374
+ lambda model: {"id": model["title"], "name": model["model_name"]},
375
+ models,
376
+ )
377
+ )
378
+ except Exception as e:
379
+ app.state.config.ENABLED = False
380
+ raise HTTPException(status_code=400, detail=ERROR_MESSAGES.DEFAULT(e))
381
+
382
+
383
+ class GenerateImageForm(BaseModel):
384
+ model: Optional[str] = None
385
+ prompt: str
386
+ size: Optional[str] = None
387
+ n: int = 1
388
+ negative_prompt: Optional[str] = None
389
+
390
+
391
+ def save_b64_image(b64_str):
392
+ try:
393
+ image_id = str(uuid.uuid4())
394
+
395
+ if "," in b64_str:
396
+ header, encoded = b64_str.split(",", 1)
397
+ mime_type = header.split(";")[0]
398
+
399
+ img_data = base64.b64decode(encoded)
400
+ image_format = mimetypes.guess_extension(mime_type)
401
+
402
+ image_filename = f"{image_id}{image_format}"
403
+ file_path = IMAGE_CACHE_DIR / f"{image_filename}"
404
+ with open(file_path, "wb") as f:
405
+ f.write(img_data)
406
+ return image_filename
407
+ else:
408
+ image_filename = f"{image_id}.png"
409
+ file_path = IMAGE_CACHE_DIR.joinpath(image_filename)
410
+
411
+ img_data = base64.b64decode(b64_str)
412
+
413
+ # Write the image data to a file
414
+ with open(file_path, "wb") as f:
415
+ f.write(img_data)
416
+ return image_filename
417
+
418
+ except Exception as e:
419
+ log.exception(f"Error saving image: {e}")
420
+ return None
421
+
422
+
423
+ def save_url_image(url):
424
+ image_id = str(uuid.uuid4())
425
+ try:
426
+ r = requests.get(url)
427
+ r.raise_for_status()
428
+ if r.headers["content-type"].split("/")[0] == "image":
429
+ mime_type = r.headers["content-type"]
430
+ image_format = mimetypes.guess_extension(mime_type)
431
+
432
+ if not image_format:
433
+ raise ValueError("Could not determine image type from MIME type")
434
+
435
+ image_filename = f"{image_id}{image_format}"
436
+
437
+ file_path = IMAGE_CACHE_DIR.joinpath(f"{image_filename}")
438
+ with open(file_path, "wb") as image_file:
439
+ for chunk in r.iter_content(chunk_size=8192):
440
+ image_file.write(chunk)
441
+ return image_filename
442
+ else:
443
+ log.error("Url does not point to an image.")
444
+ return None
445
+
446
+ except Exception as e:
447
+ log.exception(f"Error saving image: {e}")
448
+ return None
449
+
450
+
451
+ @app.post("/generations")
452
+ async def image_generations(
453
+ form_data: GenerateImageForm,
454
+ user=Depends(get_verified_user),
455
+ ):
456
+ width, height = tuple(map(int, app.state.config.IMAGE_SIZE.split("x")))
457
+
458
+ r = None
459
+ try:
460
+ if app.state.config.ENGINE == "openai":
461
+ headers = {}
462
+ headers["Authorization"] = f"Bearer {app.state.config.OPENAI_API_KEY}"
463
+ headers["Content-Type"] = "application/json"
464
+
465
+ if ENABLE_FORWARD_USER_INFO_HEADERS:
466
+ headers["X-OpenWebUI-User-Name"] = user.name
467
+ headers["X-OpenWebUI-User-Id"] = user.id
468
+ headers["X-OpenWebUI-User-Email"] = user.email
469
+ headers["X-OpenWebUI-User-Role"] = user.role
470
+
471
+ data = {
472
+ "model": (
473
+ app.state.config.MODEL
474
+ if app.state.config.MODEL != ""
475
+ else "dall-e-2"
476
+ ),
477
+ "prompt": form_data.prompt,
478
+ "n": form_data.n,
479
+ "size": (
480
+ form_data.size if form_data.size else app.state.config.IMAGE_SIZE
481
+ ),
482
+ "response_format": "b64_json",
483
+ }
484
+
485
+ # Use asyncio.to_thread for the requests.post call
486
+ r = await asyncio.to_thread(
487
+ requests.post,
488
+ url=f"{app.state.config.OPENAI_API_BASE_URL}/images/generations",
489
+ json=data,
490
+ headers=headers,
491
+ )
492
+
493
+ r.raise_for_status()
494
+ res = r.json()
495
+
496
+ images = []
497
+
498
+ for image in res["data"]:
499
+ image_filename = save_b64_image(image["b64_json"])
500
+ images.append({"url": f"/cache/image/generations/{image_filename}"})
501
+ file_body_path = IMAGE_CACHE_DIR.joinpath(f"{image_filename}.json")
502
+
503
+ with open(file_body_path, "w") as f:
504
+ json.dump(data, f)
505
+
506
+ return images
507
+
508
+ elif app.state.config.ENGINE == "comfyui":
509
+ data = {
510
+ "prompt": form_data.prompt,
511
+ "width": width,
512
+ "height": height,
513
+ "n": form_data.n,
514
+ }
515
+
516
+ if app.state.config.IMAGE_STEPS is not None:
517
+ data["steps"] = app.state.config.IMAGE_STEPS
518
+
519
+ if form_data.negative_prompt is not None:
520
+ data["negative_prompt"] = form_data.negative_prompt
521
+
522
+ form_data = ComfyUIGenerateImageForm(
523
+ **{
524
+ "workflow": ComfyUIWorkflow(
525
+ **{
526
+ "workflow": app.state.config.COMFYUI_WORKFLOW,
527
+ "nodes": app.state.config.COMFYUI_WORKFLOW_NODES,
528
+ }
529
+ ),
530
+ **data,
531
+ }
532
+ )
533
+ res = await comfyui_generate_image(
534
+ app.state.config.MODEL,
535
+ form_data,
536
+ user.id,
537
+ app.state.config.COMFYUI_BASE_URL,
538
+ )
539
+ log.debug(f"res: {res}")
540
+
541
+ images = []
542
+
543
+ for image in res["data"]:
544
+ image_filename = save_url_image(image["url"])
545
+ images.append({"url": f"/cache/image/generations/{image_filename}"})
546
+ file_body_path = IMAGE_CACHE_DIR.joinpath(f"{image_filename}.json")
547
+
548
+ with open(file_body_path, "w") as f:
549
+ json.dump(form_data.model_dump(exclude_none=True), f)
550
+
551
+ log.debug(f"images: {images}")
552
+ return images
553
+ elif (
554
+ app.state.config.ENGINE == "automatic1111" or app.state.config.ENGINE == ""
555
+ ):
556
+ if form_data.model:
557
+ set_image_model(form_data.model)
558
+
559
+ data = {
560
+ "prompt": form_data.prompt,
561
+ "batch_size": form_data.n,
562
+ "width": width,
563
+ "height": height,
564
+ }
565
+
566
+ if app.state.config.IMAGE_STEPS is not None:
567
+ data["steps"] = app.state.config.IMAGE_STEPS
568
+
569
+ if form_data.negative_prompt is not None:
570
+ data["negative_prompt"] = form_data.negative_prompt
571
+
572
+ if app.state.config.AUTOMATIC1111_CFG_SCALE:
573
+ data["cfg_scale"] = app.state.config.AUTOMATIC1111_CFG_SCALE
574
+
575
+ if app.state.config.AUTOMATIC1111_SAMPLER:
576
+ data["sampler_name"] = app.state.config.AUTOMATIC1111_SAMPLER
577
+
578
+ if app.state.config.AUTOMATIC1111_SCHEDULER:
579
+ data["scheduler"] = app.state.config.AUTOMATIC1111_SCHEDULER
580
+
581
+ # Use asyncio.to_thread for the requests.post call
582
+ r = await asyncio.to_thread(
583
+ requests.post,
584
+ url=f"{app.state.config.AUTOMATIC1111_BASE_URL}/sdapi/v1/txt2img",
585
+ json=data,
586
+ headers={"authorization": get_automatic1111_api_auth()},
587
+ )
588
+
589
+ res = r.json()
590
+ log.debug(f"res: {res}")
591
+
592
+ images = []
593
+
594
+ for image in res["images"]:
595
+ image_filename = save_b64_image(image)
596
+ images.append({"url": f"/cache/image/generations/{image_filename}"})
597
+ file_body_path = IMAGE_CACHE_DIR.joinpath(f"{image_filename}.json")
598
+
599
+ with open(file_body_path, "w") as f:
600
+ json.dump({**data, "info": res["info"]}, f)
601
+
602
+ return images
603
+ except Exception as e:
604
+ error = e
605
+ if r != None:
606
+ data = r.json()
607
+ if "error" in data:
608
+ error = data["error"]["message"]
609
+ raise HTTPException(status_code=400, detail=ERROR_MESSAGES.DEFAULT(error))
backend/open_webui/apps/images/utils/comfyui.py ADDED
@@ -0,0 +1,186 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import asyncio
2
+ import json
3
+ import logging
4
+ import random
5
+ import urllib.parse
6
+ import urllib.request
7
+ from typing import Optional
8
+
9
+ import websocket # NOTE: websocket-client (https://github.com/websocket-client/websocket-client)
10
+ from open_webui.env import SRC_LOG_LEVELS
11
+ from pydantic import BaseModel
12
+
13
+ log = logging.getLogger(__name__)
14
+ log.setLevel(SRC_LOG_LEVELS["COMFYUI"])
15
+
16
+ default_headers = {"User-Agent": "Mozilla/5.0"}
17
+
18
+
19
+ def queue_prompt(prompt, client_id, base_url):
20
+ log.info("queue_prompt")
21
+ p = {"prompt": prompt, "client_id": client_id}
22
+ data = json.dumps(p).encode("utf-8")
23
+ log.debug(f"queue_prompt data: {data}")
24
+ try:
25
+ req = urllib.request.Request(
26
+ f"{base_url}/prompt", data=data, headers=default_headers
27
+ )
28
+ response = urllib.request.urlopen(req).read()
29
+ return json.loads(response)
30
+ except Exception as e:
31
+ log.exception(f"Error while queuing prompt: {e}")
32
+ raise e
33
+
34
+
35
+ def get_image(filename, subfolder, folder_type, base_url):
36
+ log.info("get_image")
37
+ data = {"filename": filename, "subfolder": subfolder, "type": folder_type}
38
+ url_values = urllib.parse.urlencode(data)
39
+ req = urllib.request.Request(
40
+ f"{base_url}/view?{url_values}", headers=default_headers
41
+ )
42
+ with urllib.request.urlopen(req) as response:
43
+ return response.read()
44
+
45
+
46
+ def get_image_url(filename, subfolder, folder_type, base_url):
47
+ log.info("get_image")
48
+ data = {"filename": filename, "subfolder": subfolder, "type": folder_type}
49
+ url_values = urllib.parse.urlencode(data)
50
+ return f"{base_url}/view?{url_values}"
51
+
52
+
53
+ def get_history(prompt_id, base_url):
54
+ log.info("get_history")
55
+
56
+ req = urllib.request.Request(
57
+ f"{base_url}/history/{prompt_id}", headers=default_headers
58
+ )
59
+ with urllib.request.urlopen(req) as response:
60
+ return json.loads(response.read())
61
+
62
+
63
+ def get_images(ws, prompt, client_id, base_url):
64
+ prompt_id = queue_prompt(prompt, client_id, base_url)["prompt_id"]
65
+ output_images = []
66
+ while True:
67
+ out = ws.recv()
68
+ if isinstance(out, str):
69
+ message = json.loads(out)
70
+ if message["type"] == "executing":
71
+ data = message["data"]
72
+ if data["node"] is None and data["prompt_id"] == prompt_id:
73
+ break # Execution is done
74
+ else:
75
+ continue # previews are binary data
76
+
77
+ history = get_history(prompt_id, base_url)[prompt_id]
78
+ for o in history["outputs"]:
79
+ for node_id in history["outputs"]:
80
+ node_output = history["outputs"][node_id]
81
+ if "images" in node_output:
82
+ for image in node_output["images"]:
83
+ url = get_image_url(
84
+ image["filename"], image["subfolder"], image["type"], base_url
85
+ )
86
+ output_images.append({"url": url})
87
+ return {"data": output_images}
88
+
89
+
90
+ class ComfyUINodeInput(BaseModel):
91
+ type: Optional[str] = None
92
+ node_ids: list[str] = []
93
+ key: Optional[str] = "text"
94
+ value: Optional[str] = None
95
+
96
+
97
+ class ComfyUIWorkflow(BaseModel):
98
+ workflow: str
99
+ nodes: list[ComfyUINodeInput]
100
+
101
+
102
+ class ComfyUIGenerateImageForm(BaseModel):
103
+ workflow: ComfyUIWorkflow
104
+
105
+ prompt: str
106
+ negative_prompt: Optional[str] = None
107
+ width: int
108
+ height: int
109
+ n: int = 1
110
+
111
+ steps: Optional[int] = None
112
+ seed: Optional[int] = None
113
+
114
+
115
+ async def comfyui_generate_image(
116
+ model: str, payload: ComfyUIGenerateImageForm, client_id, base_url
117
+ ):
118
+ ws_url = base_url.replace("http://", "ws://").replace("https://", "wss://")
119
+ workflow = json.loads(payload.workflow.workflow)
120
+
121
+ for node in payload.workflow.nodes:
122
+ if node.type:
123
+ if node.type == "model":
124
+ for node_id in node.node_ids:
125
+ workflow[node_id]["inputs"][node.key] = model
126
+ elif node.type == "prompt":
127
+ for node_id in node.node_ids:
128
+ workflow[node_id]["inputs"][
129
+ node.key if node.key else "text"
130
+ ] = payload.prompt
131
+ elif node.type == "negative_prompt":
132
+ for node_id in node.node_ids:
133
+ workflow[node_id]["inputs"][
134
+ node.key if node.key else "text"
135
+ ] = payload.negative_prompt
136
+ elif node.type == "width":
137
+ for node_id in node.node_ids:
138
+ workflow[node_id]["inputs"][
139
+ node.key if node.key else "width"
140
+ ] = payload.width
141
+ elif node.type == "height":
142
+ for node_id in node.node_ids:
143
+ workflow[node_id]["inputs"][
144
+ node.key if node.key else "height"
145
+ ] = payload.height
146
+ elif node.type == "n":
147
+ for node_id in node.node_ids:
148
+ workflow[node_id]["inputs"][
149
+ node.key if node.key else "batch_size"
150
+ ] = payload.n
151
+ elif node.type == "steps":
152
+ for node_id in node.node_ids:
153
+ workflow[node_id]["inputs"][
154
+ node.key if node.key else "steps"
155
+ ] = payload.steps
156
+ elif node.type == "seed":
157
+ seed = (
158
+ payload.seed
159
+ if payload.seed
160
+ else random.randint(0, 18446744073709551614)
161
+ )
162
+ for node_id in node.node_ids:
163
+ workflow[node_id]["inputs"][node.key] = seed
164
+ else:
165
+ for node_id in node.node_ids:
166
+ workflow[node_id]["inputs"][node.key] = node.value
167
+
168
+ try:
169
+ ws = websocket.WebSocket()
170
+ ws.connect(f"{ws_url}/ws?clientId={client_id}")
171
+ log.info("WebSocket connection established.")
172
+ except Exception as e:
173
+ log.exception(f"Failed to connect to WebSocket server: {e}")
174
+ return None
175
+
176
+ try:
177
+ log.info("Sending workflow to WebSocket server.")
178
+ log.info(f"Workflow: {workflow}")
179
+ images = await asyncio.to_thread(get_images, ws, workflow, client_id, base_url)
180
+ except Exception as e:
181
+ log.exception(f"Error while receiving images: {e}")
182
+ images = None
183
+
184
+ ws.close()
185
+
186
+ return images
backend/open_webui/apps/ollama/main.py ADDED
@@ -0,0 +1,1324 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import asyncio
2
+ import json
3
+ import logging
4
+ import os
5
+ import random
6
+ import re
7
+ import time
8
+ from typing import Optional, Union
9
+ from urllib.parse import urlparse
10
+
11
+ import aiohttp
12
+ import requests
13
+ from open_webui.apps.webui.models.models import Models
14
+ from open_webui.config import (
15
+ CORS_ALLOW_ORIGIN,
16
+ ENABLE_OLLAMA_API,
17
+ OLLAMA_BASE_URLS,
18
+ OLLAMA_API_CONFIGS,
19
+ UPLOAD_DIR,
20
+ AppConfig,
21
+ )
22
+ from open_webui.env import (
23
+ AIOHTTP_CLIENT_TIMEOUT,
24
+ AIOHTTP_CLIENT_TIMEOUT_OPENAI_MODEL_LIST,
25
+ )
26
+
27
+
28
+ from open_webui.constants import ERROR_MESSAGES
29
+ from open_webui.env import ENV, SRC_LOG_LEVELS
30
+ from fastapi import Depends, FastAPI, File, HTTPException, Request, UploadFile
31
+ from fastapi.middleware.cors import CORSMiddleware
32
+ from fastapi.responses import StreamingResponse
33
+ from pydantic import BaseModel, ConfigDict
34
+ from starlette.background import BackgroundTask
35
+
36
+
37
+ from open_webui.utils.misc import (
38
+ calculate_sha256,
39
+ )
40
+ from open_webui.utils.payload import (
41
+ apply_model_params_to_body_ollama,
42
+ apply_model_params_to_body_openai,
43
+ apply_model_system_prompt_to_body,
44
+ )
45
+ from open_webui.utils.utils import get_admin_user, get_verified_user
46
+ from open_webui.utils.access_control import has_access
47
+
48
+ log = logging.getLogger(__name__)
49
+ log.setLevel(SRC_LOG_LEVELS["OLLAMA"])
50
+
51
+
52
+ app = FastAPI(
53
+ docs_url="/docs" if ENV == "dev" else None,
54
+ openapi_url="/openapi.json" if ENV == "dev" else None,
55
+ redoc_url=None,
56
+ )
57
+
58
+ app.add_middleware(
59
+ CORSMiddleware,
60
+ allow_origins=CORS_ALLOW_ORIGIN,
61
+ allow_credentials=True,
62
+ allow_methods=["*"],
63
+ allow_headers=["*"],
64
+ )
65
+
66
+ app.state.config = AppConfig()
67
+
68
+ app.state.config.ENABLE_OLLAMA_API = ENABLE_OLLAMA_API
69
+ app.state.config.OLLAMA_BASE_URLS = OLLAMA_BASE_URLS
70
+ app.state.config.OLLAMA_API_CONFIGS = OLLAMA_API_CONFIGS
71
+
72
+
73
+ # TODO: Implement a more intelligent load balancing mechanism for distributing requests among multiple backend instances.
74
+ # Current implementation uses a simple round-robin approach (random.choice). Consider incorporating algorithms like weighted round-robin,
75
+ # least connections, or least response time for better resource utilization and performance optimization.
76
+
77
+
78
+ @app.head("/")
79
+ @app.get("/")
80
+ async def get_status():
81
+ return {"status": True}
82
+
83
+
84
+ class ConnectionVerificationForm(BaseModel):
85
+ url: str
86
+ key: Optional[str] = None
87
+
88
+
89
+ @app.post("/verify")
90
+ async def verify_connection(
91
+ form_data: ConnectionVerificationForm, user=Depends(get_admin_user)
92
+ ):
93
+ url = form_data.url
94
+ key = form_data.key
95
+
96
+ headers = {}
97
+ if key:
98
+ headers["Authorization"] = f"Bearer {key}"
99
+
100
+ timeout = aiohttp.ClientTimeout(total=AIOHTTP_CLIENT_TIMEOUT_OPENAI_MODEL_LIST)
101
+ async with aiohttp.ClientSession(timeout=timeout) as session:
102
+ try:
103
+ async with session.get(f"{url}/api/version", headers=headers) as r:
104
+ if r.status != 200:
105
+ # Extract response error details if available
106
+ error_detail = f"HTTP Error: {r.status}"
107
+ res = await r.json()
108
+ if "error" in res:
109
+ error_detail = f"External Error: {res['error']}"
110
+ raise Exception(error_detail)
111
+
112
+ response_data = await r.json()
113
+ return response_data
114
+
115
+ except aiohttp.ClientError as e:
116
+ # ClientError covers all aiohttp requests issues
117
+ log.exception(f"Client error: {str(e)}")
118
+ # Handle aiohttp-specific connection issues, timeout etc.
119
+ raise HTTPException(
120
+ status_code=500, detail="Open WebUI: Server Connection Error"
121
+ )
122
+ except Exception as e:
123
+ log.exception(f"Unexpected error: {e}")
124
+ # Generic error handler in case parsing JSON or other steps fail
125
+ error_detail = f"Unexpected error: {str(e)}"
126
+ raise HTTPException(status_code=500, detail=error_detail)
127
+
128
+
129
+ @app.get("/config")
130
+ async def get_config(user=Depends(get_admin_user)):
131
+ return {
132
+ "ENABLE_OLLAMA_API": app.state.config.ENABLE_OLLAMA_API,
133
+ "OLLAMA_BASE_URLS": app.state.config.OLLAMA_BASE_URLS,
134
+ "OLLAMA_API_CONFIGS": app.state.config.OLLAMA_API_CONFIGS,
135
+ }
136
+
137
+
138
+ class OllamaConfigForm(BaseModel):
139
+ ENABLE_OLLAMA_API: Optional[bool] = None
140
+ OLLAMA_BASE_URLS: list[str]
141
+ OLLAMA_API_CONFIGS: dict
142
+
143
+
144
+ @app.post("/config/update")
145
+ async def update_config(form_data: OllamaConfigForm, user=Depends(get_admin_user)):
146
+ app.state.config.ENABLE_OLLAMA_API = form_data.ENABLE_OLLAMA_API
147
+ app.state.config.OLLAMA_BASE_URLS = form_data.OLLAMA_BASE_URLS
148
+
149
+ app.state.config.OLLAMA_API_CONFIGS = form_data.OLLAMA_API_CONFIGS
150
+
151
+ # Remove any extra configs
152
+ config_urls = app.state.config.OLLAMA_API_CONFIGS.keys()
153
+ for url in list(app.state.config.OLLAMA_BASE_URLS):
154
+ if url not in config_urls:
155
+ app.state.config.OLLAMA_API_CONFIGS.pop(url, None)
156
+
157
+ return {
158
+ "ENABLE_OLLAMA_API": app.state.config.ENABLE_OLLAMA_API,
159
+ "OLLAMA_BASE_URLS": app.state.config.OLLAMA_BASE_URLS,
160
+ "OLLAMA_API_CONFIGS": app.state.config.OLLAMA_API_CONFIGS,
161
+ }
162
+
163
+
164
+ async def aiohttp_get(url, key=None):
165
+ timeout = aiohttp.ClientTimeout(total=AIOHTTP_CLIENT_TIMEOUT_OPENAI_MODEL_LIST)
166
+ try:
167
+ headers = {"Authorization": f"Bearer {key}"} if key else {}
168
+ async with aiohttp.ClientSession(timeout=timeout, trust_env=True) as session:
169
+ async with session.get(url, headers=headers) as response:
170
+ return await response.json()
171
+ except Exception as e:
172
+ # Handle connection error here
173
+ log.error(f"Connection error: {e}")
174
+ return None
175
+
176
+
177
+ async def cleanup_response(
178
+ response: Optional[aiohttp.ClientResponse],
179
+ session: Optional[aiohttp.ClientSession],
180
+ ):
181
+ if response:
182
+ response.close()
183
+ if session:
184
+ await session.close()
185
+
186
+
187
+ async def post_streaming_url(
188
+ url: str, payload: Union[str, bytes], stream: bool = True, content_type=None
189
+ ):
190
+ r = None
191
+ try:
192
+ session = aiohttp.ClientSession(
193
+ trust_env=True, timeout=aiohttp.ClientTimeout(total=AIOHTTP_CLIENT_TIMEOUT)
194
+ )
195
+
196
+ api_config = app.state.config.OLLAMA_API_CONFIGS.get(url, {})
197
+ key = api_config.get("key", None)
198
+
199
+ headers = {"Content-Type": "application/json"}
200
+ if key:
201
+ headers["Authorization"] = f"Bearer {key}"
202
+
203
+ r = await session.post(
204
+ url,
205
+ data=payload,
206
+ headers=headers,
207
+ )
208
+ r.raise_for_status()
209
+
210
+ if stream:
211
+ headers = dict(r.headers)
212
+ if content_type:
213
+ headers["Content-Type"] = content_type
214
+ return StreamingResponse(
215
+ r.content,
216
+ status_code=r.status,
217
+ headers=headers,
218
+ background=BackgroundTask(
219
+ cleanup_response, response=r, session=session
220
+ ),
221
+ )
222
+ else:
223
+ res = await r.json()
224
+ await cleanup_response(r, session)
225
+ return res
226
+
227
+ except Exception as e:
228
+ error_detail = "Open WebUI: Server Connection Error"
229
+ if r is not None:
230
+ try:
231
+ res = await r.json()
232
+ if "error" in res:
233
+ error_detail = f"Ollama: {res['error']}"
234
+ except Exception:
235
+ error_detail = f"Ollama: {e}"
236
+
237
+ raise HTTPException(
238
+ status_code=r.status if r else 500,
239
+ detail=error_detail,
240
+ )
241
+
242
+
243
+ def merge_models_lists(model_lists):
244
+ merged_models = {}
245
+
246
+ for idx, model_list in enumerate(model_lists):
247
+ if model_list is not None:
248
+ for model in model_list:
249
+ id = model["model"]
250
+ if id not in merged_models:
251
+ model["urls"] = [idx]
252
+ merged_models[id] = model
253
+ else:
254
+ merged_models[id]["urls"].append(idx)
255
+
256
+ return list(merged_models.values())
257
+
258
+
259
+ async def get_all_models():
260
+ log.info("get_all_models()")
261
+ if app.state.config.ENABLE_OLLAMA_API:
262
+ tasks = []
263
+ for idx, url in enumerate(app.state.config.OLLAMA_BASE_URLS):
264
+ if url not in app.state.config.OLLAMA_API_CONFIGS:
265
+ tasks.append(aiohttp_get(f"{url}/api/tags"))
266
+ else:
267
+ api_config = app.state.config.OLLAMA_API_CONFIGS.get(url, {})
268
+ enable = api_config.get("enable", True)
269
+ key = api_config.get("key", None)
270
+
271
+ if enable:
272
+ tasks.append(aiohttp_get(f"{url}/api/tags", key))
273
+ else:
274
+ tasks.append(asyncio.ensure_future(asyncio.sleep(0, None)))
275
+
276
+ responses = await asyncio.gather(*tasks)
277
+
278
+ for idx, response in enumerate(responses):
279
+ if response:
280
+ url = app.state.config.OLLAMA_BASE_URLS[idx]
281
+ api_config = app.state.config.OLLAMA_API_CONFIGS.get(url, {})
282
+
283
+ prefix_id = api_config.get("prefix_id", None)
284
+ model_ids = api_config.get("model_ids", [])
285
+
286
+ if len(model_ids) != 0 and "models" in response:
287
+ response["models"] = list(
288
+ filter(
289
+ lambda model: model["model"] in model_ids,
290
+ response["models"],
291
+ )
292
+ )
293
+
294
+ if prefix_id:
295
+ for model in response.get("models", []):
296
+ model["model"] = f"{prefix_id}.{model['model']}"
297
+
298
+ print(responses)
299
+
300
+ models = {
301
+ "models": merge_models_lists(
302
+ map(
303
+ lambda response: response.get("models", []) if response else None,
304
+ responses,
305
+ )
306
+ )
307
+ }
308
+
309
+ else:
310
+ models = {"models": []}
311
+
312
+ return models
313
+
314
+
315
+ @app.get("/api/tags")
316
+ @app.get("/api/tags/{url_idx}")
317
+ async def get_ollama_tags(
318
+ url_idx: Optional[int] = None, user=Depends(get_verified_user)
319
+ ):
320
+ models = []
321
+ if url_idx is None:
322
+ models = await get_all_models()
323
+ else:
324
+ url = app.state.config.OLLAMA_BASE_URLS[url_idx]
325
+
326
+ api_config = app.state.config.OLLAMA_API_CONFIGS.get(url, {})
327
+ key = api_config.get("key", None)
328
+
329
+ headers = {}
330
+ if key:
331
+ headers["Authorization"] = f"Bearer {key}"
332
+
333
+ r = None
334
+ try:
335
+ r = requests.request(method="GET", url=f"{url}/api/tags", headers=headers)
336
+ r.raise_for_status()
337
+
338
+ models = r.json()
339
+ except Exception as e:
340
+ log.exception(e)
341
+ error_detail = "Open WebUI: Server Connection Error"
342
+ if r is not None:
343
+ try:
344
+ res = r.json()
345
+ if "error" in res:
346
+ error_detail = f"Ollama: {res['error']}"
347
+ except Exception:
348
+ error_detail = f"Ollama: {e}"
349
+
350
+ raise HTTPException(
351
+ status_code=r.status_code if r else 500,
352
+ detail=error_detail,
353
+ )
354
+
355
+ if user.role == "user":
356
+ # Filter models based on user access control
357
+ filtered_models = []
358
+ for model in models.get("models", []):
359
+ model_info = Models.get_model_by_id(model["model"])
360
+ if model_info:
361
+ if user.id == model_info.user_id or has_access(
362
+ user.id, type="read", access_control=model_info.access_control
363
+ ):
364
+ filtered_models.append(model)
365
+ models["models"] = filtered_models
366
+
367
+ return models
368
+
369
+
370
+ @app.get("/api/version")
371
+ @app.get("/api/version/{url_idx}")
372
+ async def get_ollama_versions(url_idx: Optional[int] = None):
373
+ if app.state.config.ENABLE_OLLAMA_API:
374
+ if url_idx is None:
375
+ # returns lowest version
376
+ tasks = [
377
+ aiohttp_get(
378
+ f"{url}/api/version",
379
+ app.state.config.OLLAMA_API_CONFIGS.get(url, {}).get("key", None),
380
+ )
381
+ for url in app.state.config.OLLAMA_BASE_URLS
382
+ ]
383
+ responses = await asyncio.gather(*tasks)
384
+ responses = list(filter(lambda x: x is not None, responses))
385
+
386
+ if len(responses) > 0:
387
+ lowest_version = min(
388
+ responses,
389
+ key=lambda x: tuple(
390
+ map(int, re.sub(r"^v|-.*", "", x["version"]).split("."))
391
+ ),
392
+ )
393
+
394
+ return {"version": lowest_version["version"]}
395
+ else:
396
+ raise HTTPException(
397
+ status_code=500,
398
+ detail=ERROR_MESSAGES.OLLAMA_NOT_FOUND,
399
+ )
400
+ else:
401
+ url = app.state.config.OLLAMA_BASE_URLS[url_idx]
402
+
403
+ r = None
404
+ try:
405
+ r = requests.request(method="GET", url=f"{url}/api/version")
406
+ r.raise_for_status()
407
+
408
+ return r.json()
409
+ except Exception as e:
410
+ log.exception(e)
411
+ error_detail = "Open WebUI: Server Connection Error"
412
+ if r is not None:
413
+ try:
414
+ res = r.json()
415
+ if "error" in res:
416
+ error_detail = f"Ollama: {res['error']}"
417
+ except Exception:
418
+ error_detail = f"Ollama: {e}"
419
+
420
+ raise HTTPException(
421
+ status_code=r.status_code if r else 500,
422
+ detail=error_detail,
423
+ )
424
+ else:
425
+ return {"version": False}
426
+
427
+
428
+ class ModelNameForm(BaseModel):
429
+ name: str
430
+
431
+
432
+ @app.post("/api/pull")
433
+ @app.post("/api/pull/{url_idx}")
434
+ async def pull_model(
435
+ form_data: ModelNameForm, url_idx: int = 0, user=Depends(get_admin_user)
436
+ ):
437
+ url = app.state.config.OLLAMA_BASE_URLS[url_idx]
438
+ log.info(f"url: {url}")
439
+
440
+ # Admin should be able to pull models from any source
441
+ payload = {**form_data.model_dump(exclude_none=True), "insecure": True}
442
+
443
+ return await post_streaming_url(f"{url}/api/pull", json.dumps(payload))
444
+
445
+
446
+ class PushModelForm(BaseModel):
447
+ name: str
448
+ insecure: Optional[bool] = None
449
+ stream: Optional[bool] = None
450
+
451
+
452
+ @app.delete("/api/push")
453
+ @app.delete("/api/push/{url_idx}")
454
+ async def push_model(
455
+ form_data: PushModelForm,
456
+ url_idx: Optional[int] = None,
457
+ user=Depends(get_admin_user),
458
+ ):
459
+ if url_idx is None:
460
+ model_list = await get_all_models()
461
+ models = {model["model"]: model for model in model_list["models"]}
462
+
463
+ if form_data.name in models:
464
+ url_idx = models[form_data.name]["urls"][0]
465
+ else:
466
+ raise HTTPException(
467
+ status_code=400,
468
+ detail=ERROR_MESSAGES.MODEL_NOT_FOUND(form_data.name),
469
+ )
470
+
471
+ url = app.state.config.OLLAMA_BASE_URLS[url_idx]
472
+ log.debug(f"url: {url}")
473
+
474
+ return await post_streaming_url(
475
+ f"{url}/api/push", form_data.model_dump_json(exclude_none=True).encode()
476
+ )
477
+
478
+
479
+ class CreateModelForm(BaseModel):
480
+ name: str
481
+ modelfile: Optional[str] = None
482
+ stream: Optional[bool] = None
483
+ path: Optional[str] = None
484
+
485
+
486
+ @app.post("/api/create")
487
+ @app.post("/api/create/{url_idx}")
488
+ async def create_model(
489
+ form_data: CreateModelForm, url_idx: int = 0, user=Depends(get_admin_user)
490
+ ):
491
+ log.debug(f"form_data: {form_data}")
492
+ url = app.state.config.OLLAMA_BASE_URLS[url_idx]
493
+ log.info(f"url: {url}")
494
+
495
+ return await post_streaming_url(
496
+ f"{url}/api/create", form_data.model_dump_json(exclude_none=True).encode()
497
+ )
498
+
499
+
500
+ class CopyModelForm(BaseModel):
501
+ source: str
502
+ destination: str
503
+
504
+
505
+ @app.post("/api/copy")
506
+ @app.post("/api/copy/{url_idx}")
507
+ async def copy_model(
508
+ form_data: CopyModelForm,
509
+ url_idx: Optional[int] = None,
510
+ user=Depends(get_admin_user),
511
+ ):
512
+ if url_idx is None:
513
+ model_list = await get_all_models()
514
+ models = {model["model"]: model for model in model_list["models"]}
515
+
516
+ if form_data.source in models:
517
+ url_idx = models[form_data.source]["urls"][0]
518
+ else:
519
+ raise HTTPException(
520
+ status_code=400,
521
+ detail=ERROR_MESSAGES.MODEL_NOT_FOUND(form_data.source),
522
+ )
523
+
524
+ url = app.state.config.OLLAMA_BASE_URLS[url_idx]
525
+ log.info(f"url: {url}")
526
+
527
+ api_config = app.state.config.OLLAMA_API_CONFIGS.get(url, {})
528
+ key = api_config.get("key", None)
529
+
530
+ headers = {"Content-Type": "application/json"}
531
+ if key:
532
+ headers["Authorization"] = f"Bearer {key}"
533
+
534
+ r = requests.request(
535
+ method="POST",
536
+ url=f"{url}/api/copy",
537
+ headers=headers,
538
+ data=form_data.model_dump_json(exclude_none=True).encode(),
539
+ )
540
+
541
+ try:
542
+ r.raise_for_status()
543
+
544
+ log.debug(f"r.text: {r.text}")
545
+
546
+ return True
547
+ except Exception as e:
548
+ log.exception(e)
549
+ error_detail = "Open WebUI: Server Connection Error"
550
+ if r is not None:
551
+ try:
552
+ res = r.json()
553
+ if "error" in res:
554
+ error_detail = f"Ollama: {res['error']}"
555
+ except Exception:
556
+ error_detail = f"Ollama: {e}"
557
+
558
+ raise HTTPException(
559
+ status_code=r.status_code if r else 500,
560
+ detail=error_detail,
561
+ )
562
+
563
+
564
+ @app.delete("/api/delete")
565
+ @app.delete("/api/delete/{url_idx}")
566
+ async def delete_model(
567
+ form_data: ModelNameForm,
568
+ url_idx: Optional[int] = None,
569
+ user=Depends(get_admin_user),
570
+ ):
571
+ if url_idx is None:
572
+ model_list = await get_all_models()
573
+ models = {model["model"]: model for model in model_list["models"]}
574
+
575
+ if form_data.name in models:
576
+ url_idx = models[form_data.name]["urls"][0]
577
+ else:
578
+ raise HTTPException(
579
+ status_code=400,
580
+ detail=ERROR_MESSAGES.MODEL_NOT_FOUND(form_data.name),
581
+ )
582
+
583
+ url = app.state.config.OLLAMA_BASE_URLS[url_idx]
584
+ log.info(f"url: {url}")
585
+
586
+ api_config = app.state.config.OLLAMA_API_CONFIGS.get(url, {})
587
+ key = api_config.get("key", None)
588
+
589
+ headers = {"Content-Type": "application/json"}
590
+ if key:
591
+ headers["Authorization"] = f"Bearer {key}"
592
+
593
+ r = requests.request(
594
+ method="DELETE",
595
+ url=f"{url}/api/delete",
596
+ data=form_data.model_dump_json(exclude_none=True).encode(),
597
+ headers=headers,
598
+ )
599
+ try:
600
+ r.raise_for_status()
601
+
602
+ log.debug(f"r.text: {r.text}")
603
+
604
+ return True
605
+ except Exception as e:
606
+ log.exception(e)
607
+ error_detail = "Open WebUI: Server Connection Error"
608
+ if r is not None:
609
+ try:
610
+ res = r.json()
611
+ if "error" in res:
612
+ error_detail = f"Ollama: {res['error']}"
613
+ except Exception:
614
+ error_detail = f"Ollama: {e}"
615
+
616
+ raise HTTPException(
617
+ status_code=r.status_code if r else 500,
618
+ detail=error_detail,
619
+ )
620
+
621
+
622
+ @app.post("/api/show")
623
+ async def show_model_info(form_data: ModelNameForm, user=Depends(get_verified_user)):
624
+ model_list = await get_all_models()
625
+ models = {model["model"]: model for model in model_list["models"]}
626
+
627
+ if form_data.name not in models:
628
+ raise HTTPException(
629
+ status_code=400,
630
+ detail=ERROR_MESSAGES.MODEL_NOT_FOUND(form_data.name),
631
+ )
632
+
633
+ url_idx = random.choice(models[form_data.name]["urls"])
634
+ url = app.state.config.OLLAMA_BASE_URLS[url_idx]
635
+ log.info(f"url: {url}")
636
+
637
+ api_config = app.state.config.OLLAMA_API_CONFIGS.get(url, {})
638
+ key = api_config.get("key", None)
639
+
640
+ headers = {"Content-Type": "application/json"}
641
+ if key:
642
+ headers["Authorization"] = f"Bearer {key}"
643
+
644
+ r = requests.request(
645
+ method="POST",
646
+ url=f"{url}/api/show",
647
+ headers=headers,
648
+ data=form_data.model_dump_json(exclude_none=True).encode(),
649
+ )
650
+ try:
651
+ r.raise_for_status()
652
+
653
+ return r.json()
654
+ except Exception as e:
655
+ log.exception(e)
656
+ error_detail = "Open WebUI: Server Connection Error"
657
+ if r is not None:
658
+ try:
659
+ res = r.json()
660
+ if "error" in res:
661
+ error_detail = f"Ollama: {res['error']}"
662
+ except Exception:
663
+ error_detail = f"Ollama: {e}"
664
+
665
+ raise HTTPException(
666
+ status_code=r.status_code if r else 500,
667
+ detail=error_detail,
668
+ )
669
+
670
+
671
+ class GenerateEmbeddingsForm(BaseModel):
672
+ model: str
673
+ prompt: str
674
+ options: Optional[dict] = None
675
+ keep_alive: Optional[Union[int, str]] = None
676
+
677
+
678
+ class GenerateEmbedForm(BaseModel):
679
+ model: str
680
+ input: list[str] | str
681
+ truncate: Optional[bool] = None
682
+ options: Optional[dict] = None
683
+ keep_alive: Optional[Union[int, str]] = None
684
+
685
+
686
+ @app.post("/api/embed")
687
+ @app.post("/api/embed/{url_idx}")
688
+ async def generate_embeddings(
689
+ form_data: GenerateEmbedForm,
690
+ url_idx: Optional[int] = None,
691
+ user=Depends(get_verified_user),
692
+ ):
693
+ return generate_ollama_batch_embeddings(form_data, url_idx)
694
+
695
+
696
+ @app.post("/api/embeddings")
697
+ @app.post("/api/embeddings/{url_idx}")
698
+ async def generate_embeddings(
699
+ form_data: GenerateEmbeddingsForm,
700
+ url_idx: Optional[int] = None,
701
+ user=Depends(get_verified_user),
702
+ ):
703
+ return await generate_ollama_embeddings(form_data=form_data, url_idx=url_idx)
704
+
705
+
706
+ async def generate_ollama_embeddings(
707
+ form_data: GenerateEmbeddingsForm,
708
+ url_idx: Optional[int] = None,
709
+ ):
710
+ log.info(f"generate_ollama_embeddings {form_data}")
711
+
712
+ if url_idx is None:
713
+ model_list = await get_all_models()
714
+ models = {model["model"]: model for model in model_list["models"]}
715
+
716
+ model = form_data.model
717
+
718
+ if ":" not in model:
719
+ model = f"{model}:latest"
720
+
721
+ if model in models:
722
+ url_idx = random.choice(models[model]["urls"])
723
+ else:
724
+ raise HTTPException(
725
+ status_code=400,
726
+ detail=ERROR_MESSAGES.MODEL_NOT_FOUND(form_data.model),
727
+ )
728
+
729
+ url = app.state.config.OLLAMA_BASE_URLS[url_idx]
730
+ log.info(f"url: {url}")
731
+
732
+ api_config = app.state.config.OLLAMA_API_CONFIGS.get(url, {})
733
+ key = api_config.get("key", None)
734
+
735
+ headers = {"Content-Type": "application/json"}
736
+ if key:
737
+ headers["Authorization"] = f"Bearer {key}"
738
+
739
+ r = requests.request(
740
+ method="POST",
741
+ url=f"{url}/api/embeddings",
742
+ headers=headers,
743
+ data=form_data.model_dump_json(exclude_none=True).encode(),
744
+ )
745
+ try:
746
+ r.raise_for_status()
747
+
748
+ data = r.json()
749
+
750
+ log.info(f"generate_ollama_embeddings {data}")
751
+
752
+ if "embedding" in data:
753
+ return data
754
+ else:
755
+ raise Exception("Something went wrong :/")
756
+ except Exception as e:
757
+ log.exception(e)
758
+ error_detail = "Open WebUI: Server Connection Error"
759
+ if r is not None:
760
+ try:
761
+ res = r.json()
762
+ if "error" in res:
763
+ error_detail = f"Ollama: {res['error']}"
764
+ except Exception:
765
+ error_detail = f"Ollama: {e}"
766
+
767
+ raise HTTPException(
768
+ status_code=r.status_code if r else 500,
769
+ detail=error_detail,
770
+ )
771
+
772
+
773
+ async def generate_ollama_batch_embeddings(
774
+ form_data: GenerateEmbedForm,
775
+ url_idx: Optional[int] = None,
776
+ ):
777
+ log.info(f"generate_ollama_batch_embeddings {form_data}")
778
+
779
+ if url_idx is None:
780
+ model_list = await get_all_models()
781
+ models = {model["model"]: model for model in model_list["models"]}
782
+
783
+ model = form_data.model
784
+
785
+ if ":" not in model:
786
+ model = f"{model}:latest"
787
+
788
+ if model in models:
789
+ url_idx = random.choice(models[model]["urls"])
790
+ else:
791
+ raise HTTPException(
792
+ status_code=400,
793
+ detail=ERROR_MESSAGES.MODEL_NOT_FOUND(form_data.model),
794
+ )
795
+
796
+ url = app.state.config.OLLAMA_BASE_URLS[url_idx]
797
+ log.info(f"url: {url}")
798
+
799
+ api_config = app.state.config.OLLAMA_API_CONFIGS.get(url, {})
800
+ key = api_config.get("key", None)
801
+
802
+ headers = {"Content-Type": "application/json"}
803
+ if key:
804
+ headers["Authorization"] = f"Bearer {key}"
805
+
806
+ r = requests.request(
807
+ method="POST",
808
+ url=f"{url}/api/embed",
809
+ headers=headers,
810
+ data=form_data.model_dump_json(exclude_none=True).encode(),
811
+ )
812
+ try:
813
+ r.raise_for_status()
814
+
815
+ data = r.json()
816
+
817
+ log.info(f"generate_ollama_batch_embeddings {data}")
818
+
819
+ if "embeddings" in data:
820
+ return data
821
+ else:
822
+ raise Exception("Something went wrong :/")
823
+ except Exception as e:
824
+ log.exception(e)
825
+ error_detail = "Open WebUI: Server Connection Error"
826
+ if r is not None:
827
+ try:
828
+ res = r.json()
829
+ if "error" in res:
830
+ error_detail = f"Ollama: {res['error']}"
831
+ except Exception:
832
+ error_detail = f"Ollama: {e}"
833
+
834
+ raise Exception(error_detail)
835
+
836
+
837
+ class GenerateCompletionForm(BaseModel):
838
+ model: str
839
+ prompt: str
840
+ images: Optional[list[str]] = None
841
+ format: Optional[str] = None
842
+ options: Optional[dict] = None
843
+ system: Optional[str] = None
844
+ template: Optional[str] = None
845
+ context: Optional[list[int]] = None
846
+ stream: Optional[bool] = True
847
+ raw: Optional[bool] = None
848
+ keep_alive: Optional[Union[int, str]] = None
849
+
850
+
851
+ @app.post("/api/generate")
852
+ @app.post("/api/generate/{url_idx}")
853
+ async def generate_completion(
854
+ form_data: GenerateCompletionForm,
855
+ url_idx: Optional[int] = None,
856
+ user=Depends(get_verified_user),
857
+ ):
858
+ if url_idx is None:
859
+ model_list = await get_all_models()
860
+ models = {model["model"]: model for model in model_list["models"]}
861
+
862
+ model = form_data.model
863
+
864
+ if ":" not in model:
865
+ model = f"{model}:latest"
866
+
867
+ if model in models:
868
+ url_idx = random.choice(models[model]["urls"])
869
+ else:
870
+ raise HTTPException(
871
+ status_code=400,
872
+ detail=ERROR_MESSAGES.MODEL_NOT_FOUND(form_data.model),
873
+ )
874
+
875
+ url = app.state.config.OLLAMA_BASE_URLS[url_idx]
876
+ api_config = app.state.config.OLLAMA_API_CONFIGS.get(url, {})
877
+ prefix_id = api_config.get("prefix_id", None)
878
+ if prefix_id:
879
+ form_data.model = form_data.model.replace(f"{prefix_id}.", "")
880
+ log.info(f"url: {url}")
881
+
882
+ return await post_streaming_url(
883
+ f"{url}/api/generate", form_data.model_dump_json(exclude_none=True).encode()
884
+ )
885
+
886
+
887
+ class ChatMessage(BaseModel):
888
+ role: str
889
+ content: str
890
+ images: Optional[list[str]] = None
891
+
892
+
893
+ class GenerateChatCompletionForm(BaseModel):
894
+ model: str
895
+ messages: list[ChatMessage]
896
+ format: Optional[str] = None
897
+ options: Optional[dict] = None
898
+ template: Optional[str] = None
899
+ stream: Optional[bool] = True
900
+ keep_alive: Optional[Union[int, str]] = None
901
+
902
+
903
+ async def get_ollama_url(url_idx: Optional[int], model: str):
904
+ if url_idx is None:
905
+ model_list = await get_all_models()
906
+ models = {model["model"]: model for model in model_list["models"]}
907
+
908
+ if model not in models:
909
+ raise HTTPException(
910
+ status_code=400,
911
+ detail=ERROR_MESSAGES.MODEL_NOT_FOUND(model),
912
+ )
913
+ url_idx = random.choice(models[model]["urls"])
914
+ url = app.state.config.OLLAMA_BASE_URLS[url_idx]
915
+ return url
916
+
917
+
918
+ @app.post("/api/chat")
919
+ @app.post("/api/chat/{url_idx}")
920
+ async def generate_chat_completion(
921
+ form_data: GenerateChatCompletionForm,
922
+ url_idx: Optional[int] = None,
923
+ user=Depends(get_verified_user),
924
+ bypass_filter: Optional[bool] = False,
925
+ ):
926
+ payload = {**form_data.model_dump(exclude_none=True)}
927
+ log.debug(f"generate_chat_completion() - 1.payload = {payload}")
928
+ if "metadata" in payload:
929
+ del payload["metadata"]
930
+
931
+ model_id = payload["model"]
932
+ model_info = Models.get_model_by_id(model_id)
933
+
934
+ if model_info:
935
+ if model_info.base_model_id:
936
+ payload["model"] = model_info.base_model_id
937
+
938
+ params = model_info.params.model_dump()
939
+
940
+ if params:
941
+ if payload.get("options") is None:
942
+ payload["options"] = {}
943
+
944
+ payload["options"] = apply_model_params_to_body_ollama(
945
+ params, payload["options"]
946
+ )
947
+ payload = apply_model_system_prompt_to_body(params, payload, user)
948
+
949
+ # Check if user has access to the model
950
+ if not bypass_filter and user.role == "user":
951
+ if not (
952
+ user.id == model_info.user_id
953
+ or has_access(
954
+ user.id, type="read", access_control=model_info.access_control
955
+ )
956
+ ):
957
+ raise HTTPException(
958
+ status_code=403,
959
+ detail="Model not found",
960
+ )
961
+ elif not bypass_filter:
962
+ if user.role != "admin":
963
+ raise HTTPException(
964
+ status_code=403,
965
+ detail="Model not found",
966
+ )
967
+
968
+ if ":" not in payload["model"]:
969
+ payload["model"] = f"{payload['model']}:latest"
970
+
971
+ url = await get_ollama_url(url_idx, payload["model"])
972
+ log.info(f"url: {url}")
973
+ log.debug(f"generate_chat_completion() - 2.payload = {payload}")
974
+
975
+ api_config = app.state.config.OLLAMA_API_CONFIGS.get(url, {})
976
+ prefix_id = api_config.get("prefix_id", None)
977
+ if prefix_id:
978
+ payload["model"] = payload["model"].replace(f"{prefix_id}.", "")
979
+
980
+ return await post_streaming_url(
981
+ f"{url}/api/chat",
982
+ json.dumps(payload),
983
+ stream=form_data.stream,
984
+ content_type="application/x-ndjson",
985
+ )
986
+
987
+
988
+ # TODO: we should update this part once Ollama supports other types
989
+ class OpenAIChatMessageContent(BaseModel):
990
+ type: str
991
+ model_config = ConfigDict(extra="allow")
992
+
993
+
994
+ class OpenAIChatMessage(BaseModel):
995
+ role: str
996
+ content: Union[str, list[OpenAIChatMessageContent]]
997
+
998
+ model_config = ConfigDict(extra="allow")
999
+
1000
+
1001
+ class OpenAIChatCompletionForm(BaseModel):
1002
+ model: str
1003
+ messages: list[OpenAIChatMessage]
1004
+
1005
+ model_config = ConfigDict(extra="allow")
1006
+
1007
+
1008
+ @app.post("/v1/chat/completions")
1009
+ @app.post("/v1/chat/completions/{url_idx}")
1010
+ async def generate_openai_chat_completion(
1011
+ form_data: dict,
1012
+ url_idx: Optional[int] = None,
1013
+ user=Depends(get_verified_user),
1014
+ ):
1015
+ try:
1016
+ completion_form = OpenAIChatCompletionForm(**form_data)
1017
+ except Exception as e:
1018
+ log.exception(e)
1019
+ raise HTTPException(
1020
+ status_code=400,
1021
+ detail=str(e),
1022
+ )
1023
+
1024
+ payload = {**completion_form.model_dump(exclude_none=True, exclude=["metadata"])}
1025
+ if "metadata" in payload:
1026
+ del payload["metadata"]
1027
+
1028
+ model_id = completion_form.model
1029
+ if ":" not in model_id:
1030
+ model_id = f"{model_id}:latest"
1031
+
1032
+ model_info = Models.get_model_by_id(model_id)
1033
+ if model_info:
1034
+ if model_info.base_model_id:
1035
+ payload["model"] = model_info.base_model_id
1036
+
1037
+ params = model_info.params.model_dump()
1038
+
1039
+ if params:
1040
+ payload = apply_model_params_to_body_openai(params, payload)
1041
+ payload = apply_model_system_prompt_to_body(params, payload, user)
1042
+
1043
+ # Check if user has access to the model
1044
+ if user.role == "user":
1045
+ if not (
1046
+ user.id == model_info.user_id
1047
+ or has_access(
1048
+ user.id, type="read", access_control=model_info.access_control
1049
+ )
1050
+ ):
1051
+ raise HTTPException(
1052
+ status_code=403,
1053
+ detail="Model not found",
1054
+ )
1055
+ else:
1056
+ if user.role != "admin":
1057
+ raise HTTPException(
1058
+ status_code=403,
1059
+ detail="Model not found",
1060
+ )
1061
+
1062
+ if ":" not in payload["model"]:
1063
+ payload["model"] = f"{payload['model']}:latest"
1064
+
1065
+ url = await get_ollama_url(url_idx, payload["model"])
1066
+ log.info(f"url: {url}")
1067
+
1068
+ api_config = app.state.config.OLLAMA_API_CONFIGS.get(url, {})
1069
+ prefix_id = api_config.get("prefix_id", None)
1070
+ if prefix_id:
1071
+ payload["model"] = payload["model"].replace(f"{prefix_id}.", "")
1072
+
1073
+ return await post_streaming_url(
1074
+ f"{url}/v1/chat/completions",
1075
+ json.dumps(payload),
1076
+ stream=payload.get("stream", False),
1077
+ )
1078
+
1079
+
1080
+ @app.get("/v1/models")
1081
+ @app.get("/v1/models/{url_idx}")
1082
+ async def get_openai_models(
1083
+ url_idx: Optional[int] = None,
1084
+ user=Depends(get_verified_user),
1085
+ ):
1086
+
1087
+ models = []
1088
+ if url_idx is None:
1089
+ model_list = await get_all_models()
1090
+ models = [
1091
+ {
1092
+ "id": model["model"],
1093
+ "object": "model",
1094
+ "created": int(time.time()),
1095
+ "owned_by": "openai",
1096
+ }
1097
+ for model in model_list["models"]
1098
+ ]
1099
+
1100
+ else:
1101
+ url = app.state.config.OLLAMA_BASE_URLS[url_idx]
1102
+ try:
1103
+ r = requests.request(method="GET", url=f"{url}/api/tags")
1104
+ r.raise_for_status()
1105
+
1106
+ model_list = r.json()
1107
+
1108
+ models = [
1109
+ {
1110
+ "id": model["model"],
1111
+ "object": "model",
1112
+ "created": int(time.time()),
1113
+ "owned_by": "openai",
1114
+ }
1115
+ for model in models["models"]
1116
+ ]
1117
+ except Exception as e:
1118
+ log.exception(e)
1119
+ error_detail = "Open WebUI: Server Connection Error"
1120
+ if r is not None:
1121
+ try:
1122
+ res = r.json()
1123
+ if "error" in res:
1124
+ error_detail = f"Ollama: {res['error']}"
1125
+ except Exception:
1126
+ error_detail = f"Ollama: {e}"
1127
+
1128
+ raise HTTPException(
1129
+ status_code=r.status_code if r else 500,
1130
+ detail=error_detail,
1131
+ )
1132
+
1133
+ if user.role == "user":
1134
+ # Filter models based on user access control
1135
+ filtered_models = []
1136
+ for model in models:
1137
+ model_info = Models.get_model_by_id(model["id"])
1138
+ if model_info:
1139
+ if user.id == model_info.user_id or has_access(
1140
+ user.id, type="read", access_control=model_info.access_control
1141
+ ):
1142
+ filtered_models.append(model)
1143
+ models = filtered_models
1144
+
1145
+ return {
1146
+ "data": models,
1147
+ "object": "list",
1148
+ }
1149
+
1150
+
1151
+ class UrlForm(BaseModel):
1152
+ url: str
1153
+
1154
+
1155
+ class UploadBlobForm(BaseModel):
1156
+ filename: str
1157
+
1158
+
1159
+ def parse_huggingface_url(hf_url):
1160
+ try:
1161
+ # Parse the URL
1162
+ parsed_url = urlparse(hf_url)
1163
+
1164
+ # Get the path and split it into components
1165
+ path_components = parsed_url.path.split("/")
1166
+
1167
+ # Extract the desired output
1168
+ model_file = path_components[-1]
1169
+
1170
+ return model_file
1171
+ except ValueError:
1172
+ return None
1173
+
1174
+
1175
+ async def download_file_stream(
1176
+ ollama_url, file_url, file_path, file_name, chunk_size=1024 * 1024
1177
+ ):
1178
+ done = False
1179
+
1180
+ if os.path.exists(file_path):
1181
+ current_size = os.path.getsize(file_path)
1182
+ else:
1183
+ current_size = 0
1184
+
1185
+ headers = {"Range": f"bytes={current_size}-"} if current_size > 0 else {}
1186
+
1187
+ timeout = aiohttp.ClientTimeout(total=600) # Set the timeout
1188
+
1189
+ async with aiohttp.ClientSession(timeout=timeout, trust_env=True) as session:
1190
+ async with session.get(file_url, headers=headers) as response:
1191
+ total_size = int(response.headers.get("content-length", 0)) + current_size
1192
+
1193
+ with open(file_path, "ab+") as file:
1194
+ async for data in response.content.iter_chunked(chunk_size):
1195
+ current_size += len(data)
1196
+ file.write(data)
1197
+
1198
+ done = current_size == total_size
1199
+ progress = round((current_size / total_size) * 100, 2)
1200
+
1201
+ yield f'data: {{"progress": {progress}, "completed": {current_size}, "total": {total_size}}}\n\n'
1202
+
1203
+ if done:
1204
+ file.seek(0)
1205
+ hashed = calculate_sha256(file)
1206
+ file.seek(0)
1207
+
1208
+ url = f"{ollama_url}/api/blobs/sha256:{hashed}"
1209
+ response = requests.post(url, data=file)
1210
+
1211
+ if response.ok:
1212
+ res = {
1213
+ "done": done,
1214
+ "blob": f"sha256:{hashed}",
1215
+ "name": file_name,
1216
+ }
1217
+ os.remove(file_path)
1218
+
1219
+ yield f"data: {json.dumps(res)}\n\n"
1220
+ else:
1221
+ raise "Ollama: Could not create blob, Please try again."
1222
+
1223
+
1224
+ # url = "https://huggingface.co/TheBloke/stablelm-zephyr-3b-GGUF/resolve/main/stablelm-zephyr-3b.Q2_K.gguf"
1225
+ @app.post("/models/download")
1226
+ @app.post("/models/download/{url_idx}")
1227
+ async def download_model(
1228
+ form_data: UrlForm,
1229
+ url_idx: Optional[int] = None,
1230
+ user=Depends(get_admin_user),
1231
+ ):
1232
+ allowed_hosts = ["https://huggingface.co/", "https://github.com/"]
1233
+
1234
+ if not any(form_data.url.startswith(host) for host in allowed_hosts):
1235
+ raise HTTPException(
1236
+ status_code=400,
1237
+ detail="Invalid file_url. Only URLs from allowed hosts are permitted.",
1238
+ )
1239
+
1240
+ if url_idx is None:
1241
+ url_idx = 0
1242
+ url = app.state.config.OLLAMA_BASE_URLS[url_idx]
1243
+
1244
+ file_name = parse_huggingface_url(form_data.url)
1245
+
1246
+ if file_name:
1247
+ file_path = f"{UPLOAD_DIR}/{file_name}"
1248
+
1249
+ return StreamingResponse(
1250
+ download_file_stream(url, form_data.url, file_path, file_name),
1251
+ )
1252
+ else:
1253
+ return None
1254
+
1255
+
1256
+ @app.post("/models/upload")
1257
+ @app.post("/models/upload/{url_idx}")
1258
+ def upload_model(
1259
+ file: UploadFile = File(...),
1260
+ url_idx: Optional[int] = None,
1261
+ user=Depends(get_admin_user),
1262
+ ):
1263
+ if url_idx is None:
1264
+ url_idx = 0
1265
+ ollama_url = app.state.config.OLLAMA_BASE_URLS[url_idx]
1266
+
1267
+ file_path = f"{UPLOAD_DIR}/{file.filename}"
1268
+
1269
+ # Save file in chunks
1270
+ with open(file_path, "wb+") as f:
1271
+ for chunk in file.file:
1272
+ f.write(chunk)
1273
+
1274
+ def file_process_stream():
1275
+ nonlocal ollama_url
1276
+ total_size = os.path.getsize(file_path)
1277
+ chunk_size = 1024 * 1024
1278
+ try:
1279
+ with open(file_path, "rb") as f:
1280
+ total = 0
1281
+ done = False
1282
+
1283
+ while not done:
1284
+ chunk = f.read(chunk_size)
1285
+ if not chunk:
1286
+ done = True
1287
+ continue
1288
+
1289
+ total += len(chunk)
1290
+ progress = round((total / total_size) * 100, 2)
1291
+
1292
+ res = {
1293
+ "progress": progress,
1294
+ "total": total_size,
1295
+ "completed": total,
1296
+ }
1297
+ yield f"data: {json.dumps(res)}\n\n"
1298
+
1299
+ if done:
1300
+ f.seek(0)
1301
+ hashed = calculate_sha256(f)
1302
+ f.seek(0)
1303
+
1304
+ url = f"{ollama_url}/api/blobs/sha256:{hashed}"
1305
+ response = requests.post(url, data=f)
1306
+
1307
+ if response.ok:
1308
+ res = {
1309
+ "done": done,
1310
+ "blob": f"sha256:{hashed}",
1311
+ "name": file.filename,
1312
+ }
1313
+ os.remove(file_path)
1314
+ yield f"data: {json.dumps(res)}\n\n"
1315
+ else:
1316
+ raise Exception(
1317
+ "Ollama: Could not create blob, Please try again."
1318
+ )
1319
+
1320
+ except Exception as e:
1321
+ res = {"error": str(e)}
1322
+ yield f"data: {json.dumps(res)}\n\n"
1323
+
1324
+ return StreamingResponse(file_process_stream(), media_type="text/event-stream")
backend/open_webui/apps/openai/main.py ADDED
@@ -0,0 +1,714 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import asyncio
2
+ import hashlib
3
+ import json
4
+ import logging
5
+ from pathlib import Path
6
+ from typing import Literal, Optional, overload
7
+
8
+ import aiohttp
9
+ import requests
10
+ from open_webui.apps.webui.models.models import Models
11
+ from open_webui.config import (
12
+ CACHE_DIR,
13
+ CORS_ALLOW_ORIGIN,
14
+ ENABLE_OPENAI_API,
15
+ OPENAI_API_BASE_URLS,
16
+ OPENAI_API_KEYS,
17
+ OPENAI_API_CONFIGS,
18
+ AppConfig,
19
+ )
20
+ from open_webui.env import (
21
+ AIOHTTP_CLIENT_TIMEOUT,
22
+ AIOHTTP_CLIENT_TIMEOUT_OPENAI_MODEL_LIST,
23
+ ENABLE_FORWARD_USER_INFO_HEADERS,
24
+ )
25
+
26
+ from open_webui.constants import ERROR_MESSAGES
27
+ from open_webui.env import ENV, SRC_LOG_LEVELS
28
+ from fastapi import Depends, FastAPI, HTTPException, Request
29
+ from fastapi.middleware.cors import CORSMiddleware
30
+ from fastapi.responses import FileResponse, StreamingResponse
31
+ from pydantic import BaseModel
32
+ from starlette.background import BackgroundTask
33
+
34
+ from open_webui.utils.payload import (
35
+ apply_model_params_to_body_openai,
36
+ apply_model_system_prompt_to_body,
37
+ )
38
+
39
+ from open_webui.utils.utils import get_admin_user, get_verified_user
40
+ from open_webui.utils.access_control import has_access
41
+
42
+
43
+ log = logging.getLogger(__name__)
44
+ log.setLevel(SRC_LOG_LEVELS["OPENAI"])
45
+
46
+
47
+ app = FastAPI(
48
+ docs_url="/docs" if ENV == "dev" else None,
49
+ openapi_url="/openapi.json" if ENV == "dev" else None,
50
+ redoc_url=None,
51
+ )
52
+
53
+
54
+ app.add_middleware(
55
+ CORSMiddleware,
56
+ allow_origins=CORS_ALLOW_ORIGIN,
57
+ allow_credentials=True,
58
+ allow_methods=["*"],
59
+ allow_headers=["*"],
60
+ )
61
+
62
+ app.state.config = AppConfig()
63
+
64
+ app.state.config.ENABLE_OPENAI_API = ENABLE_OPENAI_API
65
+ app.state.config.OPENAI_API_BASE_URLS = OPENAI_API_BASE_URLS
66
+ app.state.config.OPENAI_API_KEYS = OPENAI_API_KEYS
67
+ app.state.config.OPENAI_API_CONFIGS = OPENAI_API_CONFIGS
68
+
69
+
70
+ @app.get("/config")
71
+ async def get_config(user=Depends(get_admin_user)):
72
+ return {
73
+ "ENABLE_OPENAI_API": app.state.config.ENABLE_OPENAI_API,
74
+ "OPENAI_API_BASE_URLS": app.state.config.OPENAI_API_BASE_URLS,
75
+ "OPENAI_API_KEYS": app.state.config.OPENAI_API_KEYS,
76
+ "OPENAI_API_CONFIGS": app.state.config.OPENAI_API_CONFIGS,
77
+ }
78
+
79
+
80
+ class OpenAIConfigForm(BaseModel):
81
+ ENABLE_OPENAI_API: Optional[bool] = None
82
+ OPENAI_API_BASE_URLS: list[str]
83
+ OPENAI_API_KEYS: list[str]
84
+ OPENAI_API_CONFIGS: dict
85
+
86
+
87
+ @app.post("/config/update")
88
+ async def update_config(form_data: OpenAIConfigForm, user=Depends(get_admin_user)):
89
+ app.state.config.ENABLE_OPENAI_API = form_data.ENABLE_OPENAI_API
90
+
91
+ app.state.config.OPENAI_API_BASE_URLS = form_data.OPENAI_API_BASE_URLS
92
+ app.state.config.OPENAI_API_KEYS = form_data.OPENAI_API_KEYS
93
+
94
+ # Check if API KEYS length is same than API URLS length
95
+ if len(app.state.config.OPENAI_API_KEYS) != len(
96
+ app.state.config.OPENAI_API_BASE_URLS
97
+ ):
98
+ if len(app.state.config.OPENAI_API_KEYS) > len(
99
+ app.state.config.OPENAI_API_BASE_URLS
100
+ ):
101
+ app.state.config.OPENAI_API_KEYS = app.state.config.OPENAI_API_KEYS[
102
+ : len(app.state.config.OPENAI_API_BASE_URLS)
103
+ ]
104
+ else:
105
+ app.state.config.OPENAI_API_KEYS += [""] * (
106
+ len(app.state.config.OPENAI_API_BASE_URLS)
107
+ - len(app.state.config.OPENAI_API_KEYS)
108
+ )
109
+
110
+ app.state.config.OPENAI_API_CONFIGS = form_data.OPENAI_API_CONFIGS
111
+
112
+ # Remove any extra configs
113
+ config_urls = app.state.config.OPENAI_API_CONFIGS.keys()
114
+ for idx, url in enumerate(app.state.config.OPENAI_API_BASE_URLS):
115
+ if url not in config_urls:
116
+ app.state.config.OPENAI_API_CONFIGS.pop(url, None)
117
+
118
+ return {
119
+ "ENABLE_OPENAI_API": app.state.config.ENABLE_OPENAI_API,
120
+ "OPENAI_API_BASE_URLS": app.state.config.OPENAI_API_BASE_URLS,
121
+ "OPENAI_API_KEYS": app.state.config.OPENAI_API_KEYS,
122
+ "OPENAI_API_CONFIGS": app.state.config.OPENAI_API_CONFIGS,
123
+ }
124
+
125
+
126
+ @app.post("/audio/speech")
127
+ async def speech(request: Request, user=Depends(get_verified_user)):
128
+ idx = None
129
+ try:
130
+ idx = app.state.config.OPENAI_API_BASE_URLS.index("https://api.openai.com/v1")
131
+ body = await request.body()
132
+ name = hashlib.sha256(body).hexdigest()
133
+
134
+ SPEECH_CACHE_DIR = Path(CACHE_DIR).joinpath("./audio/speech/")
135
+ SPEECH_CACHE_DIR.mkdir(parents=True, exist_ok=True)
136
+ file_path = SPEECH_CACHE_DIR.joinpath(f"{name}.mp3")
137
+ file_body_path = SPEECH_CACHE_DIR.joinpath(f"{name}.json")
138
+
139
+ # Check if the file already exists in the cache
140
+ if file_path.is_file():
141
+ return FileResponse(file_path)
142
+
143
+ headers = {}
144
+ headers["Authorization"] = f"Bearer {app.state.config.OPENAI_API_KEYS[idx]}"
145
+ headers["Content-Type"] = "application/json"
146
+ if "openrouter.ai" in app.state.config.OPENAI_API_BASE_URLS[idx]:
147
+ headers["HTTP-Referer"] = "https://openwebui.com/"
148
+ headers["X-Title"] = "Open WebUI"
149
+ if ENABLE_FORWARD_USER_INFO_HEADERS:
150
+ headers["X-OpenWebUI-User-Name"] = user.name
151
+ headers["X-OpenWebUI-User-Id"] = user.id
152
+ headers["X-OpenWebUI-User-Email"] = user.email
153
+ headers["X-OpenWebUI-User-Role"] = user.role
154
+ r = None
155
+ try:
156
+ r = requests.post(
157
+ url=f"{app.state.config.OPENAI_API_BASE_URLS[idx]}/audio/speech",
158
+ data=body,
159
+ headers=headers,
160
+ stream=True,
161
+ )
162
+
163
+ r.raise_for_status()
164
+
165
+ # Save the streaming content to a file
166
+ with open(file_path, "wb") as f:
167
+ for chunk in r.iter_content(chunk_size=8192):
168
+ f.write(chunk)
169
+
170
+ with open(file_body_path, "w") as f:
171
+ json.dump(json.loads(body.decode("utf-8")), f)
172
+
173
+ # Return the saved file
174
+ return FileResponse(file_path)
175
+
176
+ except Exception as e:
177
+ log.exception(e)
178
+ error_detail = "Open WebUI: Server Connection Error"
179
+ if r is not None:
180
+ try:
181
+ res = r.json()
182
+ if "error" in res:
183
+ error_detail = f"External: {res['error']}"
184
+ except Exception:
185
+ error_detail = f"External: {e}"
186
+
187
+ raise HTTPException(
188
+ status_code=r.status_code if r else 500, detail=error_detail
189
+ )
190
+
191
+ except ValueError:
192
+ raise HTTPException(status_code=401, detail=ERROR_MESSAGES.OPENAI_NOT_FOUND)
193
+
194
+
195
+ async def aiohttp_get(url, key=None):
196
+ timeout = aiohttp.ClientTimeout(total=AIOHTTP_CLIENT_TIMEOUT_OPENAI_MODEL_LIST)
197
+ try:
198
+ headers = {"Authorization": f"Bearer {key}"} if key else {}
199
+ async with aiohttp.ClientSession(timeout=timeout, trust_env=True) as session:
200
+ async with session.get(url, headers=headers) as response:
201
+ return await response.json()
202
+ except Exception as e:
203
+ # Handle connection error here
204
+ log.error(f"Connection error: {e}")
205
+ return None
206
+
207
+
208
+ async def cleanup_response(
209
+ response: Optional[aiohttp.ClientResponse],
210
+ session: Optional[aiohttp.ClientSession],
211
+ ):
212
+ if response:
213
+ response.close()
214
+ if session:
215
+ await session.close()
216
+
217
+
218
+ def merge_models_lists(model_lists):
219
+ log.debug(f"merge_models_lists {model_lists}")
220
+ merged_list = []
221
+
222
+ for idx, models in enumerate(model_lists):
223
+ if models is not None and "error" not in models:
224
+ merged_list.extend(
225
+ [
226
+ {
227
+ **model,
228
+ "name": model.get("name", model["id"]),
229
+ "owned_by": "openai",
230
+ "openai": model,
231
+ "urlIdx": idx,
232
+ }
233
+ for model in models
234
+ if "api.openai.com"
235
+ not in app.state.config.OPENAI_API_BASE_URLS[idx]
236
+ or not any(
237
+ name in model["id"]
238
+ for name in [
239
+ "babbage",
240
+ "dall-e",
241
+ "davinci",
242
+ "embedding",
243
+ "tts",
244
+ "whisper",
245
+ ]
246
+ )
247
+ ]
248
+ )
249
+
250
+ return merged_list
251
+
252
+
253
+ async def get_all_models_responses() -> list:
254
+ if not app.state.config.ENABLE_OPENAI_API:
255
+ return []
256
+
257
+ # Check if API KEYS length is same than API URLS length
258
+ num_urls = len(app.state.config.OPENAI_API_BASE_URLS)
259
+ num_keys = len(app.state.config.OPENAI_API_KEYS)
260
+
261
+ if num_keys != num_urls:
262
+ # if there are more keys than urls, remove the extra keys
263
+ if num_keys > num_urls:
264
+ new_keys = app.state.config.OPENAI_API_KEYS[:num_urls]
265
+ app.state.config.OPENAI_API_KEYS = new_keys
266
+ # if there are more urls than keys, add empty keys
267
+ else:
268
+ app.state.config.OPENAI_API_KEYS += [""] * (num_urls - num_keys)
269
+
270
+ tasks = []
271
+ for idx, url in enumerate(app.state.config.OPENAI_API_BASE_URLS):
272
+ if url not in app.state.config.OPENAI_API_CONFIGS:
273
+ tasks.append(
274
+ aiohttp_get(f"{url}/models", app.state.config.OPENAI_API_KEYS[idx])
275
+ )
276
+ else:
277
+ api_config = app.state.config.OPENAI_API_CONFIGS.get(url, {})
278
+
279
+ enable = api_config.get("enable", True)
280
+ model_ids = api_config.get("model_ids", [])
281
+
282
+ if enable:
283
+ if len(model_ids) == 0:
284
+ tasks.append(
285
+ aiohttp_get(
286
+ f"{url}/models", app.state.config.OPENAI_API_KEYS[idx]
287
+ )
288
+ )
289
+ else:
290
+ model_list = {
291
+ "object": "list",
292
+ "data": [
293
+ {
294
+ "id": model_id,
295
+ "name": model_id,
296
+ "owned_by": "openai",
297
+ "openai": {"id": model_id},
298
+ "urlIdx": idx,
299
+ }
300
+ for model_id in model_ids
301
+ ],
302
+ }
303
+
304
+ tasks.append(asyncio.ensure_future(asyncio.sleep(0, model_list)))
305
+
306
+ responses = await asyncio.gather(*tasks)
307
+
308
+ for idx, response in enumerate(responses):
309
+ if response:
310
+ url = app.state.config.OPENAI_API_BASE_URLS[idx]
311
+ api_config = app.state.config.OPENAI_API_CONFIGS.get(url, {})
312
+
313
+ prefix_id = api_config.get("prefix_id", None)
314
+
315
+ if prefix_id:
316
+ for model in (
317
+ response if isinstance(response, list) else response.get("data", [])
318
+ ):
319
+ model["id"] = f"{prefix_id}.{model['id']}"
320
+
321
+ log.debug(f"get_all_models:responses() {responses}")
322
+
323
+ return responses
324
+
325
+
326
+ async def get_all_models() -> dict[str, list]:
327
+ log.info("get_all_models()")
328
+
329
+ if not app.state.config.ENABLE_OPENAI_API:
330
+ return {"data": []}
331
+
332
+ responses = await get_all_models_responses()
333
+
334
+ def extract_data(response):
335
+ if response and "data" in response:
336
+ return response["data"]
337
+ if isinstance(response, list):
338
+ return response
339
+ return None
340
+
341
+ models = {"data": merge_models_lists(map(extract_data, responses))}
342
+ log.debug(f"models: {models}")
343
+
344
+ return models
345
+
346
+
347
+ @app.get("/models")
348
+ @app.get("/models/{url_idx}")
349
+ async def get_models(url_idx: Optional[int] = None, user=Depends(get_verified_user)):
350
+ models = {
351
+ "data": [],
352
+ }
353
+
354
+ if url_idx is None:
355
+ models = await get_all_models()
356
+ else:
357
+ url = app.state.config.OPENAI_API_BASE_URLS[url_idx]
358
+ key = app.state.config.OPENAI_API_KEYS[url_idx]
359
+
360
+ headers = {}
361
+ headers["Authorization"] = f"Bearer {key}"
362
+ headers["Content-Type"] = "application/json"
363
+
364
+ if ENABLE_FORWARD_USER_INFO_HEADERS:
365
+ headers["X-OpenWebUI-User-Name"] = user.name
366
+ headers["X-OpenWebUI-User-Id"] = user.id
367
+ headers["X-OpenWebUI-User-Email"] = user.email
368
+ headers["X-OpenWebUI-User-Role"] = user.role
369
+
370
+ r = None
371
+
372
+ timeout = aiohttp.ClientTimeout(total=AIOHTTP_CLIENT_TIMEOUT_OPENAI_MODEL_LIST)
373
+ async with aiohttp.ClientSession(timeout=timeout) as session:
374
+ try:
375
+ async with session.get(f"{url}/models", headers=headers) as r:
376
+ if r.status != 200:
377
+ # Extract response error details if available
378
+ error_detail = f"HTTP Error: {r.status}"
379
+ res = await r.json()
380
+ if "error" in res:
381
+ error_detail = f"External Error: {res['error']}"
382
+ raise Exception(error_detail)
383
+
384
+ response_data = await r.json()
385
+
386
+ # Check if we're calling OpenAI API based on the URL
387
+ if "api.openai.com" in url:
388
+ # Filter models according to the specified conditions
389
+ response_data["data"] = [
390
+ model
391
+ for model in response_data.get("data", [])
392
+ if not any(
393
+ name in model["id"]
394
+ for name in [
395
+ "babbage",
396
+ "dall-e",
397
+ "davinci",
398
+ "embedding",
399
+ "tts",
400
+ "whisper",
401
+ ]
402
+ )
403
+ ]
404
+
405
+ models = response_data
406
+ except aiohttp.ClientError as e:
407
+ # ClientError covers all aiohttp requests issues
408
+ log.exception(f"Client error: {str(e)}")
409
+ # Handle aiohttp-specific connection issues, timeout etc.
410
+ raise HTTPException(
411
+ status_code=500, detail="Open WebUI: Server Connection Error"
412
+ )
413
+ except Exception as e:
414
+ log.exception(f"Unexpected error: {e}")
415
+ # Generic error handler in case parsing JSON or other steps fail
416
+ error_detail = f"Unexpected error: {str(e)}"
417
+ raise HTTPException(status_code=500, detail=error_detail)
418
+
419
+ if user.role == "user":
420
+ # Filter models based on user access control
421
+ filtered_models = []
422
+ for model in models.get("data", []):
423
+ model_info = Models.get_model_by_id(model["id"])
424
+ if model_info:
425
+ if user.id == model_info.user_id or has_access(
426
+ user.id, type="read", access_control=model_info.access_control
427
+ ):
428
+ filtered_models.append(model)
429
+ models["data"] = filtered_models
430
+
431
+ return models
432
+
433
+
434
+ class ConnectionVerificationForm(BaseModel):
435
+ url: str
436
+ key: str
437
+
438
+
439
+ @app.post("/verify")
440
+ async def verify_connection(
441
+ form_data: ConnectionVerificationForm, user=Depends(get_admin_user)
442
+ ):
443
+ url = form_data.url
444
+ key = form_data.key
445
+
446
+ headers = {}
447
+ headers["Authorization"] = f"Bearer {key}"
448
+ headers["Content-Type"] = "application/json"
449
+
450
+ timeout = aiohttp.ClientTimeout(total=AIOHTTP_CLIENT_TIMEOUT_OPENAI_MODEL_LIST)
451
+ async with aiohttp.ClientSession(timeout=timeout) as session:
452
+ try:
453
+ async with session.get(f"{url}/models", headers=headers) as r:
454
+ if r.status != 200:
455
+ # Extract response error details if available
456
+ error_detail = f"HTTP Error: {r.status}"
457
+ res = await r.json()
458
+ if "error" in res:
459
+ error_detail = f"External Error: {res['error']}"
460
+ raise Exception(error_detail)
461
+
462
+ response_data = await r.json()
463
+ return response_data
464
+
465
+ except aiohttp.ClientError as e:
466
+ # ClientError covers all aiohttp requests issues
467
+ log.exception(f"Client error: {str(e)}")
468
+ # Handle aiohttp-specific connection issues, timeout etc.
469
+ raise HTTPException(
470
+ status_code=500, detail="Open WebUI: Server Connection Error"
471
+ )
472
+ except Exception as e:
473
+ log.exception(f"Unexpected error: {e}")
474
+ # Generic error handler in case parsing JSON or other steps fail
475
+ error_detail = f"Unexpected error: {str(e)}"
476
+ raise HTTPException(status_code=500, detail=error_detail)
477
+
478
+
479
+ @app.post("/chat/completions")
480
+ async def generate_chat_completion(
481
+ form_data: dict,
482
+ user=Depends(get_verified_user),
483
+ bypass_filter: Optional[bool] = False,
484
+ ):
485
+ idx = 0
486
+ payload = {**form_data}
487
+
488
+ if "metadata" in payload:
489
+ del payload["metadata"]
490
+
491
+ model_id = form_data.get("model")
492
+ model_info = Models.get_model_by_id(model_id)
493
+
494
+ # Check model info and override the payload
495
+ if model_info:
496
+ if model_info.base_model_id:
497
+ payload["model"] = model_info.base_model_id
498
+
499
+ params = model_info.params.model_dump()
500
+ payload = apply_model_params_to_body_openai(params, payload)
501
+ payload = apply_model_system_prompt_to_body(params, payload, user)
502
+
503
+ # Check if user has access to the model
504
+ if not bypass_filter and user.role == "user":
505
+ if not (
506
+ user.id == model_info.user_id
507
+ or has_access(
508
+ user.id, type="read", access_control=model_info.access_control
509
+ )
510
+ ):
511
+ raise HTTPException(
512
+ status_code=403,
513
+ detail="Model not found",
514
+ )
515
+ elif not bypass_filter:
516
+ if user.role != "admin":
517
+ raise HTTPException(
518
+ status_code=403,
519
+ detail="Model not found",
520
+ )
521
+
522
+ # Attemp to get urlIdx from the model
523
+ models = await get_all_models()
524
+
525
+ # Find the model from the list
526
+ model = next(
527
+ (model for model in models["data"] if model["id"] == payload.get("model")),
528
+ None,
529
+ )
530
+
531
+ if model:
532
+ idx = model["urlIdx"]
533
+ else:
534
+ raise HTTPException(
535
+ status_code=404,
536
+ detail="Model not found",
537
+ )
538
+
539
+ # Get the API config for the model
540
+ api_config = app.state.config.OPENAI_API_CONFIGS.get(
541
+ app.state.config.OPENAI_API_BASE_URLS[idx], {}
542
+ )
543
+ prefix_id = api_config.get("prefix_id", None)
544
+
545
+ if prefix_id:
546
+ payload["model"] = payload["model"].replace(f"{prefix_id}.", "")
547
+
548
+ # Add user info to the payload if the model is a pipeline
549
+ if "pipeline" in model and model.get("pipeline"):
550
+ payload["user"] = {
551
+ "name": user.name,
552
+ "id": user.id,
553
+ "email": user.email,
554
+ "role": user.role,
555
+ }
556
+
557
+ url = app.state.config.OPENAI_API_BASE_URLS[idx]
558
+ key = app.state.config.OPENAI_API_KEYS[idx]
559
+
560
+ # Fix: O1 does not support the "max_tokens" parameter, Modify "max_tokens" to "max_completion_tokens"
561
+ is_o1 = payload["model"].lower().startswith("o1-")
562
+ # Change max_completion_tokens to max_tokens (Backward compatible)
563
+ if "api.openai.com" not in url and not is_o1:
564
+ if "max_completion_tokens" in payload:
565
+ # Remove "max_completion_tokens" from the payload
566
+ payload["max_tokens"] = payload["max_completion_tokens"]
567
+ del payload["max_completion_tokens"]
568
+ else:
569
+ if is_o1 and "max_tokens" in payload:
570
+ payload["max_completion_tokens"] = payload["max_tokens"]
571
+ del payload["max_tokens"]
572
+ if "max_tokens" in payload and "max_completion_tokens" in payload:
573
+ del payload["max_tokens"]
574
+
575
+ # Fix: O1 does not support the "system" parameter, Modify "system" to "user"
576
+ if is_o1 and payload["messages"][0]["role"] == "system":
577
+ payload["messages"][0]["role"] = "user"
578
+
579
+ # Convert the modified body back to JSON
580
+ payload = json.dumps(payload)
581
+
582
+ log.debug(payload)
583
+
584
+ headers = {}
585
+ headers["Authorization"] = f"Bearer {key}"
586
+ headers["Content-Type"] = "application/json"
587
+ if "openrouter.ai" in app.state.config.OPENAI_API_BASE_URLS[idx]:
588
+ headers["HTTP-Referer"] = "https://openwebui.com/"
589
+ headers["X-Title"] = "Open WebUI"
590
+ if ENABLE_FORWARD_USER_INFO_HEADERS:
591
+ headers["X-OpenWebUI-User-Name"] = user.name
592
+ headers["X-OpenWebUI-User-Id"] = user.id
593
+ headers["X-OpenWebUI-User-Email"] = user.email
594
+ headers["X-OpenWebUI-User-Role"] = user.role
595
+
596
+ r = None
597
+ session = None
598
+ streaming = False
599
+ response = None
600
+
601
+ try:
602
+ session = aiohttp.ClientSession(
603
+ trust_env=True, timeout=aiohttp.ClientTimeout(total=AIOHTTP_CLIENT_TIMEOUT)
604
+ )
605
+ r = await session.request(
606
+ method="POST",
607
+ url=f"{url}/chat/completions",
608
+ data=payload,
609
+ headers=headers,
610
+ )
611
+
612
+ # Check if response is SSE
613
+ if "text/event-stream" in r.headers.get("Content-Type", ""):
614
+ streaming = True
615
+ return StreamingResponse(
616
+ r.content,
617
+ status_code=r.status,
618
+ headers=dict(r.headers),
619
+ background=BackgroundTask(
620
+ cleanup_response, response=r, session=session
621
+ ),
622
+ )
623
+ else:
624
+ try:
625
+ response = await r.json()
626
+ except Exception as e:
627
+ log.error(e)
628
+ response = await r.text()
629
+
630
+ r.raise_for_status()
631
+ return response
632
+ except Exception as e:
633
+ log.exception(e)
634
+ error_detail = "Open WebUI: Server Connection Error"
635
+ if isinstance(response, dict):
636
+ if "error" in response:
637
+ error_detail = f"{response['error']['message'] if 'message' in response['error'] else response['error']}"
638
+ elif isinstance(response, str):
639
+ error_detail = response
640
+
641
+ raise HTTPException(status_code=r.status if r else 500, detail=error_detail)
642
+ finally:
643
+ if not streaming and session:
644
+ if r:
645
+ r.close()
646
+ await session.close()
647
+
648
+
649
+ @app.api_route("/{path:path}", methods=["GET", "POST", "PUT", "DELETE"])
650
+ async def proxy(path: str, request: Request, user=Depends(get_verified_user)):
651
+ idx = 0
652
+
653
+ body = await request.body()
654
+
655
+ url = app.state.config.OPENAI_API_BASE_URLS[idx]
656
+ key = app.state.config.OPENAI_API_KEYS[idx]
657
+
658
+ target_url = f"{url}/{path}"
659
+
660
+ headers = {}
661
+ headers["Authorization"] = f"Bearer {key}"
662
+ headers["Content-Type"] = "application/json"
663
+ if ENABLE_FORWARD_USER_INFO_HEADERS:
664
+ headers["X-OpenWebUI-User-Name"] = user.name
665
+ headers["X-OpenWebUI-User-Id"] = user.id
666
+ headers["X-OpenWebUI-User-Email"] = user.email
667
+ headers["X-OpenWebUI-User-Role"] = user.role
668
+
669
+ r = None
670
+ session = None
671
+ streaming = False
672
+
673
+ try:
674
+ session = aiohttp.ClientSession(trust_env=True)
675
+ r = await session.request(
676
+ method=request.method,
677
+ url=target_url,
678
+ data=body,
679
+ headers=headers,
680
+ )
681
+
682
+ r.raise_for_status()
683
+
684
+ # Check if response is SSE
685
+ if "text/event-stream" in r.headers.get("Content-Type", ""):
686
+ streaming = True
687
+ return StreamingResponse(
688
+ r.content,
689
+ status_code=r.status,
690
+ headers=dict(r.headers),
691
+ background=BackgroundTask(
692
+ cleanup_response, response=r, session=session
693
+ ),
694
+ )
695
+ else:
696
+ response_data = await r.json()
697
+ return response_data
698
+ except Exception as e:
699
+ log.exception(e)
700
+ error_detail = "Open WebUI: Server Connection Error"
701
+ if r is not None:
702
+ try:
703
+ res = await r.json()
704
+ print(res)
705
+ if "error" in res:
706
+ error_detail = f"External: {res['error']['message'] if 'message' in res['error'] else res['error']}"
707
+ except Exception:
708
+ error_detail = f"External: {e}"
709
+ raise HTTPException(status_code=r.status if r else 500, detail=error_detail)
710
+ finally:
711
+ if not streaming and session:
712
+ if r:
713
+ r.close()
714
+ await session.close()
backend/open_webui/apps/retrieval/loaders/main.py ADDED
@@ -0,0 +1,190 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import requests
2
+ import logging
3
+ import ftfy
4
+
5
+ from langchain_community.document_loaders import (
6
+ BSHTMLLoader,
7
+ CSVLoader,
8
+ Docx2txtLoader,
9
+ OutlookMessageLoader,
10
+ PyPDFLoader,
11
+ TextLoader,
12
+ UnstructuredEPubLoader,
13
+ UnstructuredExcelLoader,
14
+ UnstructuredMarkdownLoader,
15
+ UnstructuredPowerPointLoader,
16
+ UnstructuredRSTLoader,
17
+ UnstructuredXMLLoader,
18
+ YoutubeLoader,
19
+ )
20
+ from langchain_core.documents import Document
21
+ from open_webui.env import SRC_LOG_LEVELS
22
+
23
+ log = logging.getLogger(__name__)
24
+ log.setLevel(SRC_LOG_LEVELS["RAG"])
25
+
26
+ known_source_ext = [
27
+ "go",
28
+ "py",
29
+ "java",
30
+ "sh",
31
+ "bat",
32
+ "ps1",
33
+ "cmd",
34
+ "js",
35
+ "ts",
36
+ "css",
37
+ "cpp",
38
+ "hpp",
39
+ "h",
40
+ "c",
41
+ "cs",
42
+ "sql",
43
+ "log",
44
+ "ini",
45
+ "pl",
46
+ "pm",
47
+ "r",
48
+ "dart",
49
+ "dockerfile",
50
+ "env",
51
+ "php",
52
+ "hs",
53
+ "hsc",
54
+ "lua",
55
+ "nginxconf",
56
+ "conf",
57
+ "m",
58
+ "mm",
59
+ "plsql",
60
+ "perl",
61
+ "rb",
62
+ "rs",
63
+ "db2",
64
+ "scala",
65
+ "bash",
66
+ "swift",
67
+ "vue",
68
+ "svelte",
69
+ "msg",
70
+ "ex",
71
+ "exs",
72
+ "erl",
73
+ "tsx",
74
+ "jsx",
75
+ "hs",
76
+ "lhs",
77
+ ]
78
+
79
+
80
+ class TikaLoader:
81
+ def __init__(self, url, file_path, mime_type=None):
82
+ self.url = url
83
+ self.file_path = file_path
84
+ self.mime_type = mime_type
85
+
86
+ def load(self) -> list[Document]:
87
+ with open(self.file_path, "rb") as f:
88
+ data = f.read()
89
+
90
+ if self.mime_type is not None:
91
+ headers = {"Content-Type": self.mime_type}
92
+ else:
93
+ headers = {}
94
+
95
+ endpoint = self.url
96
+ if not endpoint.endswith("/"):
97
+ endpoint += "/"
98
+ endpoint += "tika/text"
99
+
100
+ r = requests.put(endpoint, data=data, headers=headers)
101
+
102
+ if r.ok:
103
+ raw_metadata = r.json()
104
+ text = raw_metadata.get("X-TIKA:content", "<No text content found>")
105
+
106
+ if "Content-Type" in raw_metadata:
107
+ headers["Content-Type"] = raw_metadata["Content-Type"]
108
+
109
+ log.info("Tika extracted text: %s", text)
110
+
111
+ return [Document(page_content=text, metadata=headers)]
112
+ else:
113
+ raise Exception(f"Error calling Tika: {r.reason}")
114
+
115
+
116
+ class Loader:
117
+ def __init__(self, engine: str = "", **kwargs):
118
+ self.engine = engine
119
+ self.kwargs = kwargs
120
+
121
+ def load(
122
+ self, filename: str, file_content_type: str, file_path: str
123
+ ) -> list[Document]:
124
+ loader = self._get_loader(filename, file_content_type, file_path)
125
+ docs = loader.load()
126
+
127
+ return [
128
+ Document(
129
+ page_content=ftfy.fix_text(doc.page_content), metadata=doc.metadata
130
+ )
131
+ for doc in docs
132
+ ]
133
+
134
+ def _get_loader(self, filename: str, file_content_type: str, file_path: str):
135
+ file_ext = filename.split(".")[-1].lower()
136
+
137
+ if self.engine == "tika" and self.kwargs.get("TIKA_SERVER_URL"):
138
+ if file_ext in known_source_ext or (
139
+ file_content_type and file_content_type.find("text/") >= 0
140
+ ):
141
+ loader = TextLoader(file_path, autodetect_encoding=True)
142
+ else:
143
+ loader = TikaLoader(
144
+ url=self.kwargs.get("TIKA_SERVER_URL"),
145
+ file_path=file_path,
146
+ mime_type=file_content_type,
147
+ )
148
+ else:
149
+ if file_ext == "pdf":
150
+ loader = PyPDFLoader(
151
+ file_path, extract_images=self.kwargs.get("PDF_EXTRACT_IMAGES")
152
+ )
153
+ elif file_ext == "csv":
154
+ loader = CSVLoader(file_path)
155
+ elif file_ext == "rst":
156
+ loader = UnstructuredRSTLoader(file_path, mode="elements")
157
+ elif file_ext == "xml":
158
+ loader = UnstructuredXMLLoader(file_path)
159
+ elif file_ext in ["htm", "html"]:
160
+ loader = BSHTMLLoader(file_path, open_encoding="unicode_escape")
161
+ elif file_ext == "md":
162
+ loader = TextLoader(file_path, autodetect_encoding=True)
163
+ elif file_content_type == "application/epub+zip":
164
+ loader = UnstructuredEPubLoader(file_path)
165
+ elif (
166
+ file_content_type
167
+ == "application/vnd.openxmlformats-officedocument.wordprocessingml.document"
168
+ or file_ext == "docx"
169
+ ):
170
+ loader = Docx2txtLoader(file_path)
171
+ elif file_content_type in [
172
+ "application/vnd.ms-excel",
173
+ "application/vnd.openxmlformats-officedocument.spreadsheetml.sheet",
174
+ ] or file_ext in ["xls", "xlsx"]:
175
+ loader = UnstructuredExcelLoader(file_path)
176
+ elif file_content_type in [
177
+ "application/vnd.ms-powerpoint",
178
+ "application/vnd.openxmlformats-officedocument.presentationml.presentation",
179
+ ] or file_ext in ["ppt", "pptx"]:
180
+ loader = UnstructuredPowerPointLoader(file_path)
181
+ elif file_ext == "msg":
182
+ loader = OutlookMessageLoader(file_path)
183
+ elif file_ext in known_source_ext or (
184
+ file_content_type and file_content_type.find("text/") >= 0
185
+ ):
186
+ loader = TextLoader(file_path, autodetect_encoding=True)
187
+ else:
188
+ loader = TextLoader(file_path, autodetect_encoding=True)
189
+
190
+ return loader
backend/open_webui/apps/retrieval/loaders/youtube.py ADDED
@@ -0,0 +1,98 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from typing import Any, Dict, Generator, List, Optional, Sequence, Union
2
+ from urllib.parse import parse_qs, urlparse
3
+ from langchain_core.documents import Document
4
+
5
+
6
+ ALLOWED_SCHEMES = {"http", "https"}
7
+ ALLOWED_NETLOCS = {
8
+ "youtu.be",
9
+ "m.youtube.com",
10
+ "youtube.com",
11
+ "www.youtube.com",
12
+ "www.youtube-nocookie.com",
13
+ "vid.plus",
14
+ }
15
+
16
+
17
+ def _parse_video_id(url: str) -> Optional[str]:
18
+ """Parse a YouTube URL and return the video ID if valid, otherwise None."""
19
+ parsed_url = urlparse(url)
20
+
21
+ if parsed_url.scheme not in ALLOWED_SCHEMES:
22
+ return None
23
+
24
+ if parsed_url.netloc not in ALLOWED_NETLOCS:
25
+ return None
26
+
27
+ path = parsed_url.path
28
+
29
+ if path.endswith("/watch"):
30
+ query = parsed_url.query
31
+ parsed_query = parse_qs(query)
32
+ if "v" in parsed_query:
33
+ ids = parsed_query["v"]
34
+ video_id = ids if isinstance(ids, str) else ids[0]
35
+ else:
36
+ return None
37
+ else:
38
+ path = parsed_url.path.lstrip("/")
39
+ video_id = path.split("/")[-1]
40
+
41
+ if len(video_id) != 11: # Video IDs are 11 characters long
42
+ return None
43
+
44
+ return video_id
45
+
46
+
47
+ class YoutubeLoader:
48
+ """Load `YouTube` video transcripts."""
49
+
50
+ def __init__(
51
+ self,
52
+ video_id: str,
53
+ language: Union[str, Sequence[str]] = "en",
54
+ ):
55
+ """Initialize with YouTube video ID."""
56
+ _video_id = _parse_video_id(video_id)
57
+ self.video_id = _video_id if _video_id is not None else video_id
58
+ self._metadata = {"source": video_id}
59
+ self.language = language
60
+ if isinstance(language, str):
61
+ self.language = [language]
62
+ else:
63
+ self.language = language
64
+
65
+ def load(self) -> List[Document]:
66
+ """Load YouTube transcripts into `Document` objects."""
67
+ try:
68
+ from youtube_transcript_api import (
69
+ NoTranscriptFound,
70
+ TranscriptsDisabled,
71
+ YouTubeTranscriptApi,
72
+ )
73
+ except ImportError:
74
+ raise ImportError(
75
+ 'Could not import "youtube_transcript_api" Python package. '
76
+ "Please install it with `pip install youtube-transcript-api`."
77
+ )
78
+
79
+ try:
80
+ transcript_list = YouTubeTranscriptApi.list_transcripts(self.video_id)
81
+ except Exception as e:
82
+ print(e)
83
+ return []
84
+
85
+ try:
86
+ transcript = transcript_list.find_transcript(self.language)
87
+ except NoTranscriptFound:
88
+ transcript = transcript_list.find_transcript(["en"])
89
+
90
+ transcript_pieces: List[Dict[str, Any]] = transcript.fetch()
91
+
92
+ transcript = " ".join(
93
+ map(
94
+ lambda transcript_piece: transcript_piece["text"].strip(" "),
95
+ transcript_pieces,
96
+ )
97
+ )
98
+ return [Document(page_content=transcript, metadata=self._metadata)]
backend/open_webui/apps/retrieval/main.py ADDED
@@ -0,0 +1,1452 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # TODO: Merge this with the webui_app and make it a single app
2
+
3
+ import json
4
+ import logging
5
+ import mimetypes
6
+ import os
7
+ import shutil
8
+
9
+ import uuid
10
+ from datetime import datetime
11
+ from pathlib import Path
12
+ from typing import Iterator, Optional, Sequence, Union
13
+
14
+ from fastapi import Depends, FastAPI, File, Form, HTTPException, UploadFile, status
15
+ from fastapi.middleware.cors import CORSMiddleware
16
+ from pydantic import BaseModel
17
+ import tiktoken
18
+
19
+
20
+ from open_webui.storage.provider import Storage
21
+ from open_webui.apps.webui.models.knowledge import Knowledges
22
+ from open_webui.apps.retrieval.vector.connector import VECTOR_DB_CLIENT
23
+
24
+ # Document loaders
25
+ from open_webui.apps.retrieval.loaders.main import Loader
26
+ from open_webui.apps.retrieval.loaders.youtube import YoutubeLoader
27
+
28
+ # Web search engines
29
+ from open_webui.apps.retrieval.web.main import SearchResult
30
+ from open_webui.apps.retrieval.web.utils import get_web_loader
31
+ from open_webui.apps.retrieval.web.brave import search_brave
32
+ from open_webui.apps.retrieval.web.duckduckgo import search_duckduckgo
33
+ from open_webui.apps.retrieval.web.google_pse import search_google_pse
34
+ from open_webui.apps.retrieval.web.jina_search import search_jina
35
+ from open_webui.apps.retrieval.web.searchapi import search_searchapi
36
+ from open_webui.apps.retrieval.web.searxng import search_searxng
37
+ from open_webui.apps.retrieval.web.serper import search_serper
38
+ from open_webui.apps.retrieval.web.serply import search_serply
39
+ from open_webui.apps.retrieval.web.serpstack import search_serpstack
40
+ from open_webui.apps.retrieval.web.tavily import search_tavily
41
+ from open_webui.apps.retrieval.web.bing import search_bing
42
+
43
+
44
+ from open_webui.apps.retrieval.utils import (
45
+ get_embedding_function,
46
+ get_model_path,
47
+ query_collection,
48
+ query_collection_with_hybrid_search,
49
+ query_doc,
50
+ query_doc_with_hybrid_search,
51
+ )
52
+
53
+ from open_webui.apps.webui.models.files import Files
54
+ from open_webui.config import (
55
+ BRAVE_SEARCH_API_KEY,
56
+ TIKTOKEN_ENCODING_NAME,
57
+ RAG_TEXT_SPLITTER,
58
+ CHUNK_OVERLAP,
59
+ CHUNK_SIZE,
60
+ CONTENT_EXTRACTION_ENGINE,
61
+ CORS_ALLOW_ORIGIN,
62
+ ENABLE_RAG_HYBRID_SEARCH,
63
+ ENABLE_RAG_LOCAL_WEB_FETCH,
64
+ ENABLE_RAG_WEB_LOADER_SSL_VERIFICATION,
65
+ ENABLE_RAG_WEB_SEARCH,
66
+ ENV,
67
+ GOOGLE_PSE_API_KEY,
68
+ GOOGLE_PSE_ENGINE_ID,
69
+ PDF_EXTRACT_IMAGES,
70
+ RAG_EMBEDDING_ENGINE,
71
+ RAG_EMBEDDING_MODEL,
72
+ RAG_EMBEDDING_MODEL_AUTO_UPDATE,
73
+ RAG_EMBEDDING_MODEL_TRUST_REMOTE_CODE,
74
+ RAG_EMBEDDING_BATCH_SIZE,
75
+ RAG_FILE_MAX_COUNT,
76
+ RAG_FILE_MAX_SIZE,
77
+ RAG_OPENAI_API_BASE_URL,
78
+ RAG_OPENAI_API_KEY,
79
+ RAG_OLLAMA_BASE_URL,
80
+ RAG_OLLAMA_API_KEY,
81
+ RAG_RELEVANCE_THRESHOLD,
82
+ RAG_RERANKING_MODEL,
83
+ RAG_RERANKING_MODEL_AUTO_UPDATE,
84
+ RAG_RERANKING_MODEL_TRUST_REMOTE_CODE,
85
+ DEFAULT_RAG_TEMPLATE,
86
+ RAG_TEMPLATE,
87
+ RAG_TOP_K,
88
+ RAG_WEB_SEARCH_CONCURRENT_REQUESTS,
89
+ RAG_WEB_SEARCH_DOMAIN_FILTER_LIST,
90
+ RAG_WEB_SEARCH_ENGINE,
91
+ RAG_WEB_SEARCH_RESULT_COUNT,
92
+ JINA_API_KEY,
93
+ SEARCHAPI_API_KEY,
94
+ SEARCHAPI_ENGINE,
95
+ SEARXNG_QUERY_URL,
96
+ SERPER_API_KEY,
97
+ SERPLY_API_KEY,
98
+ SERPSTACK_API_KEY,
99
+ SERPSTACK_HTTPS,
100
+ TAVILY_API_KEY,
101
+ BING_SEARCH_V7_ENDPOINT,
102
+ BING_SEARCH_V7_SUBSCRIPTION_KEY,
103
+ TIKA_SERVER_URL,
104
+ UPLOAD_DIR,
105
+ YOUTUBE_LOADER_LANGUAGE,
106
+ DEFAULT_LOCALE,
107
+ AppConfig,
108
+ )
109
+ from open_webui.constants import ERROR_MESSAGES
110
+ from open_webui.env import (
111
+ SRC_LOG_LEVELS,
112
+ DEVICE_TYPE,
113
+ DOCKER,
114
+ )
115
+ from open_webui.utils.misc import (
116
+ calculate_sha256,
117
+ calculate_sha256_string,
118
+ extract_folders_after_data_docs,
119
+ sanitize_filename,
120
+ )
121
+ from open_webui.utils.utils import get_admin_user, get_verified_user
122
+
123
+ from langchain.text_splitter import RecursiveCharacterTextSplitter, TokenTextSplitter
124
+ from langchain_core.documents import Document
125
+
126
+
127
+ log = logging.getLogger(__name__)
128
+ log.setLevel(SRC_LOG_LEVELS["RAG"])
129
+
130
+ app = FastAPI(
131
+ docs_url="/docs" if ENV == "dev" else None,
132
+ openapi_url="/openapi.json" if ENV == "dev" else None,
133
+ redoc_url=None,
134
+ )
135
+
136
+ app.state.config = AppConfig()
137
+
138
+ app.state.config.TOP_K = RAG_TOP_K
139
+ app.state.config.RELEVANCE_THRESHOLD = RAG_RELEVANCE_THRESHOLD
140
+ app.state.config.FILE_MAX_SIZE = RAG_FILE_MAX_SIZE
141
+ app.state.config.FILE_MAX_COUNT = RAG_FILE_MAX_COUNT
142
+
143
+ app.state.config.ENABLE_RAG_HYBRID_SEARCH = ENABLE_RAG_HYBRID_SEARCH
144
+ app.state.config.ENABLE_RAG_WEB_LOADER_SSL_VERIFICATION = (
145
+ ENABLE_RAG_WEB_LOADER_SSL_VERIFICATION
146
+ )
147
+
148
+ app.state.config.CONTENT_EXTRACTION_ENGINE = CONTENT_EXTRACTION_ENGINE
149
+ app.state.config.TIKA_SERVER_URL = TIKA_SERVER_URL
150
+
151
+ app.state.config.TEXT_SPLITTER = RAG_TEXT_SPLITTER
152
+ app.state.config.TIKTOKEN_ENCODING_NAME = TIKTOKEN_ENCODING_NAME
153
+
154
+ app.state.config.CHUNK_SIZE = CHUNK_SIZE
155
+ app.state.config.CHUNK_OVERLAP = CHUNK_OVERLAP
156
+
157
+ app.state.config.RAG_EMBEDDING_ENGINE = RAG_EMBEDDING_ENGINE
158
+ app.state.config.RAG_EMBEDDING_MODEL = RAG_EMBEDDING_MODEL
159
+ app.state.config.RAG_EMBEDDING_BATCH_SIZE = RAG_EMBEDDING_BATCH_SIZE
160
+ app.state.config.RAG_RERANKING_MODEL = RAG_RERANKING_MODEL
161
+ app.state.config.RAG_TEMPLATE = RAG_TEMPLATE
162
+
163
+ app.state.config.OPENAI_API_BASE_URL = RAG_OPENAI_API_BASE_URL
164
+ app.state.config.OPENAI_API_KEY = RAG_OPENAI_API_KEY
165
+
166
+ app.state.config.OLLAMA_BASE_URL = RAG_OLLAMA_BASE_URL
167
+ app.state.config.OLLAMA_API_KEY = RAG_OLLAMA_API_KEY
168
+
169
+ app.state.config.PDF_EXTRACT_IMAGES = PDF_EXTRACT_IMAGES
170
+
171
+ app.state.config.YOUTUBE_LOADER_LANGUAGE = YOUTUBE_LOADER_LANGUAGE
172
+ app.state.YOUTUBE_LOADER_TRANSLATION = None
173
+
174
+
175
+ app.state.config.ENABLE_RAG_WEB_SEARCH = ENABLE_RAG_WEB_SEARCH
176
+ app.state.config.RAG_WEB_SEARCH_ENGINE = RAG_WEB_SEARCH_ENGINE
177
+ app.state.config.RAG_WEB_SEARCH_DOMAIN_FILTER_LIST = RAG_WEB_SEARCH_DOMAIN_FILTER_LIST
178
+
179
+ app.state.config.SEARXNG_QUERY_URL = SEARXNG_QUERY_URL
180
+ app.state.config.GOOGLE_PSE_API_KEY = GOOGLE_PSE_API_KEY
181
+ app.state.config.GOOGLE_PSE_ENGINE_ID = GOOGLE_PSE_ENGINE_ID
182
+ app.state.config.BRAVE_SEARCH_API_KEY = BRAVE_SEARCH_API_KEY
183
+ app.state.config.SERPSTACK_API_KEY = SERPSTACK_API_KEY
184
+ app.state.config.SERPSTACK_HTTPS = SERPSTACK_HTTPS
185
+ app.state.config.SERPER_API_KEY = SERPER_API_KEY
186
+ app.state.config.SERPLY_API_KEY = SERPLY_API_KEY
187
+ app.state.config.TAVILY_API_KEY = TAVILY_API_KEY
188
+ app.state.config.SEARCHAPI_API_KEY = SEARCHAPI_API_KEY
189
+ app.state.config.SEARCHAPI_ENGINE = SEARCHAPI_ENGINE
190
+ app.state.config.JINA_API_KEY = JINA_API_KEY
191
+ app.state.config.BING_SEARCH_V7_ENDPOINT = BING_SEARCH_V7_ENDPOINT
192
+ app.state.config.BING_SEARCH_V7_SUBSCRIPTION_KEY = BING_SEARCH_V7_SUBSCRIPTION_KEY
193
+
194
+ app.state.config.RAG_WEB_SEARCH_RESULT_COUNT = RAG_WEB_SEARCH_RESULT_COUNT
195
+ app.state.config.RAG_WEB_SEARCH_CONCURRENT_REQUESTS = RAG_WEB_SEARCH_CONCURRENT_REQUESTS
196
+
197
+
198
+ def update_embedding_model(
199
+ embedding_model: str,
200
+ auto_update: bool = False,
201
+ ):
202
+ if embedding_model and app.state.config.RAG_EMBEDDING_ENGINE == "":
203
+ from sentence_transformers import SentenceTransformer
204
+
205
+ try:
206
+ app.state.sentence_transformer_ef = SentenceTransformer(
207
+ get_model_path(embedding_model, auto_update),
208
+ device=DEVICE_TYPE,
209
+ trust_remote_code=RAG_EMBEDDING_MODEL_TRUST_REMOTE_CODE,
210
+ )
211
+ except Exception as e:
212
+ log.debug(f"Error loading SentenceTransformer: {e}")
213
+ app.state.sentence_transformer_ef = None
214
+ else:
215
+ app.state.sentence_transformer_ef = None
216
+
217
+
218
+ def update_reranking_model(
219
+ reranking_model: str,
220
+ auto_update: bool = False,
221
+ ):
222
+ if reranking_model:
223
+ if any(model in reranking_model for model in ["jinaai/jina-colbert-v2"]):
224
+ try:
225
+ from open_webui.apps.retrieval.models.colbert import ColBERT
226
+
227
+ app.state.sentence_transformer_rf = ColBERT(
228
+ get_model_path(reranking_model, auto_update),
229
+ env="docker" if DOCKER else None,
230
+ )
231
+ except Exception as e:
232
+ log.error(f"ColBERT: {e}")
233
+ app.state.sentence_transformer_rf = None
234
+ app.state.config.ENABLE_RAG_HYBRID_SEARCH = False
235
+ else:
236
+ import sentence_transformers
237
+
238
+ try:
239
+ app.state.sentence_transformer_rf = sentence_transformers.CrossEncoder(
240
+ get_model_path(reranking_model, auto_update),
241
+ device=DEVICE_TYPE,
242
+ trust_remote_code=RAG_RERANKING_MODEL_TRUST_REMOTE_CODE,
243
+ )
244
+ except:
245
+ log.error("CrossEncoder error")
246
+ app.state.sentence_transformer_rf = None
247
+ app.state.config.ENABLE_RAG_HYBRID_SEARCH = False
248
+ else:
249
+ app.state.sentence_transformer_rf = None
250
+
251
+
252
+ update_embedding_model(
253
+ app.state.config.RAG_EMBEDDING_MODEL,
254
+ RAG_EMBEDDING_MODEL_AUTO_UPDATE,
255
+ )
256
+
257
+ update_reranking_model(
258
+ app.state.config.RAG_RERANKING_MODEL,
259
+ RAG_RERANKING_MODEL_AUTO_UPDATE,
260
+ )
261
+
262
+
263
+ app.state.EMBEDDING_FUNCTION = get_embedding_function(
264
+ app.state.config.RAG_EMBEDDING_ENGINE,
265
+ app.state.config.RAG_EMBEDDING_MODEL,
266
+ app.state.sentence_transformer_ef,
267
+ (
268
+ app.state.config.OPENAI_API_BASE_URL
269
+ if app.state.config.RAG_EMBEDDING_ENGINE == "openai"
270
+ else app.state.config.OLLAMA_BASE_URL
271
+ ),
272
+ (
273
+ app.state.config.OPENAI_API_KEY
274
+ if app.state.config.RAG_EMBEDDING_ENGINE == "openai"
275
+ else app.state.config.OLLAMA_API_KEY
276
+ ),
277
+ app.state.config.RAG_EMBEDDING_BATCH_SIZE,
278
+ )
279
+
280
+ app.add_middleware(
281
+ CORSMiddleware,
282
+ allow_origins=CORS_ALLOW_ORIGIN,
283
+ allow_credentials=True,
284
+ allow_methods=["*"],
285
+ allow_headers=["*"],
286
+ )
287
+
288
+
289
+ class CollectionNameForm(BaseModel):
290
+ collection_name: Optional[str] = None
291
+
292
+
293
+ class ProcessUrlForm(CollectionNameForm):
294
+ url: str
295
+
296
+
297
+ class SearchForm(CollectionNameForm):
298
+ query: str
299
+
300
+
301
+ @app.get("/")
302
+ async def get_status():
303
+ return {
304
+ "status": True,
305
+ "chunk_size": app.state.config.CHUNK_SIZE,
306
+ "chunk_overlap": app.state.config.CHUNK_OVERLAP,
307
+ "template": app.state.config.RAG_TEMPLATE,
308
+ "embedding_engine": app.state.config.RAG_EMBEDDING_ENGINE,
309
+ "embedding_model": app.state.config.RAG_EMBEDDING_MODEL,
310
+ "reranking_model": app.state.config.RAG_RERANKING_MODEL,
311
+ "embedding_batch_size": app.state.config.RAG_EMBEDDING_BATCH_SIZE,
312
+ }
313
+
314
+
315
+ @app.get("/embedding")
316
+ async def get_embedding_config(user=Depends(get_admin_user)):
317
+ return {
318
+ "status": True,
319
+ "embedding_engine": app.state.config.RAG_EMBEDDING_ENGINE,
320
+ "embedding_model": app.state.config.RAG_EMBEDDING_MODEL,
321
+ "embedding_batch_size": app.state.config.RAG_EMBEDDING_BATCH_SIZE,
322
+ "openai_config": {
323
+ "url": app.state.config.OPENAI_API_BASE_URL,
324
+ "key": app.state.config.OPENAI_API_KEY,
325
+ },
326
+ "ollama_config": {
327
+ "url": app.state.config.OLLAMA_BASE_URL,
328
+ "key": app.state.config.OLLAMA_API_KEY,
329
+ },
330
+ }
331
+
332
+
333
+ @app.get("/reranking")
334
+ async def get_reraanking_config(user=Depends(get_admin_user)):
335
+ return {
336
+ "status": True,
337
+ "reranking_model": app.state.config.RAG_RERANKING_MODEL,
338
+ }
339
+
340
+
341
+ class OpenAIConfigForm(BaseModel):
342
+ url: str
343
+ key: str
344
+
345
+
346
+ class OllamaConfigForm(BaseModel):
347
+ url: str
348
+ key: str
349
+
350
+
351
+ class EmbeddingModelUpdateForm(BaseModel):
352
+ openai_config: Optional[OpenAIConfigForm] = None
353
+ ollama_config: Optional[OllamaConfigForm] = None
354
+ embedding_engine: str
355
+ embedding_model: str
356
+ embedding_batch_size: Optional[int] = 1
357
+
358
+
359
+ @app.post("/embedding/update")
360
+ async def update_embedding_config(
361
+ form_data: EmbeddingModelUpdateForm, user=Depends(get_admin_user)
362
+ ):
363
+ log.info(
364
+ f"Updating embedding model: {app.state.config.RAG_EMBEDDING_MODEL} to {form_data.embedding_model}"
365
+ )
366
+ try:
367
+ app.state.config.RAG_EMBEDDING_ENGINE = form_data.embedding_engine
368
+ app.state.config.RAG_EMBEDDING_MODEL = form_data.embedding_model
369
+
370
+ if app.state.config.RAG_EMBEDDING_ENGINE in ["ollama", "openai"]:
371
+ if form_data.openai_config is not None:
372
+ app.state.config.OPENAI_API_BASE_URL = form_data.openai_config.url
373
+ app.state.config.OPENAI_API_KEY = form_data.openai_config.key
374
+
375
+ if form_data.ollama_config is not None:
376
+ app.state.config.OLLAMA_BASE_URL = form_data.ollama_config.url
377
+ app.state.config.OLLAMA_API_KEY = form_data.ollama_config.key
378
+
379
+ app.state.config.RAG_EMBEDDING_BATCH_SIZE = form_data.embedding_batch_size
380
+
381
+ update_embedding_model(app.state.config.RAG_EMBEDDING_MODEL)
382
+
383
+ app.state.EMBEDDING_FUNCTION = get_embedding_function(
384
+ app.state.config.RAG_EMBEDDING_ENGINE,
385
+ app.state.config.RAG_EMBEDDING_MODEL,
386
+ app.state.sentence_transformer_ef,
387
+ (
388
+ app.state.config.OPENAI_API_BASE_URL
389
+ if app.state.config.RAG_EMBEDDING_ENGINE == "openai"
390
+ else app.state.config.OLLAMA_BASE_URL
391
+ ),
392
+ (
393
+ app.state.config.OPENAI_API_KEY
394
+ if app.state.config.RAG_EMBEDDING_ENGINE == "openai"
395
+ else app.state.config.OLLAMA_API_KEY
396
+ ),
397
+ app.state.config.RAG_EMBEDDING_BATCH_SIZE,
398
+ )
399
+
400
+ return {
401
+ "status": True,
402
+ "embedding_engine": app.state.config.RAG_EMBEDDING_ENGINE,
403
+ "embedding_model": app.state.config.RAG_EMBEDDING_MODEL,
404
+ "embedding_batch_size": app.state.config.RAG_EMBEDDING_BATCH_SIZE,
405
+ "openai_config": {
406
+ "url": app.state.config.OPENAI_API_BASE_URL,
407
+ "key": app.state.config.OPENAI_API_KEY,
408
+ },
409
+ "ollama_config": {
410
+ "url": app.state.config.OLLAMA_BASE_URL,
411
+ "key": app.state.config.OLLAMA_API_KEY,
412
+ },
413
+ }
414
+ except Exception as e:
415
+ log.exception(f"Problem updating embedding model: {e}")
416
+ raise HTTPException(
417
+ status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
418
+ detail=ERROR_MESSAGES.DEFAULT(e),
419
+ )
420
+
421
+
422
+ class RerankingModelUpdateForm(BaseModel):
423
+ reranking_model: str
424
+
425
+
426
+ @app.post("/reranking/update")
427
+ async def update_reranking_config(
428
+ form_data: RerankingModelUpdateForm, user=Depends(get_admin_user)
429
+ ):
430
+ log.info(
431
+ f"Updating reranking model: {app.state.config.RAG_RERANKING_MODEL} to {form_data.reranking_model}"
432
+ )
433
+ try:
434
+ app.state.config.RAG_RERANKING_MODEL = form_data.reranking_model
435
+
436
+ update_reranking_model(app.state.config.RAG_RERANKING_MODEL, True)
437
+
438
+ return {
439
+ "status": True,
440
+ "reranking_model": app.state.config.RAG_RERANKING_MODEL,
441
+ }
442
+ except Exception as e:
443
+ log.exception(f"Problem updating reranking model: {e}")
444
+ raise HTTPException(
445
+ status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
446
+ detail=ERROR_MESSAGES.DEFAULT(e),
447
+ )
448
+
449
+
450
+ @app.get("/config")
451
+ async def get_rag_config(user=Depends(get_admin_user)):
452
+ return {
453
+ "status": True,
454
+ "pdf_extract_images": app.state.config.PDF_EXTRACT_IMAGES,
455
+ "content_extraction": {
456
+ "engine": app.state.config.CONTENT_EXTRACTION_ENGINE,
457
+ "tika_server_url": app.state.config.TIKA_SERVER_URL,
458
+ },
459
+ "chunk": {
460
+ "text_splitter": app.state.config.TEXT_SPLITTER,
461
+ "chunk_size": app.state.config.CHUNK_SIZE,
462
+ "chunk_overlap": app.state.config.CHUNK_OVERLAP,
463
+ },
464
+ "file": {
465
+ "max_size": app.state.config.FILE_MAX_SIZE,
466
+ "max_count": app.state.config.FILE_MAX_COUNT,
467
+ },
468
+ "youtube": {
469
+ "language": app.state.config.YOUTUBE_LOADER_LANGUAGE,
470
+ "translation": app.state.YOUTUBE_LOADER_TRANSLATION,
471
+ },
472
+ "web": {
473
+ "web_loader_ssl_verification": app.state.config.ENABLE_RAG_WEB_LOADER_SSL_VERIFICATION,
474
+ "search": {
475
+ "enabled": app.state.config.ENABLE_RAG_WEB_SEARCH,
476
+ "engine": app.state.config.RAG_WEB_SEARCH_ENGINE,
477
+ "searxng_query_url": app.state.config.SEARXNG_QUERY_URL,
478
+ "google_pse_api_key": app.state.config.GOOGLE_PSE_API_KEY,
479
+ "google_pse_engine_id": app.state.config.GOOGLE_PSE_ENGINE_ID,
480
+ "brave_search_api_key": app.state.config.BRAVE_SEARCH_API_KEY,
481
+ "serpstack_api_key": app.state.config.SERPSTACK_API_KEY,
482
+ "serpstack_https": app.state.config.SERPSTACK_HTTPS,
483
+ "serper_api_key": app.state.config.SERPER_API_KEY,
484
+ "serply_api_key": app.state.config.SERPLY_API_KEY,
485
+ "tavily_api_key": app.state.config.TAVILY_API_KEY,
486
+ "searchapi_api_key": app.state.config.SEARCHAPI_API_KEY,
487
+ "seaarchapi_engine": app.state.config.SEARCHAPI_ENGINE,
488
+ "jina_api_key": app.state.config.JINA_API_KEY,
489
+ "bing_search_v7_endpoint": app.state.config.BING_SEARCH_V7_ENDPOINT,
490
+ "bing_search_v7_subscription_key": app.state.config.BING_SEARCH_V7_SUBSCRIPTION_KEY,
491
+ "result_count": app.state.config.RAG_WEB_SEARCH_RESULT_COUNT,
492
+ "concurrent_requests": app.state.config.RAG_WEB_SEARCH_CONCURRENT_REQUESTS,
493
+ },
494
+ },
495
+ }
496
+
497
+
498
+ class FileConfig(BaseModel):
499
+ max_size: Optional[int] = None
500
+ max_count: Optional[int] = None
501
+
502
+
503
+ class ContentExtractionConfig(BaseModel):
504
+ engine: str = ""
505
+ tika_server_url: Optional[str] = None
506
+
507
+
508
+ class ChunkParamUpdateForm(BaseModel):
509
+ text_splitter: Optional[str] = None
510
+ chunk_size: int
511
+ chunk_overlap: int
512
+
513
+
514
+ class YoutubeLoaderConfig(BaseModel):
515
+ language: list[str]
516
+ translation: Optional[str] = None
517
+
518
+
519
+ class WebSearchConfig(BaseModel):
520
+ enabled: bool
521
+ engine: Optional[str] = None
522
+ searxng_query_url: Optional[str] = None
523
+ google_pse_api_key: Optional[str] = None
524
+ google_pse_engine_id: Optional[str] = None
525
+ brave_search_api_key: Optional[str] = None
526
+ serpstack_api_key: Optional[str] = None
527
+ serpstack_https: Optional[bool] = None
528
+ serper_api_key: Optional[str] = None
529
+ serply_api_key: Optional[str] = None
530
+ tavily_api_key: Optional[str] = None
531
+ searchapi_api_key: Optional[str] = None
532
+ searchapi_engine: Optional[str] = None
533
+ jina_api_key: Optional[str] = None
534
+ bing_search_v7_endpoint: Optional[str] = None
535
+ bing_search_v7_subscription_key: Optional[str] = None
536
+ result_count: Optional[int] = None
537
+ concurrent_requests: Optional[int] = None
538
+
539
+
540
+ class WebConfig(BaseModel):
541
+ search: WebSearchConfig
542
+ web_loader_ssl_verification: Optional[bool] = None
543
+
544
+
545
+ class ConfigUpdateForm(BaseModel):
546
+ pdf_extract_images: Optional[bool] = None
547
+ file: Optional[FileConfig] = None
548
+ content_extraction: Optional[ContentExtractionConfig] = None
549
+ chunk: Optional[ChunkParamUpdateForm] = None
550
+ youtube: Optional[YoutubeLoaderConfig] = None
551
+ web: Optional[WebConfig] = None
552
+
553
+
554
+ @app.post("/config/update")
555
+ async def update_rag_config(form_data: ConfigUpdateForm, user=Depends(get_admin_user)):
556
+ app.state.config.PDF_EXTRACT_IMAGES = (
557
+ form_data.pdf_extract_images
558
+ if form_data.pdf_extract_images is not None
559
+ else app.state.config.PDF_EXTRACT_IMAGES
560
+ )
561
+
562
+ if form_data.file is not None:
563
+ app.state.config.FILE_MAX_SIZE = form_data.file.max_size
564
+ app.state.config.FILE_MAX_COUNT = form_data.file.max_count
565
+
566
+ if form_data.content_extraction is not None:
567
+ log.info(f"Updating text settings: {form_data.content_extraction}")
568
+ app.state.config.CONTENT_EXTRACTION_ENGINE = form_data.content_extraction.engine
569
+ app.state.config.TIKA_SERVER_URL = form_data.content_extraction.tika_server_url
570
+
571
+ if form_data.chunk is not None:
572
+ app.state.config.TEXT_SPLITTER = form_data.chunk.text_splitter
573
+ app.state.config.CHUNK_SIZE = form_data.chunk.chunk_size
574
+ app.state.config.CHUNK_OVERLAP = form_data.chunk.chunk_overlap
575
+
576
+ if form_data.youtube is not None:
577
+ app.state.config.YOUTUBE_LOADER_LANGUAGE = form_data.youtube.language
578
+ app.state.YOUTUBE_LOADER_TRANSLATION = form_data.youtube.translation
579
+
580
+ if form_data.web is not None:
581
+ app.state.config.ENABLE_RAG_WEB_LOADER_SSL_VERIFICATION = (
582
+ # Note: When UI "Bypass SSL verification for Websites"=True then ENABLE_RAG_WEB_LOADER_SSL_VERIFICATION=False
583
+ form_data.web.web_loader_ssl_verification
584
+ )
585
+
586
+ app.state.config.ENABLE_RAG_WEB_SEARCH = form_data.web.search.enabled
587
+ app.state.config.RAG_WEB_SEARCH_ENGINE = form_data.web.search.engine
588
+ app.state.config.SEARXNG_QUERY_URL = form_data.web.search.searxng_query_url
589
+ app.state.config.GOOGLE_PSE_API_KEY = form_data.web.search.google_pse_api_key
590
+ app.state.config.GOOGLE_PSE_ENGINE_ID = (
591
+ form_data.web.search.google_pse_engine_id
592
+ )
593
+ app.state.config.BRAVE_SEARCH_API_KEY = (
594
+ form_data.web.search.brave_search_api_key
595
+ )
596
+ app.state.config.SERPSTACK_API_KEY = form_data.web.search.serpstack_api_key
597
+ app.state.config.SERPSTACK_HTTPS = form_data.web.search.serpstack_https
598
+ app.state.config.SERPER_API_KEY = form_data.web.search.serper_api_key
599
+ app.state.config.SERPLY_API_KEY = form_data.web.search.serply_api_key
600
+ app.state.config.TAVILY_API_KEY = form_data.web.search.tavily_api_key
601
+ app.state.config.SEARCHAPI_API_KEY = form_data.web.search.searchapi_api_key
602
+ app.state.config.SEARCHAPI_ENGINE = form_data.web.search.searchapi_engine
603
+
604
+ app.state.config.JINA_API_KEY = form_data.web.search.jina_api_key
605
+ app.state.config.BING_SEARCH_V7_ENDPOINT = (
606
+ form_data.web.search.bing_search_v7_endpoint
607
+ )
608
+ app.state.config.BING_SEARCH_V7_SUBSCRIPTION_KEY = (
609
+ form_data.web.search.bing_search_v7_subscription_key
610
+ )
611
+
612
+ app.state.config.RAG_WEB_SEARCH_RESULT_COUNT = form_data.web.search.result_count
613
+ app.state.config.RAG_WEB_SEARCH_CONCURRENT_REQUESTS = (
614
+ form_data.web.search.concurrent_requests
615
+ )
616
+
617
+ return {
618
+ "status": True,
619
+ "pdf_extract_images": app.state.config.PDF_EXTRACT_IMAGES,
620
+ "file": {
621
+ "max_size": app.state.config.FILE_MAX_SIZE,
622
+ "max_count": app.state.config.FILE_MAX_COUNT,
623
+ },
624
+ "content_extraction": {
625
+ "engine": app.state.config.CONTENT_EXTRACTION_ENGINE,
626
+ "tika_server_url": app.state.config.TIKA_SERVER_URL,
627
+ },
628
+ "chunk": {
629
+ "text_splitter": app.state.config.TEXT_SPLITTER,
630
+ "chunk_size": app.state.config.CHUNK_SIZE,
631
+ "chunk_overlap": app.state.config.CHUNK_OVERLAP,
632
+ },
633
+ "youtube": {
634
+ "language": app.state.config.YOUTUBE_LOADER_LANGUAGE,
635
+ "translation": app.state.YOUTUBE_LOADER_TRANSLATION,
636
+ },
637
+ "web": {
638
+ "web_loader_ssl_verification": app.state.config.ENABLE_RAG_WEB_LOADER_SSL_VERIFICATION,
639
+ "search": {
640
+ "enabled": app.state.config.ENABLE_RAG_WEB_SEARCH,
641
+ "engine": app.state.config.RAG_WEB_SEARCH_ENGINE,
642
+ "searxng_query_url": app.state.config.SEARXNG_QUERY_URL,
643
+ "google_pse_api_key": app.state.config.GOOGLE_PSE_API_KEY,
644
+ "google_pse_engine_id": app.state.config.GOOGLE_PSE_ENGINE_ID,
645
+ "brave_search_api_key": app.state.config.BRAVE_SEARCH_API_KEY,
646
+ "serpstack_api_key": app.state.config.SERPSTACK_API_KEY,
647
+ "serpstack_https": app.state.config.SERPSTACK_HTTPS,
648
+ "serper_api_key": app.state.config.SERPER_API_KEY,
649
+ "serply_api_key": app.state.config.SERPLY_API_KEY,
650
+ "serachapi_api_key": app.state.config.SEARCHAPI_API_KEY,
651
+ "searchapi_engine": app.state.config.SEARCHAPI_ENGINE,
652
+ "tavily_api_key": app.state.config.TAVILY_API_KEY,
653
+ "jina_api_key": app.state.config.JINA_API_KEY,
654
+ "bing_search_v7_endpoint": app.state.config.BING_SEARCH_V7_ENDPOINT,
655
+ "bing_search_v7_subscription_key": app.state.config.BING_SEARCH_V7_SUBSCRIPTION_KEY,
656
+ "result_count": app.state.config.RAG_WEB_SEARCH_RESULT_COUNT,
657
+ "concurrent_requests": app.state.config.RAG_WEB_SEARCH_CONCURRENT_REQUESTS,
658
+ },
659
+ },
660
+ }
661
+
662
+
663
+ @app.get("/template")
664
+ async def get_rag_template(user=Depends(get_verified_user)):
665
+ return {
666
+ "status": True,
667
+ "template": app.state.config.RAG_TEMPLATE,
668
+ }
669
+
670
+
671
+ @app.get("/query/settings")
672
+ async def get_query_settings(user=Depends(get_admin_user)):
673
+ return {
674
+ "status": True,
675
+ "template": app.state.config.RAG_TEMPLATE,
676
+ "k": app.state.config.TOP_K,
677
+ "r": app.state.config.RELEVANCE_THRESHOLD,
678
+ "hybrid": app.state.config.ENABLE_RAG_HYBRID_SEARCH,
679
+ }
680
+
681
+
682
+ class QuerySettingsForm(BaseModel):
683
+ k: Optional[int] = None
684
+ r: Optional[float] = None
685
+ template: Optional[str] = None
686
+ hybrid: Optional[bool] = None
687
+
688
+
689
+ @app.post("/query/settings/update")
690
+ async def update_query_settings(
691
+ form_data: QuerySettingsForm, user=Depends(get_admin_user)
692
+ ):
693
+ app.state.config.RAG_TEMPLATE = form_data.template
694
+ app.state.config.TOP_K = form_data.k if form_data.k else 4
695
+ app.state.config.RELEVANCE_THRESHOLD = form_data.r if form_data.r else 0.0
696
+
697
+ app.state.config.ENABLE_RAG_HYBRID_SEARCH = (
698
+ form_data.hybrid if form_data.hybrid else False
699
+ )
700
+
701
+ return {
702
+ "status": True,
703
+ "template": app.state.config.RAG_TEMPLATE,
704
+ "k": app.state.config.TOP_K,
705
+ "r": app.state.config.RELEVANCE_THRESHOLD,
706
+ "hybrid": app.state.config.ENABLE_RAG_HYBRID_SEARCH,
707
+ }
708
+
709
+
710
+ ####################################
711
+ #
712
+ # Document process and retrieval
713
+ #
714
+ ####################################
715
+
716
+
717
+ def _get_docs_info(docs: list[Document]) -> str:
718
+ docs_info = set()
719
+
720
+ # Trying to select relevant metadata identifying the document.
721
+ for doc in docs:
722
+ metadata = getattr(doc, "metadata", {})
723
+ doc_name = metadata.get("name", "")
724
+ if not doc_name:
725
+ doc_name = metadata.get("title", "")
726
+ if not doc_name:
727
+ doc_name = metadata.get("source", "")
728
+ if doc_name:
729
+ docs_info.add(doc_name)
730
+
731
+ return ", ".join(docs_info)
732
+
733
+
734
+ def save_docs_to_vector_db(
735
+ docs,
736
+ collection_name,
737
+ metadata: Optional[dict] = None,
738
+ overwrite: bool = False,
739
+ split: bool = True,
740
+ add: bool = False,
741
+ ) -> bool:
742
+ log.info(
743
+ f"save_docs_to_vector_db: document {_get_docs_info(docs)} {collection_name}"
744
+ )
745
+
746
+ # Check if entries with the same hash (metadata.hash) already exist
747
+ if metadata and "hash" in metadata:
748
+ result = VECTOR_DB_CLIENT.query(
749
+ collection_name=collection_name,
750
+ filter={"hash": metadata["hash"]},
751
+ )
752
+
753
+ if result is not None:
754
+ existing_doc_ids = result.ids[0]
755
+ if existing_doc_ids:
756
+ log.info(f"Document with hash {metadata['hash']} already exists")
757
+ raise ValueError(ERROR_MESSAGES.DUPLICATE_CONTENT)
758
+
759
+ if split:
760
+ if app.state.config.TEXT_SPLITTER in ["", "character"]:
761
+ text_splitter = RecursiveCharacterTextSplitter(
762
+ chunk_size=app.state.config.CHUNK_SIZE,
763
+ chunk_overlap=app.state.config.CHUNK_OVERLAP,
764
+ add_start_index=True,
765
+ )
766
+ elif app.state.config.TEXT_SPLITTER == "token":
767
+ log.info(
768
+ f"Using token text splitter: {app.state.config.TIKTOKEN_ENCODING_NAME}"
769
+ )
770
+
771
+ tiktoken.get_encoding(str(app.state.config.TIKTOKEN_ENCODING_NAME))
772
+ text_splitter = TokenTextSplitter(
773
+ encoding_name=str(app.state.config.TIKTOKEN_ENCODING_NAME),
774
+ chunk_size=app.state.config.CHUNK_SIZE,
775
+ chunk_overlap=app.state.config.CHUNK_OVERLAP,
776
+ add_start_index=True,
777
+ )
778
+ else:
779
+ raise ValueError(ERROR_MESSAGES.DEFAULT("Invalid text splitter"))
780
+
781
+ docs = text_splitter.split_documents(docs)
782
+
783
+ if len(docs) == 0:
784
+ raise ValueError(ERROR_MESSAGES.EMPTY_CONTENT)
785
+
786
+ texts = [doc.page_content for doc in docs]
787
+ metadatas = [
788
+ {
789
+ **doc.metadata,
790
+ **(metadata if metadata else {}),
791
+ "embedding_config": json.dumps(
792
+ {
793
+ "engine": app.state.config.RAG_EMBEDDING_ENGINE,
794
+ "model": app.state.config.RAG_EMBEDDING_MODEL,
795
+ }
796
+ ),
797
+ }
798
+ for doc in docs
799
+ ]
800
+
801
+ # ChromaDB does not like datetime formats
802
+ # for meta-data so convert them to string.
803
+ for metadata in metadatas:
804
+ for key, value in metadata.items():
805
+ if isinstance(value, datetime):
806
+ metadata[key] = str(value)
807
+
808
+ try:
809
+ if VECTOR_DB_CLIENT.has_collection(collection_name=collection_name):
810
+ log.info(f"collection {collection_name} already exists")
811
+
812
+ if overwrite:
813
+ VECTOR_DB_CLIENT.delete_collection(collection_name=collection_name)
814
+ log.info(f"deleting existing collection {collection_name}")
815
+ elif add is False:
816
+ log.info(
817
+ f"collection {collection_name} already exists, overwrite is False and add is False"
818
+ )
819
+ return True
820
+
821
+ log.info(f"adding to collection {collection_name}")
822
+ embedding_function = get_embedding_function(
823
+ app.state.config.RAG_EMBEDDING_ENGINE,
824
+ app.state.config.RAG_EMBEDDING_MODEL,
825
+ app.state.sentence_transformer_ef,
826
+ (
827
+ app.state.config.OPENAI_API_BASE_URL
828
+ if app.state.config.RAG_EMBEDDING_ENGINE == "openai"
829
+ else app.state.config.OLLAMA_BASE_URL
830
+ ),
831
+ (
832
+ app.state.config.OPENAI_API_KEY
833
+ if app.state.config.RAG_EMBEDDING_ENGINE == "openai"
834
+ else app.state.config.OLLAMA_API_KEY
835
+ ),
836
+ app.state.config.RAG_EMBEDDING_BATCH_SIZE,
837
+ )
838
+
839
+ embeddings = embedding_function(
840
+ list(map(lambda x: x.replace("\n", " "), texts))
841
+ )
842
+
843
+ items = [
844
+ {
845
+ "id": str(uuid.uuid4()),
846
+ "text": text,
847
+ "vector": embeddings[idx],
848
+ "metadata": metadatas[idx],
849
+ }
850
+ for idx, text in enumerate(texts)
851
+ ]
852
+
853
+ VECTOR_DB_CLIENT.insert(
854
+ collection_name=collection_name,
855
+ items=items,
856
+ )
857
+
858
+ return True
859
+ except Exception as e:
860
+ log.exception(e)
861
+ return False
862
+
863
+
864
+ class ProcessFileForm(BaseModel):
865
+ file_id: str
866
+ content: Optional[str] = None
867
+ collection_name: Optional[str] = None
868
+
869
+
870
+ @app.post("/process/file")
871
+ def process_file(
872
+ form_data: ProcessFileForm,
873
+ user=Depends(get_verified_user),
874
+ ):
875
+ try:
876
+ file = Files.get_file_by_id(form_data.file_id)
877
+
878
+ collection_name = form_data.collection_name
879
+
880
+ if collection_name is None:
881
+ collection_name = f"file-{file.id}"
882
+
883
+ if form_data.content:
884
+ # Update the content in the file
885
+ # Usage: /files/{file_id}/data/content/update
886
+
887
+ VECTOR_DB_CLIENT.delete(
888
+ collection_name=f"file-{file.id}",
889
+ filter={"file_id": file.id},
890
+ )
891
+
892
+ docs = [
893
+ Document(
894
+ page_content=form_data.content,
895
+ metadata={
896
+ "name": file.meta.get("name", file.filename),
897
+ "created_by": file.user_id,
898
+ "file_id": file.id,
899
+ **file.meta,
900
+ },
901
+ )
902
+ ]
903
+
904
+ text_content = form_data.content
905
+ elif form_data.collection_name:
906
+ # Check if the file has already been processed and save the content
907
+ # Usage: /knowledge/{id}/file/add, /knowledge/{id}/file/update
908
+
909
+ result = VECTOR_DB_CLIENT.query(
910
+ collection_name=f"file-{file.id}", filter={"file_id": file.id}
911
+ )
912
+
913
+ if result is not None and len(result.ids[0]) > 0:
914
+ docs = [
915
+ Document(
916
+ page_content=result.documents[0][idx],
917
+ metadata=result.metadatas[0][idx],
918
+ )
919
+ for idx, id in enumerate(result.ids[0])
920
+ ]
921
+ else:
922
+ docs = [
923
+ Document(
924
+ page_content=file.data.get("content", ""),
925
+ metadata={
926
+ "name": file.meta.get("name", file.filename),
927
+ "created_by": file.user_id,
928
+ "file_id": file.id,
929
+ **file.meta,
930
+ },
931
+ )
932
+ ]
933
+
934
+ text_content = file.data.get("content", "")
935
+ else:
936
+ # Process the file and save the content
937
+ # Usage: /files/
938
+ file_path = file.path
939
+ if file_path:
940
+ file_path = Storage.get_file(file_path)
941
+ loader = Loader(
942
+ engine=app.state.config.CONTENT_EXTRACTION_ENGINE,
943
+ TIKA_SERVER_URL=app.state.config.TIKA_SERVER_URL,
944
+ PDF_EXTRACT_IMAGES=app.state.config.PDF_EXTRACT_IMAGES,
945
+ )
946
+ docs = loader.load(
947
+ file.filename, file.meta.get("content_type"), file_path
948
+ )
949
+ else:
950
+ docs = [
951
+ Document(
952
+ page_content=file.data.get("content", ""),
953
+ metadata={
954
+ "name": file.filename,
955
+ "created_by": file.user_id,
956
+ "file_id": file.id,
957
+ **file.meta,
958
+ },
959
+ )
960
+ ]
961
+ text_content = " ".join([doc.page_content for doc in docs])
962
+
963
+ log.debug(f"text_content: {text_content}")
964
+ Files.update_file_data_by_id(
965
+ file.id,
966
+ {"content": text_content},
967
+ )
968
+
969
+ hash = calculate_sha256_string(text_content)
970
+ Files.update_file_hash_by_id(file.id, hash)
971
+
972
+ try:
973
+ result = save_docs_to_vector_db(
974
+ docs=docs,
975
+ collection_name=collection_name,
976
+ metadata={
977
+ "file_id": file.id,
978
+ "name": file.meta.get("name", file.filename),
979
+ "hash": hash,
980
+ },
981
+ add=(True if form_data.collection_name else False),
982
+ )
983
+
984
+ if result:
985
+ Files.update_file_metadata_by_id(
986
+ file.id,
987
+ {
988
+ "collection_name": collection_name,
989
+ },
990
+ )
991
+
992
+ return {
993
+ "status": True,
994
+ "collection_name": collection_name,
995
+ "filename": file.meta.get("name", file.filename),
996
+ "content": text_content,
997
+ }
998
+ except Exception as e:
999
+ raise e
1000
+ except Exception as e:
1001
+ log.exception(e)
1002
+ if "No pandoc was found" in str(e):
1003
+ raise HTTPException(
1004
+ status_code=status.HTTP_400_BAD_REQUEST,
1005
+ detail=ERROR_MESSAGES.PANDOC_NOT_INSTALLED,
1006
+ )
1007
+ else:
1008
+ raise HTTPException(
1009
+ status_code=status.HTTP_400_BAD_REQUEST,
1010
+ detail=str(e),
1011
+ )
1012
+
1013
+
1014
+ class ProcessTextForm(BaseModel):
1015
+ name: str
1016
+ content: str
1017
+ collection_name: Optional[str] = None
1018
+
1019
+
1020
+ @app.post("/process/text")
1021
+ def process_text(
1022
+ form_data: ProcessTextForm,
1023
+ user=Depends(get_verified_user),
1024
+ ):
1025
+ collection_name = form_data.collection_name
1026
+ if collection_name is None:
1027
+ collection_name = calculate_sha256_string(form_data.content)
1028
+
1029
+ docs = [
1030
+ Document(
1031
+ page_content=form_data.content,
1032
+ metadata={"name": form_data.name, "created_by": user.id},
1033
+ )
1034
+ ]
1035
+ text_content = form_data.content
1036
+ log.debug(f"text_content: {text_content}")
1037
+
1038
+ result = save_docs_to_vector_db(docs, collection_name)
1039
+
1040
+ if result:
1041
+ return {
1042
+ "status": True,
1043
+ "collection_name": collection_name,
1044
+ "content": text_content,
1045
+ }
1046
+ else:
1047
+ raise HTTPException(
1048
+ status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
1049
+ detail=ERROR_MESSAGES.DEFAULT(),
1050
+ )
1051
+
1052
+
1053
+ @app.post("/process/youtube")
1054
+ def process_youtube_video(form_data: ProcessUrlForm, user=Depends(get_verified_user)):
1055
+ try:
1056
+ collection_name = form_data.collection_name
1057
+ if not collection_name:
1058
+ collection_name = calculate_sha256_string(form_data.url)[:63]
1059
+
1060
+ loader = YoutubeLoader(
1061
+ form_data.url, language=app.state.config.YOUTUBE_LOADER_LANGUAGE
1062
+ )
1063
+
1064
+ docs = loader.load()
1065
+ content = " ".join([doc.page_content for doc in docs])
1066
+ log.debug(f"text_content: {content}")
1067
+ save_docs_to_vector_db(docs, collection_name, overwrite=True)
1068
+
1069
+ return {
1070
+ "status": True,
1071
+ "collection_name": collection_name,
1072
+ "filename": form_data.url,
1073
+ "file": {
1074
+ "data": {
1075
+ "content": content,
1076
+ },
1077
+ "meta": {
1078
+ "name": form_data.url,
1079
+ },
1080
+ },
1081
+ }
1082
+ except Exception as e:
1083
+ log.exception(e)
1084
+ raise HTTPException(
1085
+ status_code=status.HTTP_400_BAD_REQUEST,
1086
+ detail=ERROR_MESSAGES.DEFAULT(e),
1087
+ )
1088
+
1089
+
1090
+ @app.post("/process/web")
1091
+ def process_web(form_data: ProcessUrlForm, user=Depends(get_verified_user)):
1092
+ try:
1093
+ collection_name = form_data.collection_name
1094
+ if not collection_name:
1095
+ collection_name = calculate_sha256_string(form_data.url)[:63]
1096
+
1097
+ loader = get_web_loader(
1098
+ form_data.url,
1099
+ verify_ssl=app.state.config.ENABLE_RAG_WEB_LOADER_SSL_VERIFICATION,
1100
+ requests_per_second=app.state.config.RAG_WEB_SEARCH_CONCURRENT_REQUESTS,
1101
+ )
1102
+ docs = loader.load()
1103
+ content = " ".join([doc.page_content for doc in docs])
1104
+ log.debug(f"text_content: {content}")
1105
+ save_docs_to_vector_db(docs, collection_name, overwrite=True)
1106
+
1107
+ return {
1108
+ "status": True,
1109
+ "collection_name": collection_name,
1110
+ "filename": form_data.url,
1111
+ "file": {
1112
+ "data": {
1113
+ "content": content,
1114
+ },
1115
+ "meta": {
1116
+ "name": form_data.url,
1117
+ },
1118
+ },
1119
+ }
1120
+ except Exception as e:
1121
+ log.exception(e)
1122
+ raise HTTPException(
1123
+ status_code=status.HTTP_400_BAD_REQUEST,
1124
+ detail=ERROR_MESSAGES.DEFAULT(e),
1125
+ )
1126
+
1127
+
1128
+ def search_web(engine: str, query: str) -> list[SearchResult]:
1129
+ """Search the web using a search engine and return the results as a list of SearchResult objects.
1130
+ Will look for a search engine API key in environment variables in the following order:
1131
+ - SEARXNG_QUERY_URL
1132
+ - GOOGLE_PSE_API_KEY + GOOGLE_PSE_ENGINE_ID
1133
+ - BRAVE_SEARCH_API_KEY
1134
+ - SERPSTACK_API_KEY
1135
+ - SERPER_API_KEY
1136
+ - SERPLY_API_KEY
1137
+ - TAVILY_API_KEY
1138
+ - SEARCHAPI_API_KEY + SEARCHAPI_ENGINE (by default `google`)
1139
+ Args:
1140
+ query (str): The query to search for
1141
+ """
1142
+
1143
+ # TODO: add playwright to search the web
1144
+ if engine == "searxng":
1145
+ if app.state.config.SEARXNG_QUERY_URL:
1146
+ return search_searxng(
1147
+ app.state.config.SEARXNG_QUERY_URL,
1148
+ query,
1149
+ app.state.config.RAG_WEB_SEARCH_RESULT_COUNT,
1150
+ app.state.config.RAG_WEB_SEARCH_DOMAIN_FILTER_LIST,
1151
+ )
1152
+ else:
1153
+ raise Exception("No SEARXNG_QUERY_URL found in environment variables")
1154
+ elif engine == "google_pse":
1155
+ if (
1156
+ app.state.config.GOOGLE_PSE_API_KEY
1157
+ and app.state.config.GOOGLE_PSE_ENGINE_ID
1158
+ ):
1159
+ return search_google_pse(
1160
+ app.state.config.GOOGLE_PSE_API_KEY,
1161
+ app.state.config.GOOGLE_PSE_ENGINE_ID,
1162
+ query,
1163
+ app.state.config.RAG_WEB_SEARCH_RESULT_COUNT,
1164
+ app.state.config.RAG_WEB_SEARCH_DOMAIN_FILTER_LIST,
1165
+ )
1166
+ else:
1167
+ raise Exception(
1168
+ "No GOOGLE_PSE_API_KEY or GOOGLE_PSE_ENGINE_ID found in environment variables"
1169
+ )
1170
+ elif engine == "brave":
1171
+ if app.state.config.BRAVE_SEARCH_API_KEY:
1172
+ return search_brave(
1173
+ app.state.config.BRAVE_SEARCH_API_KEY,
1174
+ query,
1175
+ app.state.config.RAG_WEB_SEARCH_RESULT_COUNT,
1176
+ app.state.config.RAG_WEB_SEARCH_DOMAIN_FILTER_LIST,
1177
+ )
1178
+ else:
1179
+ raise Exception("No BRAVE_SEARCH_API_KEY found in environment variables")
1180
+ elif engine == "serpstack":
1181
+ if app.state.config.SERPSTACK_API_KEY:
1182
+ return search_serpstack(
1183
+ app.state.config.SERPSTACK_API_KEY,
1184
+ query,
1185
+ app.state.config.RAG_WEB_SEARCH_RESULT_COUNT,
1186
+ app.state.config.RAG_WEB_SEARCH_DOMAIN_FILTER_LIST,
1187
+ https_enabled=app.state.config.SERPSTACK_HTTPS,
1188
+ )
1189
+ else:
1190
+ raise Exception("No SERPSTACK_API_KEY found in environment variables")
1191
+ elif engine == "serper":
1192
+ if app.state.config.SERPER_API_KEY:
1193
+ return search_serper(
1194
+ app.state.config.SERPER_API_KEY,
1195
+ query,
1196
+ app.state.config.RAG_WEB_SEARCH_RESULT_COUNT,
1197
+ app.state.config.RAG_WEB_SEARCH_DOMAIN_FILTER_LIST,
1198
+ )
1199
+ else:
1200
+ raise Exception("No SERPER_API_KEY found in environment variables")
1201
+ elif engine == "serply":
1202
+ if app.state.config.SERPLY_API_KEY:
1203
+ return search_serply(
1204
+ app.state.config.SERPLY_API_KEY,
1205
+ query,
1206
+ app.state.config.RAG_WEB_SEARCH_RESULT_COUNT,
1207
+ app.state.config.RAG_WEB_SEARCH_DOMAIN_FILTER_LIST,
1208
+ )
1209
+ else:
1210
+ raise Exception("No SERPLY_API_KEY found in environment variables")
1211
+ elif engine == "duckduckgo":
1212
+ return search_duckduckgo(
1213
+ query,
1214
+ app.state.config.RAG_WEB_SEARCH_RESULT_COUNT,
1215
+ app.state.config.RAG_WEB_SEARCH_DOMAIN_FILTER_LIST,
1216
+ )
1217
+ elif engine == "tavily":
1218
+ if app.state.config.TAVILY_API_KEY:
1219
+ return search_tavily(
1220
+ app.state.config.TAVILY_API_KEY,
1221
+ query,
1222
+ app.state.config.RAG_WEB_SEARCH_RESULT_COUNT,
1223
+ )
1224
+ else:
1225
+ raise Exception("No TAVILY_API_KEY found in environment variables")
1226
+ elif engine == "searchapi":
1227
+ if app.state.config.SEARCHAPI_API_KEY:
1228
+ return search_searchapi(
1229
+ app.state.config.SEARCHAPI_API_KEY,
1230
+ app.state.config.SEARCHAPI_ENGINE,
1231
+ query,
1232
+ app.state.config.RAG_WEB_SEARCH_RESULT_COUNT,
1233
+ app.state.config.RAG_WEB_SEARCH_DOMAIN_FILTER_LIST,
1234
+ )
1235
+ else:
1236
+ raise Exception("No SEARCHAPI_API_KEY found in environment variables")
1237
+ elif engine == "jina":
1238
+ return search_jina(
1239
+ app.state.config.JINA_API_KEY,
1240
+ query,
1241
+ app.state.config.RAG_WEB_SEARCH_RESULT_COUNT,
1242
+ )
1243
+ elif engine == "bing":
1244
+ return search_bing(
1245
+ app.state.config.BING_SEARCH_V7_SUBSCRIPTION_KEY,
1246
+ app.state.config.BING_SEARCH_V7_ENDPOINT,
1247
+ str(DEFAULT_LOCALE),
1248
+ query,
1249
+ app.state.config.RAG_WEB_SEARCH_RESULT_COUNT,
1250
+ app.state.config.RAG_WEB_SEARCH_DOMAIN_FILTER_LIST,
1251
+ )
1252
+ else:
1253
+ raise Exception("No search engine API key found in environment variables")
1254
+
1255
+
1256
+ @app.post("/process/web/search")
1257
+ def process_web_search(form_data: SearchForm, user=Depends(get_verified_user)):
1258
+ try:
1259
+ logging.info(
1260
+ f"trying to web search with {app.state.config.RAG_WEB_SEARCH_ENGINE, form_data.query}"
1261
+ )
1262
+ web_results = search_web(
1263
+ app.state.config.RAG_WEB_SEARCH_ENGINE, form_data.query
1264
+ )
1265
+ except Exception as e:
1266
+ log.exception(e)
1267
+
1268
+ print(e)
1269
+ raise HTTPException(
1270
+ status_code=status.HTTP_400_BAD_REQUEST,
1271
+ detail=ERROR_MESSAGES.WEB_SEARCH_ERROR(e),
1272
+ )
1273
+
1274
+ try:
1275
+ collection_name = form_data.collection_name
1276
+ if collection_name == "":
1277
+ collection_name = calculate_sha256_string(form_data.query)[:63]
1278
+
1279
+ urls = [result.link for result in web_results]
1280
+
1281
+ loader = get_web_loader(
1282
+ urls,
1283
+ verify_ssl=app.state.config.ENABLE_RAG_WEB_LOADER_SSL_VERIFICATION,
1284
+ requests_per_second=app.state.config.RAG_WEB_SEARCH_CONCURRENT_REQUESTS,
1285
+ )
1286
+ docs = loader.aload()
1287
+
1288
+ save_docs_to_vector_db(docs, collection_name, overwrite=True)
1289
+
1290
+ return {
1291
+ "status": True,
1292
+ "collection_name": collection_name,
1293
+ "filenames": urls,
1294
+ }
1295
+ except Exception as e:
1296
+ log.exception(e)
1297
+ raise HTTPException(
1298
+ status_code=status.HTTP_400_BAD_REQUEST,
1299
+ detail=ERROR_MESSAGES.DEFAULT(e),
1300
+ )
1301
+
1302
+
1303
+ class QueryDocForm(BaseModel):
1304
+ collection_name: str
1305
+ query: str
1306
+ k: Optional[int] = None
1307
+ r: Optional[float] = None
1308
+ hybrid: Optional[bool] = None
1309
+
1310
+
1311
+ @app.post("/query/doc")
1312
+ def query_doc_handler(
1313
+ form_data: QueryDocForm,
1314
+ user=Depends(get_verified_user),
1315
+ ):
1316
+ try:
1317
+ if app.state.config.ENABLE_RAG_HYBRID_SEARCH:
1318
+ return query_doc_with_hybrid_search(
1319
+ collection_name=form_data.collection_name,
1320
+ query=form_data.query,
1321
+ embedding_function=app.state.EMBEDDING_FUNCTION,
1322
+ k=form_data.k if form_data.k else app.state.config.TOP_K,
1323
+ reranking_function=app.state.sentence_transformer_rf,
1324
+ r=(
1325
+ form_data.r if form_data.r else app.state.config.RELEVANCE_THRESHOLD
1326
+ ),
1327
+ )
1328
+ else:
1329
+ return query_doc(
1330
+ collection_name=form_data.collection_name,
1331
+ query=form_data.query,
1332
+ embedding_function=app.state.EMBEDDING_FUNCTION,
1333
+ k=form_data.k if form_data.k else app.state.config.TOP_K,
1334
+ )
1335
+ except Exception as e:
1336
+ log.exception(e)
1337
+ raise HTTPException(
1338
+ status_code=status.HTTP_400_BAD_REQUEST,
1339
+ detail=ERROR_MESSAGES.DEFAULT(e),
1340
+ )
1341
+
1342
+
1343
+ class QueryCollectionsForm(BaseModel):
1344
+ collection_names: list[str]
1345
+ query: str
1346
+ k: Optional[int] = None
1347
+ r: Optional[float] = None
1348
+ hybrid: Optional[bool] = None
1349
+
1350
+
1351
+ @app.post("/query/collection")
1352
+ def query_collection_handler(
1353
+ form_data: QueryCollectionsForm,
1354
+ user=Depends(get_verified_user),
1355
+ ):
1356
+ try:
1357
+ if app.state.config.ENABLE_RAG_HYBRID_SEARCH:
1358
+ return query_collection_with_hybrid_search(
1359
+ collection_names=form_data.collection_names,
1360
+ query=form_data.query,
1361
+ embedding_function=app.state.EMBEDDING_FUNCTION,
1362
+ k=form_data.k if form_data.k else app.state.config.TOP_K,
1363
+ reranking_function=app.state.sentence_transformer_rf,
1364
+ r=(
1365
+ form_data.r if form_data.r else app.state.config.RELEVANCE_THRESHOLD
1366
+ ),
1367
+ )
1368
+ else:
1369
+ return query_collection(
1370
+ collection_names=form_data.collection_names,
1371
+ query=form_data.query,
1372
+ embedding_function=app.state.EMBEDDING_FUNCTION,
1373
+ k=form_data.k if form_data.k else app.state.config.TOP_K,
1374
+ )
1375
+
1376
+ except Exception as e:
1377
+ log.exception(e)
1378
+ raise HTTPException(
1379
+ status_code=status.HTTP_400_BAD_REQUEST,
1380
+ detail=ERROR_MESSAGES.DEFAULT(e),
1381
+ )
1382
+
1383
+
1384
+ ####################################
1385
+ #
1386
+ # Vector DB operations
1387
+ #
1388
+ ####################################
1389
+
1390
+
1391
+ class DeleteForm(BaseModel):
1392
+ collection_name: str
1393
+ file_id: str
1394
+
1395
+
1396
+ @app.post("/delete")
1397
+ def delete_entries_from_collection(form_data: DeleteForm, user=Depends(get_admin_user)):
1398
+ try:
1399
+ if VECTOR_DB_CLIENT.has_collection(collection_name=form_data.collection_name):
1400
+ file = Files.get_file_by_id(form_data.file_id)
1401
+ hash = file.hash
1402
+
1403
+ VECTOR_DB_CLIENT.delete(
1404
+ collection_name=form_data.collection_name,
1405
+ metadata={"hash": hash},
1406
+ )
1407
+ return {"status": True}
1408
+ else:
1409
+ return {"status": False}
1410
+ except Exception as e:
1411
+ log.exception(e)
1412
+ return {"status": False}
1413
+
1414
+
1415
+ @app.post("/reset/db")
1416
+ def reset_vector_db(user=Depends(get_admin_user)):
1417
+ VECTOR_DB_CLIENT.reset()
1418
+ Knowledges.delete_all_knowledge()
1419
+
1420
+
1421
+ @app.post("/reset/uploads")
1422
+ def reset_upload_dir(user=Depends(get_admin_user)) -> bool:
1423
+ folder = f"{UPLOAD_DIR}"
1424
+ try:
1425
+ # Check if the directory exists
1426
+ if os.path.exists(folder):
1427
+ # Iterate over all the files and directories in the specified directory
1428
+ for filename in os.listdir(folder):
1429
+ file_path = os.path.join(folder, filename)
1430
+ try:
1431
+ if os.path.isfile(file_path) or os.path.islink(file_path):
1432
+ os.unlink(file_path) # Remove the file or link
1433
+ elif os.path.isdir(file_path):
1434
+ shutil.rmtree(file_path) # Remove the directory
1435
+ except Exception as e:
1436
+ print(f"Failed to delete {file_path}. Reason: {e}")
1437
+ else:
1438
+ print(f"The directory {folder} does not exist")
1439
+ except Exception as e:
1440
+ print(f"Failed to process the directory {folder}. Reason: {e}")
1441
+ return True
1442
+
1443
+
1444
+ if ENV == "dev":
1445
+
1446
+ @app.get("/ef")
1447
+ async def get_embeddings():
1448
+ return {"result": app.state.EMBEDDING_FUNCTION("hello world")}
1449
+
1450
+ @app.get("/ef/{text}")
1451
+ async def get_embeddings_text(text: str):
1452
+ return {"result": app.state.EMBEDDING_FUNCTION(text)}
backend/open_webui/apps/retrieval/models/colbert.py ADDED
@@ -0,0 +1,81 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import os
2
+ import torch
3
+ import numpy as np
4
+ from colbert.infra import ColBERTConfig
5
+ from colbert.modeling.checkpoint import Checkpoint
6
+
7
+
8
+ class ColBERT:
9
+ def __init__(self, name, **kwargs) -> None:
10
+ print("ColBERT: Loading model", name)
11
+ self.device = "cuda" if torch.cuda.is_available() else "cpu"
12
+
13
+ DOCKER = kwargs.get("env") == "docker"
14
+ if DOCKER:
15
+ # This is a workaround for the issue with the docker container
16
+ # where the torch extension is not loaded properly
17
+ # and the following error is thrown:
18
+ # /root/.cache/torch_extensions/py311_cpu/segmented_maxsim_cpp/segmented_maxsim_cpp.so: cannot open shared object file: No such file or directory
19
+
20
+ lock_file = (
21
+ "/root/.cache/torch_extensions/py311_cpu/segmented_maxsim_cpp/lock"
22
+ )
23
+ if os.path.exists(lock_file):
24
+ os.remove(lock_file)
25
+
26
+ self.ckpt = Checkpoint(
27
+ name,
28
+ colbert_config=ColBERTConfig(model_name=name),
29
+ ).to(self.device)
30
+ pass
31
+
32
+ def calculate_similarity_scores(self, query_embeddings, document_embeddings):
33
+
34
+ query_embeddings = query_embeddings.to(self.device)
35
+ document_embeddings = document_embeddings.to(self.device)
36
+
37
+ # Validate dimensions to ensure compatibility
38
+ if query_embeddings.dim() != 3:
39
+ raise ValueError(
40
+ f"Expected query embeddings to have 3 dimensions, but got {query_embeddings.dim()}."
41
+ )
42
+ if document_embeddings.dim() != 3:
43
+ raise ValueError(
44
+ f"Expected document embeddings to have 3 dimensions, but got {document_embeddings.dim()}."
45
+ )
46
+ if query_embeddings.size(0) not in [1, document_embeddings.size(0)]:
47
+ raise ValueError(
48
+ "There should be either one query or queries equal to the number of documents."
49
+ )
50
+
51
+ # Transpose the query embeddings to align for matrix multiplication
52
+ transposed_query_embeddings = query_embeddings.permute(0, 2, 1)
53
+ # Compute similarity scores using batch matrix multiplication
54
+ computed_scores = torch.matmul(document_embeddings, transposed_query_embeddings)
55
+ # Apply max pooling to extract the highest semantic similarity across each document's sequence
56
+ maximum_scores = torch.max(computed_scores, dim=1).values
57
+
58
+ # Sum up the maximum scores across features to get the overall document relevance scores
59
+ final_scores = maximum_scores.sum(dim=1)
60
+
61
+ normalized_scores = torch.softmax(final_scores, dim=0)
62
+
63
+ return normalized_scores.detach().cpu().numpy().astype(np.float32)
64
+
65
+ def predict(self, sentences):
66
+
67
+ query = sentences[0][0]
68
+ docs = [i[1] for i in sentences]
69
+
70
+ # Embedding the documents
71
+ embedded_docs = self.ckpt.docFromText(docs, bsize=32)[0]
72
+ # Embedding the queries
73
+ embedded_queries = self.ckpt.queryFromText([query], bsize=32)
74
+ embedded_query = embedded_queries[0]
75
+
76
+ # Calculate retrieval scores for the query against all documents
77
+ scores = self.calculate_similarity_scores(
78
+ embedded_query.unsqueeze(0), embedded_docs
79
+ )
80
+
81
+ return scores
backend/open_webui/apps/retrieval/utils.py ADDED
@@ -0,0 +1,592 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import logging
2
+ import os
3
+ import uuid
4
+ from typing import Optional, Union
5
+
6
+ import asyncio
7
+ import requests
8
+
9
+ from huggingface_hub import snapshot_download
10
+ from langchain.retrievers import ContextualCompressionRetriever, EnsembleRetriever
11
+ from langchain_community.retrievers import BM25Retriever
12
+ from langchain_core.documents import Document
13
+
14
+ from open_webui.apps.retrieval.vector.connector import VECTOR_DB_CLIENT
15
+ from open_webui.utils.misc import get_last_user_message
16
+
17
+ from open_webui.env import SRC_LOG_LEVELS
18
+ from open_webui.config import DEFAULT_RAG_TEMPLATE
19
+
20
+
21
+ log = logging.getLogger(__name__)
22
+ log.setLevel(SRC_LOG_LEVELS["RAG"])
23
+
24
+
25
+ from typing import Any
26
+
27
+ from langchain_core.callbacks import CallbackManagerForRetrieverRun
28
+ from langchain_core.retrievers import BaseRetriever
29
+
30
+
31
+ class VectorSearchRetriever(BaseRetriever):
32
+ collection_name: Any
33
+ embedding_function: Any
34
+ top_k: int
35
+
36
+ def _get_relevant_documents(
37
+ self,
38
+ query: str,
39
+ *,
40
+ run_manager: CallbackManagerForRetrieverRun,
41
+ ) -> list[Document]:
42
+ result = VECTOR_DB_CLIENT.search(
43
+ collection_name=self.collection_name,
44
+ vectors=[self.embedding_function(query)],
45
+ limit=self.top_k,
46
+ )
47
+
48
+ ids = result.ids[0]
49
+ metadatas = result.metadatas[0]
50
+ documents = result.documents[0]
51
+
52
+ results = []
53
+ for idx in range(len(ids)):
54
+ results.append(
55
+ Document(
56
+ metadata=metadatas[idx],
57
+ page_content=documents[idx],
58
+ )
59
+ )
60
+ return results
61
+
62
+
63
+ def query_doc(
64
+ collection_name: str,
65
+ query_embedding: list[float],
66
+ k: int,
67
+ ):
68
+ try:
69
+ result = VECTOR_DB_CLIENT.search(
70
+ collection_name=collection_name,
71
+ vectors=[query_embedding],
72
+ limit=k,
73
+ )
74
+
75
+ log.info(f"query_doc:result {result.ids} {result.metadatas}")
76
+ return result
77
+ except Exception as e:
78
+ print(e)
79
+ raise e
80
+
81
+
82
+ def query_doc_with_hybrid_search(
83
+ collection_name: str,
84
+ query: str,
85
+ embedding_function,
86
+ k: int,
87
+ reranking_function,
88
+ r: float,
89
+ ) -> dict:
90
+ try:
91
+ result = VECTOR_DB_CLIENT.get(collection_name=collection_name)
92
+
93
+ bm25_retriever = BM25Retriever.from_texts(
94
+ texts=result.documents[0],
95
+ metadatas=result.metadatas[0],
96
+ )
97
+ bm25_retriever.k = k
98
+
99
+ vector_search_retriever = VectorSearchRetriever(
100
+ collection_name=collection_name,
101
+ embedding_function=embedding_function,
102
+ top_k=k,
103
+ )
104
+
105
+ ensemble_retriever = EnsembleRetriever(
106
+ retrievers=[bm25_retriever, vector_search_retriever], weights=[0.5, 0.5]
107
+ )
108
+ compressor = RerankCompressor(
109
+ embedding_function=embedding_function,
110
+ top_n=k,
111
+ reranking_function=reranking_function,
112
+ r_score=r,
113
+ )
114
+
115
+ compression_retriever = ContextualCompressionRetriever(
116
+ base_compressor=compressor, base_retriever=ensemble_retriever
117
+ )
118
+
119
+ result = compression_retriever.invoke(query)
120
+ result = {
121
+ "distances": [[d.metadata.get("score") for d in result]],
122
+ "documents": [[d.page_content for d in result]],
123
+ "metadatas": [[d.metadata for d in result]],
124
+ }
125
+
126
+ log.info(
127
+ "query_doc_with_hybrid_search:result "
128
+ + f'{result["metadatas"]} {result["distances"]}'
129
+ )
130
+ return result
131
+ except Exception as e:
132
+ raise e
133
+
134
+
135
+ def merge_and_sort_query_results(
136
+ query_results: list[dict], k: int, reverse: bool = False
137
+ ) -> list[dict]:
138
+ # Initialize lists to store combined data
139
+ combined_distances = []
140
+ combined_documents = []
141
+ combined_metadatas = []
142
+
143
+ for data in query_results:
144
+ combined_distances.extend(data["distances"][0])
145
+ combined_documents.extend(data["documents"][0])
146
+ combined_metadatas.extend(data["metadatas"][0])
147
+
148
+ # Create a list of tuples (distance, document, metadata)
149
+ combined = list(zip(combined_distances, combined_documents, combined_metadatas))
150
+
151
+ # Sort the list based on distances
152
+ combined.sort(key=lambda x: x[0], reverse=reverse)
153
+
154
+ # We don't have anything :-(
155
+ if not combined:
156
+ sorted_distances = []
157
+ sorted_documents = []
158
+ sorted_metadatas = []
159
+ else:
160
+ # Unzip the sorted list
161
+ sorted_distances, sorted_documents, sorted_metadatas = zip(*combined)
162
+
163
+ # Slicing the lists to include only k elements
164
+ sorted_distances = list(sorted_distances)[:k]
165
+ sorted_documents = list(sorted_documents)[:k]
166
+ sorted_metadatas = list(sorted_metadatas)[:k]
167
+
168
+ # Create the output dictionary
169
+ result = {
170
+ "distances": [sorted_distances],
171
+ "documents": [sorted_documents],
172
+ "metadatas": [sorted_metadatas],
173
+ }
174
+
175
+ return result
176
+
177
+
178
+ def query_collection(
179
+ collection_names: list[str],
180
+ queries: list[str],
181
+ embedding_function,
182
+ k: int,
183
+ ) -> dict:
184
+ results = []
185
+ for query in queries:
186
+ query_embedding = embedding_function(query)
187
+ for collection_name in collection_names:
188
+ if collection_name:
189
+ try:
190
+ result = query_doc(
191
+ collection_name=collection_name,
192
+ k=k,
193
+ query_embedding=query_embedding,
194
+ )
195
+ if result is not None:
196
+ results.append(result.model_dump())
197
+ except Exception as e:
198
+ log.exception(f"Error when querying the collection: {e}")
199
+ else:
200
+ pass
201
+
202
+ return merge_and_sort_query_results(results, k=k)
203
+
204
+
205
+ def query_collection_with_hybrid_search(
206
+ collection_names: list[str],
207
+ queries: list[str],
208
+ embedding_function,
209
+ k: int,
210
+ reranking_function,
211
+ r: float,
212
+ ) -> dict:
213
+ results = []
214
+ error = False
215
+ for collection_name in collection_names:
216
+ try:
217
+ for query in queries:
218
+ result = query_doc_with_hybrid_search(
219
+ collection_name=collection_name,
220
+ query=query,
221
+ embedding_function=embedding_function,
222
+ k=k,
223
+ reranking_function=reranking_function,
224
+ r=r,
225
+ )
226
+ results.append(result)
227
+ except Exception as e:
228
+ log.exception(
229
+ "Error when querying the collection with " f"hybrid_search: {e}"
230
+ )
231
+ error = True
232
+
233
+ if error:
234
+ raise Exception(
235
+ "Hybrid search failed for all collections. Using Non hybrid search as fallback."
236
+ )
237
+
238
+ return merge_and_sort_query_results(results, k=k, reverse=True)
239
+
240
+
241
+ def rag_template(template: str, context: str, query: str):
242
+ if template == "":
243
+ template = DEFAULT_RAG_TEMPLATE
244
+
245
+ if "[context]" not in template and "{{CONTEXT}}" not in template:
246
+ log.debug(
247
+ "WARNING: The RAG template does not contain the '[context]' or '{{CONTEXT}}' placeholder."
248
+ )
249
+
250
+ if "<context>" in context and "</context>" in context:
251
+ log.debug(
252
+ "WARNING: Potential prompt injection attack: the RAG "
253
+ "context contains '<context>' and '</context>'. This might be "
254
+ "nothing, or the user might be trying to hack something."
255
+ )
256
+
257
+ query_placeholders = []
258
+ if "[query]" in context:
259
+ query_placeholder = "{{QUERY" + str(uuid.uuid4()) + "}}"
260
+ template = template.replace("[query]", query_placeholder)
261
+ query_placeholders.append(query_placeholder)
262
+
263
+ if "{{QUERY}}" in context:
264
+ query_placeholder = "{{QUERY" + str(uuid.uuid4()) + "}}"
265
+ template = template.replace("{{QUERY}}", query_placeholder)
266
+ query_placeholders.append(query_placeholder)
267
+
268
+ template = template.replace("[context]", context)
269
+ template = template.replace("{{CONTEXT}}", context)
270
+ template = template.replace("[query]", query)
271
+ template = template.replace("{{QUERY}}", query)
272
+
273
+ for query_placeholder in query_placeholders:
274
+ template = template.replace(query_placeholder, query)
275
+
276
+ return template
277
+
278
+
279
+ def get_embedding_function(
280
+ embedding_engine,
281
+ embedding_model,
282
+ embedding_function,
283
+ url,
284
+ key,
285
+ embedding_batch_size,
286
+ ):
287
+ if embedding_engine == "":
288
+ return lambda query: embedding_function.encode(query).tolist()
289
+ elif embedding_engine in ["ollama", "openai"]:
290
+ func = lambda query: generate_embeddings(
291
+ engine=embedding_engine,
292
+ model=embedding_model,
293
+ text=query,
294
+ url=url,
295
+ key=key,
296
+ )
297
+
298
+ def generate_multiple(query, func):
299
+ if isinstance(query, list):
300
+ embeddings = []
301
+ for i in range(0, len(query), embedding_batch_size):
302
+ embeddings.extend(func(query[i : i + embedding_batch_size]))
303
+ return embeddings
304
+ else:
305
+ return func(query)
306
+
307
+ return lambda query: generate_multiple(query, func)
308
+
309
+
310
+ def get_rag_context(
311
+ files,
312
+ queries,
313
+ embedding_function,
314
+ k,
315
+ reranking_function,
316
+ r,
317
+ hybrid_search,
318
+ ):
319
+ log.debug(f"files: {files} {queries} {embedding_function} {reranking_function}")
320
+
321
+ extracted_collections = []
322
+ relevant_contexts = []
323
+
324
+ for file in files:
325
+ if file.get("context") == "full":
326
+ context = {
327
+ "documents": [[file.get("file").get("data", {}).get("content")]],
328
+ "metadatas": [[{"file_id": file.get("id"), "name": file.get("name")}]],
329
+ }
330
+ else:
331
+ context = None
332
+
333
+ collection_names = []
334
+ if file.get("type") == "collection":
335
+ if file.get("legacy"):
336
+ collection_names = file.get("collection_names", [])
337
+ else:
338
+ collection_names.append(file["id"])
339
+ elif file.get("collection_name"):
340
+ collection_names.append(file["collection_name"])
341
+ elif file.get("id"):
342
+ if file.get("legacy"):
343
+ collection_names.append(f"{file['id']}")
344
+ else:
345
+ collection_names.append(f"file-{file['id']}")
346
+
347
+ collection_names = set(collection_names).difference(extracted_collections)
348
+ if not collection_names:
349
+ log.debug(f"skipping {file} as it has already been extracted")
350
+ continue
351
+
352
+ try:
353
+ context = None
354
+ if file.get("type") == "text":
355
+ context = file["content"]
356
+ else:
357
+ if hybrid_search:
358
+ try:
359
+ context = query_collection_with_hybrid_search(
360
+ collection_names=collection_names,
361
+ queries=queries,
362
+ embedding_function=embedding_function,
363
+ k=k,
364
+ reranking_function=reranking_function,
365
+ r=r,
366
+ )
367
+ except Exception as e:
368
+ log.debug(
369
+ "Error when using hybrid search, using"
370
+ " non hybrid search as fallback."
371
+ )
372
+
373
+ if (not hybrid_search) or (context is None):
374
+ context = query_collection(
375
+ collection_names=collection_names,
376
+ queries=queries,
377
+ embedding_function=embedding_function,
378
+ k=k,
379
+ )
380
+ except Exception as e:
381
+ log.exception(e)
382
+
383
+ extracted_collections.extend(collection_names)
384
+
385
+ if context:
386
+ if "data" in file:
387
+ del file["data"]
388
+ relevant_contexts.append({**context, "file": file})
389
+
390
+ contexts = []
391
+ citations = []
392
+ for context in relevant_contexts:
393
+ try:
394
+ if "documents" in context:
395
+ file_names = list(
396
+ set(
397
+ [
398
+ metadata["name"]
399
+ for metadata in context["metadatas"][0]
400
+ if metadata is not None and "name" in metadata
401
+ ]
402
+ )
403
+ )
404
+ contexts.append(
405
+ ((", ".join(file_names) + ":\n\n") if file_names else "")
406
+ + "\n\n".join(
407
+ [text for text in context["documents"][0] if text is not None]
408
+ )
409
+ )
410
+
411
+ if "metadatas" in context:
412
+ citation = {
413
+ "source": context["file"],
414
+ "document": context["documents"][0],
415
+ "metadata": context["metadatas"][0],
416
+ }
417
+ if "distances" in context and context["distances"]:
418
+ citation["distances"] = context["distances"][0]
419
+ citations.append(citation)
420
+ except Exception as e:
421
+ log.exception(e)
422
+
423
+ print("contexts", contexts)
424
+ print("citations", citations)
425
+
426
+ return contexts, citations
427
+
428
+
429
+ def get_model_path(model: str, update_model: bool = False):
430
+ # Construct huggingface_hub kwargs with local_files_only to return the snapshot path
431
+ cache_dir = os.getenv("SENTENCE_TRANSFORMERS_HOME")
432
+
433
+ local_files_only = not update_model
434
+
435
+ snapshot_kwargs = {
436
+ "cache_dir": cache_dir,
437
+ "local_files_only": local_files_only,
438
+ }
439
+
440
+ log.debug(f"model: {model}")
441
+ log.debug(f"snapshot_kwargs: {snapshot_kwargs}")
442
+
443
+ # Inspiration from upstream sentence_transformers
444
+ if (
445
+ os.path.exists(model)
446
+ or ("\\" in model or model.count("/") > 1)
447
+ and local_files_only
448
+ ):
449
+ # If fully qualified path exists, return input, else set repo_id
450
+ return model
451
+ elif "/" not in model:
452
+ # Set valid repo_id for model short-name
453
+ model = "sentence-transformers" + "/" + model
454
+
455
+ snapshot_kwargs["repo_id"] = model
456
+
457
+ # Attempt to query the huggingface_hub library to determine the local path and/or to update
458
+ try:
459
+ model_repo_path = snapshot_download(**snapshot_kwargs)
460
+ log.debug(f"model_repo_path: {model_repo_path}")
461
+ return model_repo_path
462
+ except Exception as e:
463
+ log.exception(f"Cannot determine model snapshot path: {e}")
464
+ return model
465
+
466
+
467
+ def generate_openai_batch_embeddings(
468
+ model: str, texts: list[str], url: str = "https://api.openai.com/v1", key: str = ""
469
+ ) -> Optional[list[list[float]]]:
470
+ try:
471
+ r = requests.post(
472
+ f"{url}/embeddings",
473
+ headers={
474
+ "Content-Type": "application/json",
475
+ "Authorization": f"Bearer {key}",
476
+ },
477
+ json={"input": texts, "model": model},
478
+ )
479
+ r.raise_for_status()
480
+ data = r.json()
481
+ if "data" in data:
482
+ return [elem["embedding"] for elem in data["data"]]
483
+ else:
484
+ raise "Something went wrong :/"
485
+ except Exception as e:
486
+ print(e)
487
+ return None
488
+
489
+
490
+ def generate_ollama_batch_embeddings(
491
+ model: str, texts: list[str], url: str, key: str
492
+ ) -> Optional[list[list[float]]]:
493
+ try:
494
+ r = requests.post(
495
+ f"{url}/api/embed",
496
+ headers={
497
+ "Content-Type": "application/json",
498
+ "Authorization": f"Bearer {key}",
499
+ },
500
+ json={"input": texts, "model": model},
501
+ )
502
+ r.raise_for_status()
503
+ data = r.json()
504
+
505
+ print(data)
506
+ if "embeddings" in data:
507
+ return data["embeddings"]
508
+ else:
509
+ raise "Something went wrong :/"
510
+ except Exception as e:
511
+ print(e)
512
+ return None
513
+
514
+
515
+ def generate_embeddings(engine: str, model: str, text: Union[str, list[str]], **kwargs):
516
+ url = kwargs.get("url", "")
517
+ key = kwargs.get("key", "")
518
+
519
+ if engine == "ollama":
520
+ if isinstance(text, list):
521
+ embeddings = generate_ollama_batch_embeddings(
522
+ **{"model": model, "texts": text, "url": url, "key": key}
523
+ )
524
+ else:
525
+ embeddings = generate_ollama_batch_embeddings(
526
+ **{"model": model, "texts": [text], "url": url, "key": key}
527
+ )
528
+ return embeddings[0] if isinstance(text, str) else embeddings
529
+ elif engine == "openai":
530
+ if isinstance(text, list):
531
+ embeddings = generate_openai_batch_embeddings(model, text, url, key)
532
+ else:
533
+ embeddings = generate_openai_batch_embeddings(model, [text], url, key)
534
+
535
+ return embeddings[0] if isinstance(text, str) else embeddings
536
+
537
+
538
+ import operator
539
+ from typing import Optional, Sequence
540
+
541
+ from langchain_core.callbacks import Callbacks
542
+ from langchain_core.documents import BaseDocumentCompressor, Document
543
+
544
+
545
+ class RerankCompressor(BaseDocumentCompressor):
546
+ embedding_function: Any
547
+ top_n: int
548
+ reranking_function: Any
549
+ r_score: float
550
+
551
+ class Config:
552
+ extra = "forbid"
553
+ arbitrary_types_allowed = True
554
+
555
+ def compress_documents(
556
+ self,
557
+ documents: Sequence[Document],
558
+ query: str,
559
+ callbacks: Optional[Callbacks] = None,
560
+ ) -> Sequence[Document]:
561
+ reranking = self.reranking_function is not None
562
+
563
+ if reranking:
564
+ scores = self.reranking_function.predict(
565
+ [(query, doc.page_content) for doc in documents]
566
+ )
567
+ else:
568
+ from sentence_transformers import util
569
+
570
+ query_embedding = self.embedding_function(query)
571
+ document_embedding = self.embedding_function(
572
+ [doc.page_content for doc in documents]
573
+ )
574
+ scores = util.cos_sim(query_embedding, document_embedding)[0]
575
+
576
+ docs_with_scores = list(zip(documents, scores.tolist()))
577
+ if self.r_score:
578
+ docs_with_scores = [
579
+ (d, s) for d, s in docs_with_scores if s >= self.r_score
580
+ ]
581
+
582
+ result = sorted(docs_with_scores, key=operator.itemgetter(1), reverse=True)
583
+ final_results = []
584
+ for doc, doc_score in result[: self.top_n]:
585
+ metadata = doc.metadata
586
+ metadata["score"] = doc_score
587
+ doc = Document(
588
+ page_content=doc.page_content,
589
+ metadata=metadata,
590
+ )
591
+ final_results.append(doc)
592
+ return final_results
backend/open_webui/apps/retrieval/vector/connector.py ADDED
@@ -0,0 +1,22 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from open_webui.config import VECTOR_DB
2
+
3
+ if VECTOR_DB == "milvus":
4
+ from open_webui.apps.retrieval.vector.dbs.milvus import MilvusClient
5
+
6
+ VECTOR_DB_CLIENT = MilvusClient()
7
+ elif VECTOR_DB == "qdrant":
8
+ from open_webui.apps.retrieval.vector.dbs.qdrant import QdrantClient
9
+
10
+ VECTOR_DB_CLIENT = QdrantClient()
11
+ elif VECTOR_DB == "opensearch":
12
+ from open_webui.apps.retrieval.vector.dbs.opensearch import OpenSearchClient
13
+
14
+ VECTOR_DB_CLIENT = OpenSearchClient()
15
+ elif VECTOR_DB == "pgvector":
16
+ from open_webui.apps.retrieval.vector.dbs.pgvector import PgvectorClient
17
+
18
+ VECTOR_DB_CLIENT = PgvectorClient()
19
+ else:
20
+ from open_webui.apps.retrieval.vector.dbs.chroma import ChromaClient
21
+
22
+ VECTOR_DB_CLIENT = ChromaClient()
backend/open_webui/apps/retrieval/vector/dbs/chroma.py ADDED
@@ -0,0 +1,174 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import chromadb
2
+ from chromadb import Settings
3
+ from chromadb.utils.batch_utils import create_batches
4
+
5
+ from typing import Optional
6
+
7
+ from open_webui.apps.retrieval.vector.main import VectorItem, SearchResult, GetResult
8
+ from open_webui.config import (
9
+ CHROMA_DATA_PATH,
10
+ CHROMA_HTTP_HOST,
11
+ CHROMA_HTTP_PORT,
12
+ CHROMA_HTTP_HEADERS,
13
+ CHROMA_HTTP_SSL,
14
+ CHROMA_TENANT,
15
+ CHROMA_DATABASE,
16
+ CHROMA_CLIENT_AUTH_PROVIDER,
17
+ CHROMA_CLIENT_AUTH_CREDENTIALS,
18
+ )
19
+
20
+
21
+ class ChromaClient:
22
+ def __init__(self):
23
+ settings_dict = {
24
+ "allow_reset": True,
25
+ "anonymized_telemetry": False,
26
+ }
27
+ if CHROMA_CLIENT_AUTH_PROVIDER is not None:
28
+ settings_dict["chroma_client_auth_provider"] = CHROMA_CLIENT_AUTH_PROVIDER
29
+ if CHROMA_CLIENT_AUTH_CREDENTIALS is not None:
30
+ settings_dict["chroma_client_auth_credentials"] = (
31
+ CHROMA_CLIENT_AUTH_CREDENTIALS
32
+ )
33
+
34
+ if CHROMA_HTTP_HOST != "":
35
+ self.client = chromadb.HttpClient(
36
+ host=CHROMA_HTTP_HOST,
37
+ port=CHROMA_HTTP_PORT,
38
+ headers=CHROMA_HTTP_HEADERS,
39
+ ssl=CHROMA_HTTP_SSL,
40
+ tenant=CHROMA_TENANT,
41
+ database=CHROMA_DATABASE,
42
+ settings=Settings(**settings_dict),
43
+ )
44
+ else:
45
+ self.client = chromadb.PersistentClient(
46
+ path=CHROMA_DATA_PATH,
47
+ settings=Settings(**settings_dict),
48
+ tenant=CHROMA_TENANT,
49
+ database=CHROMA_DATABASE,
50
+ )
51
+
52
+ def has_collection(self, collection_name: str) -> bool:
53
+ # Check if the collection exists based on the collection name.
54
+ collections = self.client.list_collections()
55
+ return collection_name in [collection.name for collection in collections]
56
+
57
+ def delete_collection(self, collection_name: str):
58
+ # Delete the collection based on the collection name.
59
+ return self.client.delete_collection(name=collection_name)
60
+
61
+ def search(
62
+ self, collection_name: str, vectors: list[list[float | int]], limit: int
63
+ ) -> Optional[SearchResult]:
64
+ # Search for the nearest neighbor items based on the vectors and return 'limit' number of results.
65
+ try:
66
+ collection = self.client.get_collection(name=collection_name)
67
+ if collection:
68
+ result = collection.query(
69
+ query_embeddings=vectors,
70
+ n_results=limit,
71
+ )
72
+
73
+ return SearchResult(
74
+ **{
75
+ "ids": result["ids"],
76
+ "distances": result["distances"],
77
+ "documents": result["documents"],
78
+ "metadatas": result["metadatas"],
79
+ }
80
+ )
81
+ return None
82
+ except Exception as e:
83
+ return None
84
+
85
+ def query(
86
+ self, collection_name: str, filter: dict, limit: Optional[int] = None
87
+ ) -> Optional[GetResult]:
88
+ # Query the items from the collection based on the filter.
89
+ try:
90
+ collection = self.client.get_collection(name=collection_name)
91
+ if collection:
92
+ result = collection.get(
93
+ where=filter,
94
+ limit=limit,
95
+ )
96
+
97
+ return GetResult(
98
+ **{
99
+ "ids": [result["ids"]],
100
+ "documents": [result["documents"]],
101
+ "metadatas": [result["metadatas"]],
102
+ }
103
+ )
104
+ return None
105
+ except Exception as e:
106
+ print(e)
107
+ return None
108
+
109
+ def get(self, collection_name: str) -> Optional[GetResult]:
110
+ # Get all the items in the collection.
111
+ collection = self.client.get_collection(name=collection_name)
112
+ if collection:
113
+ result = collection.get()
114
+ return GetResult(
115
+ **{
116
+ "ids": [result["ids"]],
117
+ "documents": [result["documents"]],
118
+ "metadatas": [result["metadatas"]],
119
+ }
120
+ )
121
+ return None
122
+
123
+ def insert(self, collection_name: str, items: list[VectorItem]):
124
+ # Insert the items into the collection, if the collection does not exist, it will be created.
125
+ collection = self.client.get_or_create_collection(
126
+ name=collection_name, metadata={"hnsw:space": "cosine"}
127
+ )
128
+
129
+ ids = [item["id"] for item in items]
130
+ documents = [item["text"] for item in items]
131
+ embeddings = [item["vector"] for item in items]
132
+ metadatas = [item["metadata"] for item in items]
133
+
134
+ for batch in create_batches(
135
+ api=self.client,
136
+ documents=documents,
137
+ embeddings=embeddings,
138
+ ids=ids,
139
+ metadatas=metadatas,
140
+ ):
141
+ collection.add(*batch)
142
+
143
+ def upsert(self, collection_name: str, items: list[VectorItem]):
144
+ # Update the items in the collection, if the items are not present, insert them. If the collection does not exist, it will be created.
145
+ collection = self.client.get_or_create_collection(
146
+ name=collection_name, metadata={"hnsw:space": "cosine"}
147
+ )
148
+
149
+ ids = [item["id"] for item in items]
150
+ documents = [item["text"] for item in items]
151
+ embeddings = [item["vector"] for item in items]
152
+ metadatas = [item["metadata"] for item in items]
153
+
154
+ collection.upsert(
155
+ ids=ids, documents=documents, embeddings=embeddings, metadatas=metadatas
156
+ )
157
+
158
+ def delete(
159
+ self,
160
+ collection_name: str,
161
+ ids: Optional[list[str]] = None,
162
+ filter: Optional[dict] = None,
163
+ ):
164
+ # Delete the items from the collection based on the ids.
165
+ collection = self.client.get_collection(name=collection_name)
166
+ if collection:
167
+ if ids:
168
+ collection.delete(ids=ids)
169
+ elif filter:
170
+ collection.delete(where=filter)
171
+
172
+ def reset(self):
173
+ # Resets the database. This will delete all collections and item entries.
174
+ return self.client.reset()
backend/open_webui/apps/retrieval/vector/dbs/milvus.py ADDED
@@ -0,0 +1,286 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from pymilvus import MilvusClient as Client
2
+ from pymilvus import FieldSchema, DataType
3
+ import json
4
+
5
+ from typing import Optional
6
+
7
+ from open_webui.apps.retrieval.vector.main import VectorItem, SearchResult, GetResult
8
+ from open_webui.config import (
9
+ MILVUS_URI,
10
+ )
11
+
12
+
13
+ class MilvusClient:
14
+ def __init__(self):
15
+ self.collection_prefix = "open_webui"
16
+ self.client = Client(uri=MILVUS_URI)
17
+
18
+ def _result_to_get_result(self, result) -> GetResult:
19
+ ids = []
20
+ documents = []
21
+ metadatas = []
22
+
23
+ for match in result:
24
+ _ids = []
25
+ _documents = []
26
+ _metadatas = []
27
+ for item in match:
28
+ _ids.append(item.get("id"))
29
+ _documents.append(item.get("data", {}).get("text"))
30
+ _metadatas.append(item.get("metadata"))
31
+
32
+ ids.append(_ids)
33
+ documents.append(_documents)
34
+ metadatas.append(_metadatas)
35
+
36
+ return GetResult(
37
+ **{
38
+ "ids": ids,
39
+ "documents": documents,
40
+ "metadatas": metadatas,
41
+ }
42
+ )
43
+
44
+ def _result_to_search_result(self, result) -> SearchResult:
45
+ ids = []
46
+ distances = []
47
+ documents = []
48
+ metadatas = []
49
+
50
+ for match in result:
51
+ _ids = []
52
+ _distances = []
53
+ _documents = []
54
+ _metadatas = []
55
+
56
+ for item in match:
57
+ _ids.append(item.get("id"))
58
+ _distances.append(item.get("distance"))
59
+ _documents.append(item.get("entity", {}).get("data", {}).get("text"))
60
+ _metadatas.append(item.get("entity", {}).get("metadata"))
61
+
62
+ ids.append(_ids)
63
+ distances.append(_distances)
64
+ documents.append(_documents)
65
+ metadatas.append(_metadatas)
66
+
67
+ return SearchResult(
68
+ **{
69
+ "ids": ids,
70
+ "distances": distances,
71
+ "documents": documents,
72
+ "metadatas": metadatas,
73
+ }
74
+ )
75
+
76
+ def _create_collection(self, collection_name: str, dimension: int):
77
+ schema = self.client.create_schema(
78
+ auto_id=False,
79
+ enable_dynamic_field=True,
80
+ )
81
+ schema.add_field(
82
+ field_name="id",
83
+ datatype=DataType.VARCHAR,
84
+ is_primary=True,
85
+ max_length=65535,
86
+ )
87
+ schema.add_field(
88
+ field_name="vector",
89
+ datatype=DataType.FLOAT_VECTOR,
90
+ dim=dimension,
91
+ description="vector",
92
+ )
93
+ schema.add_field(field_name="data", datatype=DataType.JSON, description="data")
94
+ schema.add_field(
95
+ field_name="metadata", datatype=DataType.JSON, description="metadata"
96
+ )
97
+
98
+ index_params = self.client.prepare_index_params()
99
+ index_params.add_index(
100
+ field_name="vector",
101
+ index_type="HNSW",
102
+ metric_type="COSINE",
103
+ params={"M": 16, "efConstruction": 100},
104
+ )
105
+
106
+ self.client.create_collection(
107
+ collection_name=f"{self.collection_prefix}_{collection_name}",
108
+ schema=schema,
109
+ index_params=index_params,
110
+ )
111
+
112
+ def has_collection(self, collection_name: str) -> bool:
113
+ # Check if the collection exists based on the collection name.
114
+ collection_name = collection_name.replace("-", "_")
115
+ return self.client.has_collection(
116
+ collection_name=f"{self.collection_prefix}_{collection_name}"
117
+ )
118
+
119
+ def delete_collection(self, collection_name: str):
120
+ # Delete the collection based on the collection name.
121
+ collection_name = collection_name.replace("-", "_")
122
+ return self.client.drop_collection(
123
+ collection_name=f"{self.collection_prefix}_{collection_name}"
124
+ )
125
+
126
+ def search(
127
+ self, collection_name: str, vectors: list[list[float | int]], limit: int
128
+ ) -> Optional[SearchResult]:
129
+ # Search for the nearest neighbor items based on the vectors and return 'limit' number of results.
130
+ collection_name = collection_name.replace("-", "_")
131
+ result = self.client.search(
132
+ collection_name=f"{self.collection_prefix}_{collection_name}",
133
+ data=vectors,
134
+ limit=limit,
135
+ output_fields=["data", "metadata"],
136
+ )
137
+
138
+ return self._result_to_search_result(result)
139
+
140
+ def query(self, collection_name: str, filter: dict, limit: Optional[int] = None):
141
+ # Construct the filter string for querying
142
+ collection_name = collection_name.replace("-", "_")
143
+ if not self.has_collection(collection_name):
144
+ return None
145
+
146
+ filter_string = " && ".join(
147
+ [
148
+ f'metadata["{key}"] == {json.dumps(value)}'
149
+ for key, value in filter.items()
150
+ ]
151
+ )
152
+
153
+ max_limit = 16383 # The maximum number of records per request
154
+ all_results = []
155
+
156
+ if limit is None:
157
+ limit = float("inf") # Use infinity as a placeholder for no limit
158
+
159
+ # Initialize offset and remaining to handle pagination
160
+ offset = 0
161
+ remaining = limit
162
+
163
+ try:
164
+ # Loop until there are no more items to fetch or the desired limit is reached
165
+ while remaining > 0:
166
+ print("remaining", remaining)
167
+ current_fetch = min(
168
+ max_limit, remaining
169
+ ) # Determine how many items to fetch in this iteration
170
+
171
+ results = self.client.query(
172
+ collection_name=f"{self.collection_prefix}_{collection_name}",
173
+ filter=filter_string,
174
+ output_fields=["*"],
175
+ limit=current_fetch,
176
+ offset=offset,
177
+ )
178
+
179
+ if not results:
180
+ break
181
+
182
+ all_results.extend(results)
183
+ results_count = len(results)
184
+ remaining -= (
185
+ results_count # Decrease remaining by the number of items fetched
186
+ )
187
+ offset += results_count
188
+
189
+ # Break the loop if the results returned are less than the requested fetch count
190
+ if results_count < current_fetch:
191
+ break
192
+
193
+ print(all_results)
194
+ return self._result_to_get_result([all_results])
195
+ except Exception as e:
196
+ print(e)
197
+ return None
198
+
199
+ def get(self, collection_name: str) -> Optional[GetResult]:
200
+ # Get all the items in the collection.
201
+ collection_name = collection_name.replace("-", "_")
202
+ result = self.client.query(
203
+ collection_name=f"{self.collection_prefix}_{collection_name}",
204
+ filter='id != ""',
205
+ )
206
+ return self._result_to_get_result([result])
207
+
208
+ def insert(self, collection_name: str, items: list[VectorItem]):
209
+ # Insert the items into the collection, if the collection does not exist, it will be created.
210
+ collection_name = collection_name.replace("-", "_")
211
+ if not self.client.has_collection(
212
+ collection_name=f"{self.collection_prefix}_{collection_name}"
213
+ ):
214
+ self._create_collection(
215
+ collection_name=collection_name, dimension=len(items[0]["vector"])
216
+ )
217
+
218
+ return self.client.insert(
219
+ collection_name=f"{self.collection_prefix}_{collection_name}",
220
+ data=[
221
+ {
222
+ "id": item["id"],
223
+ "vector": item["vector"],
224
+ "data": {"text": item["text"]},
225
+ "metadata": item["metadata"],
226
+ }
227
+ for item in items
228
+ ],
229
+ )
230
+
231
+ def upsert(self, collection_name: str, items: list[VectorItem]):
232
+ # Update the items in the collection, if the items are not present, insert them. If the collection does not exist, it will be created.
233
+ collection_name = collection_name.replace("-", "_")
234
+ if not self.client.has_collection(
235
+ collection_name=f"{self.collection_prefix}_{collection_name}"
236
+ ):
237
+ self._create_collection(
238
+ collection_name=collection_name, dimension=len(items[0]["vector"])
239
+ )
240
+
241
+ return self.client.upsert(
242
+ collection_name=f"{self.collection_prefix}_{collection_name}",
243
+ data=[
244
+ {
245
+ "id": item["id"],
246
+ "vector": item["vector"],
247
+ "data": {"text": item["text"]},
248
+ "metadata": item["metadata"],
249
+ }
250
+ for item in items
251
+ ],
252
+ )
253
+
254
+ def delete(
255
+ self,
256
+ collection_name: str,
257
+ ids: Optional[list[str]] = None,
258
+ filter: Optional[dict] = None,
259
+ ):
260
+ # Delete the items from the collection based on the ids.
261
+ collection_name = collection_name.replace("-", "_")
262
+ if ids:
263
+ return self.client.delete(
264
+ collection_name=f"{self.collection_prefix}_{collection_name}",
265
+ ids=ids,
266
+ )
267
+ elif filter:
268
+ # Convert the filter dictionary to a string using JSON_CONTAINS.
269
+ filter_string = " && ".join(
270
+ [
271
+ f'metadata["{key}"] == {json.dumps(value)}'
272
+ for key, value in filter.items()
273
+ ]
274
+ )
275
+
276
+ return self.client.delete(
277
+ collection_name=f"{self.collection_prefix}_{collection_name}",
278
+ filter=filter_string,
279
+ )
280
+
281
+ def reset(self):
282
+ # Resets the database. This will delete all collections and item entries.
283
+ collection_names = self.client.list_collections()
284
+ for collection_name in collection_names:
285
+ if collection_name.startswith(self.collection_prefix):
286
+ self.client.drop_collection(collection_name=collection_name)