Compare commits


45 Commits

Author  SHA1        Date                        Message
Weves   36c30a7d94  2023-11-03 00:45:31 -07:00  fix
Weves   4ba37c255a  2023-11-03 00:36:57 -07:00  Fix
Weves   e8eb89f6ed  2023-11-03 00:33:29 -07:00  fix
Weves   aacee9b21a  2023-11-03 00:28:54 -07:00  fix
Weves   4cc0697b66  2023-11-03 00:25:42 -07:00  Standard
Weves   d5d7772524  2023-11-03 00:24:48 -07:00  Complete
Weves   4326866a9d  2023-11-02 21:18:00 -07:00  Add wiki scripts
Weves   609c387e9a  2023-11-02 18:30:18 -07:00  test
Weves   b66a0df069  2023-11-02 16:09:20 -07:00  Change
Weves   46ff75e675  2023-11-02 15:31:42 -07:00  Fix
Weves   279a3a02f8  2023-11-02 15:26:02 -07:00  Fix
Weves   1954164ec4  2023-11-02 15:24:21 -07:00  fix
Weves   c6f08cd1cd  2023-11-02 15:22:30 -07:00  fix
Weves   d9ada5d290  2023-11-02 13:44:06 -07:00  fix percentiles
Weves   0a1fdb80db  2023-11-02 13:28:22 -07:00  Fix
Weves   e94d753821  2023-11-02 13:23:06 -07:00  Add percentiles
Weves   8e81b935d1  2023-11-02 13:07:56 -07:00  Fix
Weves   17866dcf8b  2023-11-01 23:38:53 -07:00  tesT
Weves   b427fac6d7  2023-11-01 23:29:05 -07:00  50
Weves   9652af82fe  2023-11-01 23:22:20 -07:00  test
Weves   340f703ff5  2023-11-01 23:20:55 -07:00  test
Weves   8de8c00531  2023-11-01 23:14:56 -07:00  test
Weves   d82bd97dd4  2023-11-01 23:13:20 -07:00  Fix
Weves   39341516ab  2023-11-01 22:45:08 -07:00  Simplify query
Weves   54f5248eb1  2023-11-01 22:42:31 -07:00  Fix
Weves   97412c9b7a  2023-11-01 22:42:31 -07:00  Remove summary
Weves   2f770264c8  2023-11-01 22:42:31 -07:00  Add randomly generated sentences
Weves   8777749646  2023-11-01 22:42:31 -07:00  Disable filters
Weves   22d7427e45  2023-11-01 22:42:31 -07:00  adjust vespa fields
Weves   f4e80c9f22  2023-11-01 22:42:31 -07:00  Configure threads per search
Weves   cb06cf7481  2023-11-01 22:42:31 -07:00  make search profile configurable
Weves   0635a81d5e  2023-11-01 22:42:31 -07:00  Back to old bank
Weves   437c5856d0  2023-11-01 22:42:31 -07:00  Add back summary
Weves   1a58ad4276  2023-11-01 22:42:31 -07:00  Add embedding
Weves   a9e0967771  2023-11-01 22:42:31 -07:00  Hyrbrid
Weves   da81e843d2  2023-11-01 22:42:31 -07:00  Remove content summary
Weves   34980974ac  2023-11-01 22:42:31 -07:00  Isolate vespa
Weves   61ea59affc  2023-11-01 22:42:31 -07:00  Add more questions
Weves   83d5d49323  2023-11-01 22:42:31 -07:00  add logging
Weves   ca397c3121  2023-11-01 22:42:31 -07:00  Add more logging
Weves   d2f3e0165a  2023-11-01 22:42:31 -07:00  Adjust num to retrieve
Weves   90398f5e56  2023-11-01 22:42:31 -07:00  Adjust timeout across the board
Weves   7c2c5563e3  2023-11-01 22:42:31 -07:00  Handle empty blurb + adjust timeout
Weves   99df68f5ac  2023-11-01 22:42:31 -07:00  Adjust script
Weves   ebec047aa5  2023-11-01 22:42:31 -07:00  Benchmarking script
1152 changed files with 22578 additions and 115145 deletions


@@ -1,25 +0,0 @@
## Description
[Provide a brief description of the changes in this PR]
## How Has This Been Tested?
[Describe the tests you ran to verify your changes]
## Accepted Risk
[Any known risks or failure modes to point out to reviewers]
## Related Issue(s)
[If applicable, link to the issue(s) this PR addresses]
## Checklist:
- [ ] All of the automated tests pass
- [ ] All PR comments are addressed and marked resolved
- [ ] If there are migrations, they have been rebased to latest main
- [ ] If there are new dependencies, they are added to the requirements
- [ ] If there are new environment variables, they are added to all of the deployment methods
- [ ] If there are new APIs that don't require auth, they are added to PUBLIC_ENDPOINT_SPECS
- [ ] Docker images build and basic functionalities work
- [ ] Author has done a final read through of the PR right before merge


@@ -1,33 +0,0 @@
name: Build Backend Image on Merge Group
on:
merge_group:
types: [checks_requested]
env:
REGISTRY_IMAGE: danswer/danswer-backend
jobs:
build:
# TODO: make this a matrix build like the web containers
runs-on:
group: amd64-image-builders
steps:
- name: Checkout code
uses: actions/checkout@v2
- name: Set up Docker Buildx
uses: docker/setup-buildx-action@v3
- name: Backend Image Docker Build
uses: docker/build-push-action@v5
with:
context: ./backend
file: ./backend/Dockerfile
platforms: linux/amd64,linux/arm64
push: false
tags: |
${{ env.REGISTRY_IMAGE }}:latest
build-args: |
DANSWER_VERSION=v0.0.1
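
To sanity-check this merge-group build outside CI, a rough local equivalent with `docker buildx` might look like the sketch below. This is an assumption, not part of the diff: it presumes the buildx plugin is available and, for the arm64 half, a QEMU/binfmt setup; the `amd64-image-builders` runner group above is CI-only.

```bash
# Approximate local run of the merge-group backend build (no push, matching the workflow).
docker buildx build \
  --platform linux/amd64,linux/arm64 \
  --file ./backend/Dockerfile \
  --build-arg DANSWER_VERSION=v0.0.1 \
  --tag danswer/danswer-backend:latest \
  ./backend
```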


@@ -1,49 +1,34 @@
name: Build and Push Backend Image on Tag
name: Build and Push Backend Images on Tagging
on:
push:
tags:
- '*'
env:
REGISTRY_IMAGE: danswer/danswer-backend
jobs:
build-and-push:
# TODO: make this a matrix build like the web containers
runs-on:
group: amd64-image-builders
runs-on: ubuntu-latest
steps:
- name: Checkout code
uses: actions/checkout@v2
- name: Set up Docker Buildx
uses: docker/setup-buildx-action@v3
uses: docker/setup-buildx-action@v1
- name: Login to Docker Hub
uses: docker/login-action@v3
uses: docker/login-action@v1
with:
username: ${{ secrets.DOCKER_USERNAME }}
password: ${{ secrets.DOCKER_TOKEN }}
- name: Backend Image Docker Build and Push
uses: docker/build-push-action@v5
uses: docker/build-push-action@v2
with:
context: ./backend
file: ./backend/Dockerfile
platforms: linux/amd64,linux/arm64
push: true
tags: |
${{ env.REGISTRY_IMAGE }}:${{ github.ref_name }}
${{ env.REGISTRY_IMAGE }}:latest
build-args: |
DANSWER_VERSION=${{ github.ref_name }}
- name: Run Trivy vulnerability scanner
uses: aquasecurity/trivy-action@master
with:
# To run locally: trivy image --severity HIGH,CRITICAL danswer/danswer-backend
image-ref: docker.io/${{ env.REGISTRY_IMAGE }}:${{ github.ref_name }}
severity: 'CRITICAL,HIGH'
trivyignores: ./backend/.trivyignore
danswer/danswer-backend:${{ github.ref_name }}
danswer/danswer-backend:latest


@@ -1,43 +0,0 @@
name: Build and Push Model Server Image on Tag
on:
push:
tags:
- '*'
jobs:
build-and-push:
runs-on:
group: amd64-image-builders
steps:
- name: Checkout code
uses: actions/checkout@v2
- name: Set up Docker Buildx
uses: docker/setup-buildx-action@v3
- name: Login to Docker Hub
uses: docker/login-action@v3
with:
username: ${{ secrets.DOCKER_USERNAME }}
password: ${{ secrets.DOCKER_TOKEN }}
- name: Model Server Image Docker Build and Push
uses: docker/build-push-action@v5
with:
context: ./backend
file: ./backend/Dockerfile.model_server
platforms: linux/amd64,linux/arm64
push: true
tags: |
danswer/danswer-model-server:${{ github.ref_name }}
danswer/danswer-model-server:latest
build-args: |
DANSWER_VERSION=${{ github.ref_name }}
- name: Run Trivy vulnerability scanner
uses: aquasecurity/trivy-action@master
with:
image-ref: docker.io/danswer/danswer-model-server:${{ github.ref_name }}
severity: 'CRITICAL,HIGH'


@@ -1,119 +1,34 @@
name: Build and Push Web Image on Tag
name: Build and Push Web Images on Tagging
on:
push:
tags:
- '*'
env:
REGISTRY_IMAGE: danswer/danswer-web-server
jobs:
build:
runs-on:
group: ${{ matrix.platform == 'linux/amd64' && 'amd64-image-builders' || 'arm64-image-builders' }}
strategy:
fail-fast: false
matrix:
platform:
- linux/amd64
- linux/arm64
steps:
- name: Prepare
run: |
platform=${{ matrix.platform }}
echo "PLATFORM_PAIR=${platform//\//-}" >> $GITHUB_ENV
- name: Checkout
uses: actions/checkout@v4
- name: Docker meta
id: meta
uses: docker/metadata-action@v5
with:
images: ${{ env.REGISTRY_IMAGE }}
tags: |
type=raw,value=${{ env.REGISTRY_IMAGE }}:${{ github.ref_name }}
type=raw,value=${{ env.REGISTRY_IMAGE }}:latest
- name: Set up Docker Buildx
uses: docker/setup-buildx-action@v3
- name: Login to Docker Hub
uses: docker/login-action@v3
with:
username: ${{ secrets.DOCKER_USERNAME }}
password: ${{ secrets.DOCKER_TOKEN }}
- name: Build and push by digest
id: build
uses: docker/build-push-action@v5
with:
context: ./web
file: ./web/Dockerfile
platforms: ${{ matrix.platform }}
push: true
build-args: |
DANSWER_VERSION=${{ github.ref_name }}
# needed due to weird interactions with the builds for different platforms
no-cache: true
labels: ${{ steps.meta.outputs.labels }}
outputs: type=image,name=${{ env.REGISTRY_IMAGE }},push-by-digest=true,name-canonical=true,push=true
- name: Export digest
run: |
mkdir -p /tmp/digests
digest="${{ steps.build.outputs.digest }}"
touch "/tmp/digests/${digest#sha256:}"
- name: Upload digest
uses: actions/upload-artifact@v4
with:
name: digests-${{ env.PLATFORM_PAIR }}
path: /tmp/digests/*
if-no-files-found: error
retention-days: 1
merge:
build-and-push:
runs-on: ubuntu-latest
needs:
- build
steps:
- name: Download digests
uses: actions/download-artifact@v4
with:
path: /tmp/digests
pattern: digests-*
merge-multiple: true
- name: Set up Docker Buildx
uses: docker/setup-buildx-action@v3
- name: Docker meta
id: meta
uses: docker/metadata-action@v5
with:
images: ${{ env.REGISTRY_IMAGE }}
- name: Login to Docker Hub
uses: docker/login-action@v3
with:
username: ${{ secrets.DOCKER_USERNAME }}
password: ${{ secrets.DOCKER_TOKEN }}
- name: Create manifest list and push
working-directory: /tmp/digests
run: |
docker buildx imagetools create $(jq -cr '.tags | map("-t " + .) | join(" ")' <<< "$DOCKER_METADATA_OUTPUT_JSON") \
$(printf '${{ env.REGISTRY_IMAGE }}@sha256:%s ' *)
- name: Inspect image
run: |
docker buildx imagetools inspect ${{ env.REGISTRY_IMAGE }}:${{ steps.meta.outputs.version }}
- name: Run Trivy vulnerability scanner
uses: aquasecurity/trivy-action@master
with:
image-ref: docker.io/${{ env.REGISTRY_IMAGE }}:${{ github.ref_name }}
severity: 'CRITICAL,HIGH'
steps:
- name: Checkout code
uses: actions/checkout@v2
- name: Set up Docker Buildx
uses: docker/setup-buildx-action@v1
- name: Login to Docker Hub
uses: docker/login-action@v1
with:
username: ${{ secrets.DOCKER_USERNAME }}
password: ${{ secrets.DOCKER_TOKEN }}
- name: Web Image Docker Build and Push
uses: docker/build-push-action@v2
with:
context: ./web
file: ./web/Dockerfile
platforms: linux/amd64,linux/arm64
push: true
tags: |
danswer/danswer-web-server:${{ github.ref_name }}
danswer/danswer-web-server:latest
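
The removed (left-hand) version of this workflow splits the build into per-platform jobs that push by digest, then merges the digests into one manifest list. Stripped of the CI plumbing, the merge step amounts to roughly the sketch below; the digests and the `v0.0.1` tag are placeholders, not values from this diff.

```bash
# Hypothetical per-platform digests produced by the build jobs.
AMD64_DIGEST="sha256:aaaa..."
ARM64_DIGEST="sha256:bbbb..."

# Stitch both images into a single multi-arch manifest list.
docker buildx imagetools create \
  -t danswer/danswer-web-server:v0.0.1 \
  -t danswer/danswer-web-server:latest \
  "danswer/danswer-web-server@${AMD64_DIGEST}" \
  "danswer/danswer-web-server@${ARM64_DIGEST}"

# Confirm the resulting manifest lists both platforms.
docker buildx imagetools inspect danswer/danswer-web-server:v0.0.1
```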


@@ -1,53 +0,0 @@
name: Build Web Image on Merge Group
on:
merge_group:
types: [checks_requested]
env:
REGISTRY_IMAGE: danswer/danswer-web-server
jobs:
build:
runs-on:
group: ${{ matrix.platform == 'linux/amd64' && 'amd64-image-builders' || 'arm64-image-builders' }}
strategy:
fail-fast: false
matrix:
platform:
- linux/amd64
- linux/arm64
steps:
- name: Prepare
run: |
platform=${{ matrix.platform }}
echo "PLATFORM_PAIR=${platform//\//-}" >> $GITHUB_ENV
- name: Checkout
uses: actions/checkout@v4
- name: Docker meta
id: meta
uses: docker/metadata-action@v5
with:
images: ${{ env.REGISTRY_IMAGE }}
tags: |
type=raw,value=${{ env.REGISTRY_IMAGE }}:latest
- name: Set up Docker Buildx
uses: docker/setup-buildx-action@v3
- name: Build by digest
id: build
uses: docker/build-push-action@v5
with:
context: ./web
file: ./web/Dockerfile
platforms: ${{ matrix.platform }}
push: false
build-args: |
DANSWER_VERSION=v0.0.1
# needed due to weird interactions with the builds for different platforms
no-cache: true
labels: ${{ steps.meta.outputs.labels }}


@@ -20,12 +20,10 @@ jobs:
cache-dependency-path: |
backend/requirements/default.txt
backend/requirements/dev.txt
backend/requirements/model_server.txt
- run: |
python -m pip install --upgrade pip
pip install -r backend/requirements/default.txt
pip install -r backend/requirements/dev.txt
pip install -r backend/requirements/model_server.txt
- name: Run MyPy
run: |


@@ -1,35 +0,0 @@
name: Python Unit Tests
on:
pull_request:
branches: [ main ]
jobs:
backend-check:
runs-on: ubuntu-latest
env:
PYTHONPATH: ./backend
steps:
- name: Checkout code
uses: actions/checkout@v4
- name: Set up Python
uses: actions/setup-python@v4
with:
python-version: '3.11'
cache: 'pip'
cache-dependency-path: |
backend/requirements/default.txt
backend/requirements/dev.txt
- name: Install Dependencies
run: |
python -m pip install --upgrade pip
pip install -r backend/requirements/default.txt
pip install -r backend/requirements/dev.txt
- name: Run Tests
shell: script -q -e -c "bash --noprofile --norc -eo pipefail {0}"
run: py.test -o junit_family=xunit2 -xv --ff backend/tests/unit
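
The same suite can be reproduced locally. Assuming a venv with `default.txt` and `dev.txt` installed (as in the workflow above), the CI invocation maps to:

```bash
# Mirror the CI unit-test run from the repo root.
PYTHONPATH=./backend py.test -o junit_family=xunit2 -xv --ff backend/tests/unit
```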


@@ -1,21 +0,0 @@
name: Quality Checks PR
concurrency:
group: Quality-Checks-PR-${{ github.head_ref }}
cancel-in-progress: true
on:
pull_request: null
jobs:
quality-checks:
runs-on: ubuntu-latest
steps:
- uses: actions/checkout@v4
with:
fetch-depth: 0
- uses: actions/setup-python@v5
with:
python-version: '3.11'
- uses: pre-commit/action@v3.0.0
with:
extra_args: --from-ref ${{ github.event.pull_request.base.sha }} --to-ref ${{ github.event.pull_request.head.sha }}
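
To approximate this check before opening a PR, the same hooks can be run locally over just a branch's changes. A sketch, assuming hooks were set up via `pre-commit install` and `main` is the base branch:

```bash
# Run the configured pre-commit hooks against everything changed relative to main.
pre-commit run --from-ref origin/main --to-ref HEAD
```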

.gitignore

@@ -1,9 +1,3 @@
.env
.DS_store
.venv
.mypy_cache
.idea
/deployment/data/nginx/app.conf
.vscode/launch.json
*.sw?
/backend/tests/regression/answer_quality/search_test_config.yaml
.venv


@@ -1,52 +0,0 @@
# Copy this file to .env at the base of the repo and fill in the <REPLACE THIS> values
# This will help with development iteration speed and reduce repeat tasks for dev
# Also check out danswer/backend/scripts/restart_containers.sh for a script to restart the containers which Danswer relies on outside of VSCode/Cursor processes
# For local dev, often user Authentication is not needed
AUTH_TYPE=disabled
# Always keep these on for Dev
# Logs all model prompts to stdout
LOG_DANSWER_MODEL_INTERACTIONS=True
# More verbose logging
LOG_LEVEL=debug
# This passes the top N results to the LLM an additional time for reranking prior to answer generation
# This step is quite heavy on token usage so we disable it for dev generally
DISABLE_LLM_DOC_RELEVANCE=True
# Useful if you want to toggle auth on/off (google_oauth/OIDC specifically)
OAUTH_CLIENT_ID=<REPLACE THIS>
OAUTH_CLIENT_SECRET=<REPLACE THIS>
# Generally not useful for dev, we don't generally want to set up an SMTP server for dev
REQUIRE_EMAIL_VERIFICATION=False
# Set these so if you wipe the DB, you don't end up having to go through the UI every time
GEN_AI_API_KEY=<REPLACE THIS>
# If answer quality isn't important for dev, use 3.5 turbo due to it being cheaper
GEN_AI_MODEL_VERSION=gpt-3.5-turbo
FAST_GEN_AI_MODEL_VERSION=gpt-3.5-turbo
# For Danswer Slack Bot, overrides the UI values so no need to set this up via UI every time
# Only needed if using DanswerBot
#DANSWER_BOT_SLACK_APP_TOKEN=<REPLACE THIS>
#DANSWER_BOT_SLACK_BOT_TOKEN=<REPLACE THIS>
# Python stuff
PYTHONPATH=./backend
PYTHONUNBUFFERED=1
# Internet Search
BING_API_KEY=<REPLACE THIS>
# Enable the full set of Danswer Enterprise Edition features
# NOTE: DO NOT ENABLE THIS UNLESS YOU HAVE A PAID ENTERPRISE LICENSE (or if you are using this for local testing/development)
ENABLE_PAID_ENTERPRISE_EDITION_FEATURES=False
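
These values are normally picked up through the `envFile` entries in the VSCode launch configurations below. For a plain shell session, one common way to load them (generic bash, not Danswer-specific) is:

```bash
# Export every assignment in .env into the current shell.
set -a
source .env
set +a
```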


@@ -11,135 +11,72 @@
// For more information, visit: https://go.microsoft.com/fwlink/?linkid=830387
"version": "0.2.0",
"configurations": [
{
"name": "Web Server",
"type": "node",
"request": "launch",
"cwd": "${workspaceRoot}/web",
"runtimeExecutable": "npm",
"envFile": "${workspaceFolder}/.env",
"runtimeArgs": [
"run", "dev"
],
"console": "integratedTerminal"
},
{
"name": "Model Server",
"type": "python",
"request": "launch",
"module": "uvicorn",
"cwd": "${workspaceFolder}/backend",
"envFile": "${workspaceFolder}/.env",
"env": {
"LOG_LEVEL": "DEBUG",
"PYTHONUNBUFFERED": "1"
},
"args": [
"model_server.main:app",
"--reload",
"--port",
"9000"
],
"consoleTitle": "Model Server"
},
{
"name": "API Server",
"type": "python",
"request": "launch",
"module": "uvicorn",
"cwd": "${workspaceFolder}/backend",
"envFile": "${workspaceFolder}/.env",
"env": {
"LOG_DANSWER_MODEL_INTERACTIONS": "True",
"LOG_LEVEL": "DEBUG",
"PYTHONUNBUFFERED": "1"
"DISABLE_AUTH": "True",
"TYPESENSE_API_KEY": "typesense_api_key",
"DYNAMIC_CONFIG_DIR_PATH": "./dynamic_config_storage"
},
"args": [
"danswer.main:app",
"--reload",
"--port",
"8080"
],
"consoleTitle": "API Server"
]
},
{
"name": "Indexing",
"name": "Indexer",
"type": "python",
"request": "launch",
"program": "danswer/background/update.py",
"cwd": "${workspaceFolder}/backend",
"envFile": "${workspaceFolder}/.env",
"env": {
"ENABLE_MULTIPASS_INDEXING": "false",
"LOG_LEVEL": "DEBUG",
"PYTHONUNBUFFERED": "1",
"PYTHONPATH": "."
},
"consoleTitle": "Indexing"
"PYTHONPATH": ".",
"TYPESENSE_API_KEY": "typesense_api_key",
"DYNAMIC_CONFIG_DIR_PATH": "./dynamic_config_storage"
}
},
// Celery and all async jobs; this would usually include indexing as well, but indexing is handled separately above for dev
{
"name": "Background Jobs",
"name": "Temp File Deletion",
"type": "python",
"request": "launch",
"program": "scripts/dev_run_background_jobs.py",
"program": "danswer/background/file_deletion.py",
"cwd": "${workspaceFolder}/backend",
"envFile": "${workspaceFolder}/.env",
"env": {
"LOG_DANSWER_MODEL_INTERACTIONS": "True",
"LOG_LEVEL": "DEBUG",
"PYTHONUNBUFFERED": "1",
"PYTHONPATH": "."
},
"args": [
"--no-indexing"
],
"consoleTitle": "Background Jobs"
"PYTHONPATH": "${workspaceFolder}/backend"
}
},
// For the listener to access the Slack API,
// DANSWER_BOT_SLACK_APP_TOKEN & DANSWER_BOT_SLACK_BOT_TOKEN need to be set in .env file located in the root of the project
{
"name": "Slack Bot",
"name": "Slack Bot Listener",
"type": "python",
"request": "launch",
"program": "danswer/danswerbot/slack/listener.py",
"program": "danswer/listeners/slack_listener.py",
"cwd": "${workspaceFolder}/backend",
"envFile": "${workspaceFolder}/.env",
"env": {
"LOG_LEVEL": "DEBUG",
"PYTHONUNBUFFERED": "1",
"PYTHONPATH": "."
"LOG_LEVEL": "DEBUG"
}
},
{
"name": "Pytest",
"type": "python",
"name": "Web Server",
"type": "node",
"request": "launch",
"module": "pytest",
"cwd": "${workspaceFolder}/backend",
"envFile": "${workspaceFolder}/.env",
"env": {
"LOG_LEVEL": "DEBUG",
"PYTHONUNBUFFERED": "1",
"PYTHONPATH": "."
},
"args": [
"-v"
// Specify a specific module/test to run, or provide nothing to run all tests
//"tests/unit/danswer/llm/answering/test_prune_and_merge.py"
]
}
],
"compounds": [
{
"name": "Run Danswer",
"configurations": [
"Web Server",
"Model Server",
"API Server",
"Indexing",
"Background Jobs",
]
"cwd": "${workspaceRoot}/web",
"runtimeExecutable": "npm",
"runtimeArgs": [
"run", "dev"
],
"console": "integratedTerminal"
}
]
}
}


@@ -1,5 +1,3 @@
<!-- DANSWER_METADATA={"link": "https://github.com/danswer-ai/danswer/blob/main/CONTRIBUTING.md"} -->
# Contributing to Danswer
Hey there! We are so excited that you're interested in Danswer.
@@ -22,7 +20,7 @@ Your input is vital to making sure that Danswer moves in the right direction.
Before starting on implementation, please raise a GitHub issue.
And always feel free to message us (Chris Weaver / Yuhong Sun) on
[Slack](https://join.slack.com/t/danswer/shared_invite/zt-2afut44lv-Rw3kSWu6_OmdAXRpCv80DQ) /
[Slack](https://join.slack.com/t/danswer/shared_invite/zt-1u3h3ke3b-VGh1idW19R8oiNRiKBYv2w) /
[Discord](https://discord.gg/TDJ59cGV2X) directly about anything at all.
@@ -40,7 +38,7 @@ Our goal is to make contributing as easy as possible. If you run into any issues
That way we can help future contributors and users can avoid the same issue.
We also have support channels and generally interesting discussions on our
[Slack](https://join.slack.com/t/danswer/shared_invite/zt-2afut44lv-Rw3kSWu6_OmdAXRpCv80DQ)
[Slack](https://join.slack.com/t/danswer/shared_invite/zt-1u3h3ke3b-VGh1idW19R8oiNRiKBYv2w)
and
[Discord](https://discord.gg/TDJ59cGV2X).
@@ -58,10 +56,9 @@ development purposes but also feel free to just use the containers and update wi
### Local Set Up
It is recommended to use Python version 3.11
It is recommended to use Python versions >= 3.11.
If using a lower version, modifications will have to be made to the code.
If using a higher version, the version of Tensorflow we use may not be available for your platform.
This guide skips setting up User Authentication for the purpose of simplicity
#### Installing Requirements
@@ -72,24 +69,15 @@ For convenience here's a command for it:
python -m venv .venv
source .venv/bin/activate
```
--> Note that this virtual environment MUST NOT be set up WITHIN the danswer
directory
_For Windows, activate the virtual environment using Command Prompt:_
_For Windows activate via:_
```bash
.venv\Scripts\activate
```
If using PowerShell, the command slightly differs:
```powershell
.venv\Scripts\Activate.ps1
```
Install the required python dependencies:
```bash
pip install -r danswer/backend/requirements/default.txt
pip install -r danswer/backend/requirements/dev.txt
pip install -r danswer/backend/requirements/model_server.txt
```
Install [Node.js and npm](https://docs.npmjs.com/downloading-and-installing-node-js-and-npm) for the frontend.
@@ -98,12 +86,7 @@ Once the above is done, navigate to `danswer/web` run:
npm i
```
Install Playwright (required by the Web Connector)
> Note: If you have just done the pip install, open a new terminal and source the python virtual-env again.
This will update the path to include playwright
Then install Playwright by running:
Install Playwright (required by the Web Connector), with the python venv active, run:
```bash
playwright install
```
@@ -117,24 +100,26 @@ docker compose -f docker-compose.dev.yml -p danswer-stack up -d index relational
(index refers to Vespa and relational_db refers to Postgres)
#### Running Danswer
Setup a folder to store config. Navigate to `danswer/backend` and run:
```bash
mkdir dynamic_config_storage
```
To start the frontend, navigate to `danswer/web` and run:
```bash
npm run dev
```
Next, start the model server which runs the local NLP models.
Navigate to `danswer/backend` and run:
```bash
uvicorn model_server.main:app --reload --port 9000
```
_For Windows (for compatibility with both PowerShell and Command Prompt):_
```bash
powershell -Command "
uvicorn model_server.main:app --reload --port 9000
"
```
Package the Vespa schema. This will only need to be done when the Vespa schema is updated locally.
The first time running Danswer, you will need to run the DB migrations for Postgres.
Navigate to `danswer/backend/danswer/document_index/vespa/app_config` and run:
```bash
zip -r ../vespa-app.zip .
```
- Note: If you don't have the `zip` utility, you will need to install it prior to running the above
The first time running Danswer, you will also need to run the DB migrations for Postgres.
After the first time, this is no longer required unless the DB models change.
Navigate to `danswer/backend` and with the venv active, run:
@@ -152,12 +137,17 @@ python ./scripts/dev_run_background_jobs.py
To run the backend API server, navigate back to `danswer/backend` and run:
```bash
AUTH_TYPE=disabled uvicorn danswer.main:app --reload --port 8080
AUTH_TYPE=disabled \
DYNAMIC_CONFIG_DIR_PATH=./dynamic_config_storage \
VESPA_DEPLOYMENT_ZIP=./danswer/document_index/vespa/vespa-app.zip \
uvicorn danswer.main:app --reload --port 8080
```
_For Windows (for compatibility with both PowerShell and Command Prompt):_
```bash
powershell -Command "
$env:AUTH_TYPE='disabled'
$env:DYNAMIC_CONFIG_DIR_PATH='./dynamic_config_storage'
$env:VESPA_DEPLOYMENT_ZIP='./danswer/document_index/vespa/vespa-app.zip'
uvicorn danswer.main:app --reload --port 8080
"
```
@@ -176,16 +166,20 @@ pre-commit install
Additionally, we use `mypy` for static type checking.
Danswer is fully type-annotated, and we would like to keep it that way!
To run the mypy checks manually, run `python -m mypy .` from the `danswer/backend` directory.
There is no automated type checking at the moment (coming soon), but we ask you to manually run it before
creating a pull request with `python -m mypy .` from the `danswer/backend` directory.
#### Web
We use `prettier` for formatting. The desired version (2.8.8) will be installed via a `npm i` from the `danswer/web` directory.
To run the formatter, use `npx prettier --write .` from the `danswer/web` directory.
Please double check that prettier passes before creating a pull request.
Like `mypy`, we have no automated formatting yet (coming soon), but we request that, for now,
you run this manually before creating a pull request.
### Release Process
Danswer follows the semver versioning standard.
A set of Docker containers will be pushed automatically to DockerHub with every tag.
You can see the containers [here](https://hub.docker.com/search?q=danswer%2F).
As pre-1.0 software, even patch releases may contain breaking or non-backwards-compatible changes.
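
Tying this back to the tag-triggered workflows earlier in this diff: they fire on any pushed tag, so cutting a release presumably reduces to tagging and pushing (the version number below is illustrative):

```bash
# Tag the release commit and push the tag; the "Build and Push ... on Tag"
# workflows then publish the versioned and :latest images to DockerHub.
git tag v0.0.1
git push origin v0.0.1
```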


@@ -1,10 +1,6 @@
Copyright (c) 2023-present DanswerAI, Inc.
MIT License
Portions of this software are licensed as follows:
* All content that resides under "ee" directories of this repository, if that directory exists, is licensed under the license defined in "backend/ee/LICENSE". Specifically all content under "backend/ee" and "web/src/app/ee" is licensed under the license defined in "backend/ee/LICENSE".
* All third party components incorporated into the Danswer Software are licensed under the original license provided by the owner of the applicable component.
* Content outside of the above mentioned directories or restrictions above is available under the "MIT Expat" license as defined below.
Copyright (c) 2023 Yuhong Sun, Chris Weaver
Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the "Software"), to deal

README.md

@@ -1,17 +1,15 @@
<!-- DANSWER_METADATA={"link": "https://github.com/danswer-ai/danswer/blob/main/README.md"} -->
<h2 align="center">
<a href="https://www.danswer.ai/"> <img width="50%" src="https://github.com/danswer-owners/danswer/blob/1fabd9372d66cd54238847197c33f091a724803b/DanswerWithName.png?raw=true)" /></a>
</h2>
<p align="center">
<p align="center">Open Source Gen-AI Chat + Unified Search.</p>
<p align="center">OpenSource Enterprise Question-Answering</p>
<p align="center">
<a href="https://docs.danswer.dev/" target="_blank">
<img src="https://img.shields.io/badge/docs-view-blue" alt="Documentation">
</a>
<a href="https://join.slack.com/t/danswer/shared_invite/zt-2lcmqw703-071hBuZBfNEOGUsLa5PXvQ" target="_blank">
<a href="https://join.slack.com/t/danswer/shared_invite/zt-1u5ycen3o-6SJbWfivLWP5LPyp_jftuw" target="_blank">
<img src="https://img.shields.io/badge/slack-join-blue.svg?logo=slack" alt="Slack">
</a>
<a href="https://discord.gg/TDJ59cGV2X" target="_blank">
@@ -22,108 +20,62 @@
</a>
</p>
<strong>[Danswer](https://www.danswer.ai/)</strong> is the AI Assistant connected to your company's docs, apps, and people.
Danswer provides a Chat interface and plugs into any LLM of your choice. Danswer can be deployed anywhere and for any
scale - on a laptop, on-premise, or to cloud. Since you own the deployment, your user data and chats are fully in your
own control. Danswer is MIT licensed and designed to be modular and easily extensible. The system also comes fully ready
for production usage with user authentication, role management (admin/basic users), chat persistence, and a UI for
configuring Personas (AI Assistants) and their Prompts.
Danswer also serves as a Unified Search across all common workplace tools such as Slack, Google Drive, Confluence, etc.
By combining LLMs and team specific knowledge, Danswer becomes a subject matter expert for the team. Imagine ChatGPT if
it had access to your team's unique knowledge! It enables questions such as "A customer wants feature X, is this already
supported?" or "Where's the pull request for feature Y?"
<strong>[Danswer](https://www.danswer.ai/)</strong> allows you to ask natural language questions against internal documents and get back reliable answers backed by quotes and references from the source material so that you can always trust what you get back. You can connect to a number of common tools such as Slack, GitHub, Confluence, amongst others.
<h3>Usage</h3>
Danswer Web App:
https://github.com/danswer-ai/danswer/assets/32520769/563be14c-9304-47b5-bf0a-9049c2b6f410
Danswer provides a fully-featured web UI:
Or, plug Danswer into your existing Slack workflows (more integrations to come 😁):
https://github.com/danswer-ai/danswer/assets/25087905/619607a1-4ad2-41a0-9728-351752acc26e
Or, if you prefer, you can plug Danswer into your existing Slack workflows (more integrations to come 😁):
https://github.com/danswer-ai/danswer/assets/25087905/3e19739b-d178-4371-9a38-011430bdec1b
For more details on the Admin UI to manage connectors and users, check out our
<strong><a href="https://www.youtube.com/watch?v=geNzY1nbCnU">Full Video Demo</a></strong>!
For more details on the admin controls, check out our <strong><a href="https://www.youtube.com/watch?v=geNzY1nbCnU">Full Video Demo</a></strong>!
## Deployment
<h3>Deployment</h3>
Danswer can easily be run locally (even on a laptop) or deployed on a virtual machine with a single
`docker compose` command. Check out our [docs](https://docs.danswer.dev/quickstart) to learn more.
Danswer can easily be tested locally or deployed on a virtual machine with a single `docker compose` command. Check out our [docs](https://docs.danswer.dev/quickstart) to learn more.
We also have built-in support for deployment on Kubernetes. Files for that can be found [here](https://github.com/danswer-ai/danswer/tree/main/deployment/kubernetes).
## 💃 Features
* Direct QA powered by Generative AI models with answers backed by quotes and source links.
* Intelligent Document Retrieval (Semantic Search/Reranking) using the latest LLMs.
* An AI Helper backed by a custom Deep Learning model to interpret user intent.
* User authentication and document level access management.
* Support for an LLM of your choice (GPT-4, Llama2, Orca, etc.)
* Management Dashboard to manage connectors and set up features such as live update fetching.
* One line Docker Compose (or Kubernetes) deployment to host Danswer anywhere.
## 💃 Main Features
* Chat UI with the ability to select documents to chat with.
* Create custom AI Assistants with different prompts and backing knowledge sets.
* Connect Danswer with LLM of your choice (self-host for a fully airgapped solution).
* Document Search + AI Answers for natural language queries.
* Connectors to all common workplace tools like Google Drive, Confluence, Slack, etc.
* Slack integration to get answers and search results directly in Slack.
## 🔌 Connectors
## 🚧 Roadmap
* Chat/Prompt sharing with specific teammates and user groups.
* Multi-modal model support, chat with images, video, etc.
* Choosing between LLMs and parameters during chat session.
* Tool calling and agent configuration options.
* Organizational understanding and ability to locate and suggest experts from your team.
## Other Notable Benefits of Danswer
* User Authentication with document level access management.
* Best in class Hybrid Search across all sources (BM-25 + prefix aware embedding models).
* Admin Dashboard to configure connectors, document-sets, access, etc.
* Custom deep learning models + learn from user feedback.
* Easy deployment and ability to host Danswer anywhere of your choosing.
## 🔌 Connectors
Efficiently pulls the latest changes from:
Danswer currently syncs documents (every 10 minutes) from:
* Slack
* GitHub
* Google Drive
* Confluence
* Jira
* Zendesk
* Gmail
* Notion
* Gong
* Slab
* Linear
* Productboard
* Guru
* Zulip
* Bookstack
* Document360
* Sharepoint
* Hubspot
* Local Files
* Websites
* And more ...
* With more to come...
## 📚 Editions
There are two editions of Danswer:
* Danswer Community Edition (CE) is available freely under the MIT Expat license. This version has ALL the core features discussed above. This is the version of Danswer you will get if you follow the Deployment guide above.
* Danswer Enterprise Edition (EE) includes extra features that are primarily useful for larger organizations. Specifically, this includes:
* Single Sign-On (SSO), with support for both SAML and OIDC
* Role-based access control
* Document permission inheritance from connected sources
* Usage analytics and query history accessible to admins
* Whitelabeling
* API key authentication
* Encryption of secrets
* And many more! Check out [our website](https://www.danswer.ai/) for the latest.
To try the Danswer Enterprise Edition:
1. Check out our [Cloud product](https://app.danswer.ai/signup).
2. For self-hosting, contact us at [founders@danswer.ai](mailto:founders@danswer.ai) or book a call with us on our [Cal](https://cal.com/team/danswer/founders).
## 🚧 Roadmap
* Chat/Conversation support.
* Organizational understanding.
* Ability to locate and suggest experts.
## 💡 Contributing
Looking to contribute? Please check out the [Contribution Guide](CONTRIBUTING.md) for more details.


@@ -1,17 +0,0 @@
**/__pycache__
venv/
env/
*.egg-info
.cache
.git/
.svn/
.vscode/
.idea/
*.log
log/
.env
secrets.yaml
build/
dist/
.coverage
htmlcov/

backend/.gitignore

@@ -1,11 +1,9 @@
__pycache__/
.mypy_cache
.idea/
site_crawls/
.ipynb_checkpoints/
api_keys.py
*ipynb
.env*
.env
vespa-app.zip
dynamic_config_storage/
celerybeat-schedule*


@@ -28,13 +28,6 @@ repos:
rev: v0.0.286
hooks:
- id: ruff
- repo: https://github.com/pre-commit/mirrors-prettier
rev: v3.1.0
hooks:
- id: prettier
types_or: [html, css, javascript, ts, tsx]
additional_dependencies:
- prettier
# We would like to have a mypy pre-commit hook, but due to the fact that
# pre-commit runs in it's own isolated environment, we would need to install


@@ -1,46 +0,0 @@
# https://github.com/madler/zlib/issues/868
# Pulled in with base Debian image, it's part of the contrib folder but unused
# zlib1g is fine
# Will be gone with Debian image upgrade
# No impact in our settings
CVE-2023-45853
# krb5 related, worst case is denial of service by resource exhaustion
# Accept the risk
CVE-2024-26458
CVE-2024-26461
CVE-2024-26462
# Specific to Firefox which we do not use
# No impact in our settings
CVE-2024-0743
# bind9 related, worst case is denial of service by CPU resource exhaustion
# Accept the risk
CVE-2023-50387
CVE-2023-50868
# libexpat1, XML parsing resource exhaustion
# We don't parse any user provided XMLs
# No impact in our settings
CVE-2023-52425
CVE-2024-28757
# sqlite, only used by NLTK library to grab word lemmatizer and stopwords
# No impact in our settings
CVE-2023-7104
# libharfbuzz0b, O(n^2) growth, worst case is denial of service
# Accept the risk
CVE-2023-25193
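
The backend tag workflow passes this file to Trivy via `trivyignores`; to reproduce the scan locally with the same suppressions, something like the following should work (flags assumed from the standard Trivy CLI, extending the command in the workflow comment):

```bash
# Scan the backend image at HIGH/CRITICAL severity, honoring this ignore list.
trivy image --severity HIGH,CRITICAL \
  --ignorefile ./backend/.trivyignore \
  danswer/danswer-backend
```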


@@ -1,102 +1,57 @@
FROM python:3.11.7-slim-bookworm
FROM python:3.11.4-slim-bookworm
LABEL com.danswer.maintainer="founders@danswer.ai"
LABEL com.danswer.description="This image is the web/frontend container of Danswer which \
contains code for both the Community and Enterprise editions of Danswer. If you do not \
have a contract or agreement with DanswerAI, you are not permitted to use the Enterprise \
Edition features outside of personal development or testing purposes. Please reach out to \
founders@danswer.ai for more information. Please visit https://github.com/danswer-ai/danswer"
# Default DANSWER_VERSION, typically overridden during builds by GitHub Actions.
ARG DANSWER_VERSION=0.3-dev
ENV DANSWER_VERSION=${DANSWER_VERSION}
RUN echo "DANSWER_VERSION: ${DANSWER_VERSION}"
# Install system dependencies
# cmake needed for psycopg (postgres)
# libpq-dev needed for psycopg (postgres)
# curl included just for users' convenience
# zip for Vespa step further down
# ca-certificates for HTTPS
RUN apt-get update && \
apt-get install -y \
cmake \
curl \
zip \
ca-certificates \
libgnutls30=3.7.9-2+deb12u3 \
libblkid1=2.38.1-5+deb12u1 \
libmount1=2.38.1-5+deb12u1 \
libsmartcols1=2.38.1-5+deb12u1 \
libuuid1=2.38.1-5+deb12u1 \
libxmlsec1-dev \
pkg-config \
gcc && \
apt-get install -y git cmake pkg-config libprotobuf-c-dev protobuf-compiler \
libprotobuf-dev libgoogle-perftools-dev libpq-dev build-essential cron curl \
supervisor zip ca-certificates gnupg && \
rm -rf /var/lib/apt/lists/* && \
apt-get clean
# Install Python dependencies
# Remove py, which is pulled in by retry; py is not needed and carries a known CVE
COPY ./requirements/default.txt /tmp/requirements.txt
COPY ./requirements/ee.txt /tmp/ee-requirements.txt
RUN pip install --no-cache-dir --upgrade \
-r /tmp/requirements.txt \
-r /tmp/ee-requirements.txt && \
RUN pip install --no-cache-dir --upgrade -r /tmp/requirements.txt && \
pip uninstall -y py && \
playwright install chromium && \
playwright install-deps chromium && \
ln -s /usr/local/bin/supervisord /usr/bin/supervisord
playwright install-deps chromium
# install nodejs and replace nodejs packaged with playwright (18.17.0) with the one installed below
# based on the instructions found here:
# https://nodejs.org/en/download/package-manager#debian-and-ubuntu-based-linux-distributions
# this is temporarily needed until playwright updates their packaged node version to
# 20.5.1+
RUN mkdir -p /etc/apt/keyrings && \
curl -fsSL https://deb.nodesource.com/gpgkey/nodesource-repo.gpg.key | gpg --dearmor -o /etc/apt/keyrings/nodesource.gpg && \
echo "deb [signed-by=/etc/apt/keyrings/nodesource.gpg] https://deb.nodesource.com/node_20.x nodistro main" | tee /etc/apt/sources.list.d/nodesource.list && \
apt-get update && \
apt-get install -y nodejs && \
cp /usr/bin/node /usr/local/lib/python3.11/site-packages/playwright/driver/node && \
apt-get remove -y nodejs
# Cleanup for CVEs and size reduction
# Remove tornado test key to placate vulnerability scanners
# More details can be found here:
# https://github.com/tornadoweb/tornado/issues/3107
# xserver-common and xvfb included by playwright installation but not needed after
# perl-base is part of the base Python Debian image but not needed for Danswer functionality
# perl-base could only be removed with --allow-remove-essential
RUN apt-get update && \
apt-get remove -y --allow-remove-essential \
perl-base \
xserver-common \
xvfb \
cmake \
libldap-2.5-0 \
libxmlsec1-dev \
pkg-config \
gcc && \
apt-get install -y libxmlsec1-openssl && \
RUN apt-get remove -y linux-libc-dev && \
apt-get autoremove -y && \
rm -rf /var/lib/apt/lists/* && \
rm -f /usr/local/lib/python3.11/site-packages/tornado/test/test.key
# Pre-downloading models for setups with limited egress
RUN python -c "from tokenizers import Tokenizer; \
Tokenizer.from_pretrained('nomic-ai/nomic-embed-text-v1')"
# Pre-downloading NLTK for setups with limited egress
RUN python -c "import nltk; \
nltk.download('stopwords', quiet=True); \
nltk.download('wordnet', quiet=True); \
nltk.download('punkt', quiet=True);"
rm /usr/local/lib/python3.11/site-packages/tornado/test/test.key
# Set up application files
WORKDIR /app
# Enterprise Version Files
COPY ./ee /app/ee
COPY supervisord.conf /etc/supervisor/conf.d/supervisord.conf
# Set up application files
COPY ./danswer /app/danswer
COPY ./shared_configs /app/shared_configs
COPY ./alembic /app/alembic
COPY ./alembic.ini /app/alembic.ini
COPY supervisord.conf /usr/etc/supervisord.conf
COPY supervisord.conf /etc/supervisor/conf.d/supervisord.conf
# Escape hatch
COPY ./scripts/force_delete_connector_by_id.py /app/scripts/force_delete_connector_by_id.py
# Create Vespa app zip
WORKDIR /app/danswer/document_index/vespa/app_config
RUN zip -r /app/danswer/vespa-app.zip .
WORKDIR /app
# Put logo in assets
COPY ./assets /app/assets
# TODO: remove this once all users have migrated
COPY ./scripts/migrate_vespa_to_acl.py /app/migrate_vespa_to_acl.py
ENV PYTHONPATH /app


@@ -1,50 +0,0 @@
FROM python:3.11.7-slim-bookworm
LABEL com.danswer.maintainer="founders@danswer.ai"
LABEL com.danswer.description="This image is for the Danswer model server which runs all of the \
AI models for Danswer. This container and all the code is MIT Licensed and free for all to use. \
You can find it at https://hub.docker.com/r/danswer/danswer-model-server. For more details, \
visit https://github.com/danswer-ai/danswer."
# Default DANSWER_VERSION, typically overridden during builds by GitHub Actions.
ARG DANSWER_VERSION=0.3-dev
ENV DANSWER_VERSION=${DANSWER_VERSION}
RUN echo "DANSWER_VERSION: ${DANSWER_VERSION}"
COPY ./requirements/model_server.txt /tmp/requirements.txt
RUN pip install --no-cache-dir --upgrade -r /tmp/requirements.txt
RUN apt-get remove -y --allow-remove-essential perl-base && \
apt-get autoremove -y
# Pre-downloading models for setups with limited egress
# Download tokenizers, distilbert for the Danswer model
# Download model weights
# Run Nomic to pull in the custom architecture and have it cached locally
RUN python -c "from transformers import AutoTokenizer; \
AutoTokenizer.from_pretrained('distilbert-base-uncased', cache_folder='/root/.cache/temp_huggingface/hub/'); \
AutoTokenizer.from_pretrained('mixedbread-ai/mxbai-rerank-xsmall-v1', cache_folder='/root/.cache/temp_huggingface/hub/'); \
from huggingface_hub import snapshot_download; \
snapshot_download(repo_id='danswer/hybrid-intent-token-classifier', revision='v1.0.3', cache_dir='/root/.cache/temp_huggingface/hub/'); \
snapshot_download('nomic-ai/nomic-embed-text-v1', cache_dir='/root/.cache/temp_huggingface/hub/'); \
snapshot_download('mixedbread-ai/mxbai-rerank-xsmall-v1', cache_dir='/root/.cache/temp_huggingface/hub/'); \
from sentence_transformers import SentenceTransformer; \
SentenceTransformer(model_name_or_path='nomic-ai/nomic-embed-text-v1', trust_remote_code=True, cache_folder='/root/.cache/temp_huggingface/hub/');"
WORKDIR /app
# Utils used by model server
COPY ./danswer/utils/logger.py /app/danswer/utils/logger.py
# Place to fetch version information
COPY ./danswer/__init__.py /app/danswer/__init__.py
# Shared between Danswer Backend and Model Server
COPY ./shared_configs /app/shared_configs
# Model Server main code
COPY ./model_server /app/model_server
ENV PYTHONPATH /app
CMD ["uvicorn", "model_server.main:app", "--host", "0.0.0.0", "--port", "9000"]


@@ -1,8 +1,4 @@
<!-- DANSWER_METADATA={"link": "https://github.com/danswer-ai/danswer/blob/main/backend/alembic/README.md"} -->
# Alembic DB Migrations
These files are for creating/updating the tables in the Relational DB (Postgres).
Danswer migrations use a generic single-database configuration with an async dbapi.
Generic single-database configuration with an async dbapi.
## To generate new migrations:
run from danswer/backend:
@@ -11,6 +7,7 @@ run from danswer/backend:
More info can be found here: https://alembic.sqlalchemy.org/en/latest/autogenerate.html
## Running migrations
To run all un-applied migrations:
`alembic upgrade head`
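
The generation command itself falls outside the hunk above; with the standard Alembic CLI (an assumption, not shown in this diff), autogenerating a migration from `danswer/backend` looks like:

```bash
# Diff the SQLAlchemy models against the database and write a new
# migration under alembic/versions/.
alembic revision --autogenerate -m "describe your change"
```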


@@ -1,27 +0,0 @@
"""Add thread specific model selection
Revision ID: 0568ccf46a6b
Revises: e209dc5a8156
Create Date: 2024-06-19 14:25:36.376046
"""
from alembic import op
import sqlalchemy as sa
# revision identifiers, used by Alembic.
revision = "0568ccf46a6b"
down_revision = "e209dc5a8156"
branch_labels: None = None
depends_on: None = None
def upgrade() -> None:
op.add_column(
"chat_session",
sa.Column("current_alternate_model", sa.String(), nullable=True),
)
def downgrade() -> None:
op.drop_column("chat_session", "current_alternate_model")


@@ -1,32 +0,0 @@
"""add search doc relevance details
Revision ID: 05c07bf07c00
Revises: b896bbd0d5a7
Create Date: 2024-07-10 17:48:15.886653
"""
from alembic import op
import sqlalchemy as sa
# revision identifiers, used by Alembic.
revision = "05c07bf07c00"
down_revision = "b896bbd0d5a7"
branch_labels: None = None
depends_on: None = None
def upgrade() -> None:
op.add_column(
"search_doc",
sa.Column("is_relevant", sa.Boolean(), nullable=True),
)
op.add_column(
"search_doc",
sa.Column("relevance_explanation", sa.String(), nullable=True),
)
def downgrade() -> None:
op.drop_column("search_doc", "relevance_explanation")
op.drop_column("search_doc", "is_relevant")


@@ -1,26 +0,0 @@
"""add_indexing_start_to_connector
Revision ID: 08a1eda20fe1
Revises: 8a87bd6ec550
Create Date: 2024-07-23 11:12:39.462397
"""
from alembic import op
import sqlalchemy as sa
# revision identifiers, used by Alembic.
revision = "08a1eda20fe1"
down_revision = "8a87bd6ec550"
branch_labels: None = None
depends_on: None = None
def upgrade() -> None:
op.add_column(
"connector", sa.Column("indexing_start", sa.DateTime(), nullable=True)
)
def downgrade() -> None:
op.drop_column("connector", "indexing_start")


@@ -1,31 +0,0 @@
"""Add starter prompts
Revision ID: 0a2b51deb0b8
Revises: 5f4b8568a221
Create Date: 2024-03-02 23:23:49.960309
"""
from alembic import op
import sqlalchemy as sa
from sqlalchemy.dialects import postgresql
# revision identifiers, used by Alembic.
revision = "0a2b51deb0b8"
down_revision = "5f4b8568a221"
branch_labels: None = None
depends_on: None = None
def upgrade() -> None:
op.add_column(
"persona",
sa.Column(
"starter_messages",
postgresql.JSONB(astext_type=sa.Text()),
nullable=True,
),
)
def downgrade() -> None:
op.drop_column("persona", "starter_messages")


@@ -1,113 +0,0 @@
"""Enable Encrypted Fields
Revision ID: 0a98909f2757
Revises: 570282d33c49
Create Date: 2024-05-05 19:30:34.317972
"""
from alembic import op
import sqlalchemy as sa
from sqlalchemy.sql import table
from sqlalchemy.dialects import postgresql
import json
from danswer.utils.encryption import encrypt_string_to_bytes
# revision identifiers, used by Alembic.
revision = "0a98909f2757"
down_revision = "570282d33c49"
branch_labels: None = None
depends_on: None = None
def upgrade() -> None:
connection = op.get_bind()
op.alter_column("key_value_store", "value", nullable=True)
op.add_column(
"key_value_store",
sa.Column(
"encrypted_value",
sa.LargeBinary,
nullable=True,
),
)
# Need a temporary column to translate the JSONB to binary
op.add_column("credential", sa.Column("temp_column", sa.LargeBinary()))
creds_table = table(
"credential",
sa.Column("id", sa.Integer(), nullable=False),
sa.Column(
"credential_json",
postgresql.JSONB(astext_type=sa.Text()),
nullable=False,
),
sa.Column(
"temp_column",
sa.LargeBinary(),
nullable=False,
),
)
results = connection.execute(sa.select(creds_table))
# This uses the MIT encrypt, which does not actually encrypt the credentials.
# In other words, this upgrade does not apply the encryption. Porting existing sensitive data
# and key rotation are currently not supported and will come out in the future.
for row_id, creds, _ in results:
creds_binary = encrypt_string_to_bytes(json.dumps(creds))
connection.execute(
creds_table.update()
.where(creds_table.c.id == row_id)
.values(temp_column=creds_binary)
)
op.drop_column("credential", "credential_json")
op.alter_column("credential", "temp_column", new_column_name="credential_json")
op.add_column("llm_provider", sa.Column("temp_column", sa.LargeBinary()))
llm_table = table(
"llm_provider",
sa.Column("id", sa.Integer(), nullable=False),
sa.Column(
"api_key",
sa.String(),
nullable=False,
),
sa.Column(
"temp_column",
sa.LargeBinary(),
nullable=False,
),
)
results = connection.execute(sa.select(llm_table))
for row_id, api_key, _ in results:
llm_key = encrypt_string_to_bytes(api_key)
connection.execute(
llm_table.update()
.where(llm_table.c.id == row_id)
.values(temp_column=llm_key)
)
op.drop_column("llm_provider", "api_key")
op.alter_column("llm_provider", "temp_column", new_column_name="api_key")
def downgrade() -> None:
# Some information loss but this is ok. Should not allow decryption via downgrade.
op.drop_column("credential", "credential_json")
op.drop_column("llm_provider", "api_key")
op.add_column("llm_provider", sa.Column("api_key", sa.String()))
op.add_column(
"credential",
sa.Column("credential_json", postgresql.JSONB(astext_type=sa.Text())),
)
op.execute("DELETE FROM key_value_store WHERE value IS NULL")
op.alter_column("key_value_store", "value", nullable=False)
op.drop_column("key_value_store", "encrypted_value")


@@ -1,37 +0,0 @@
"""Introduce Danswer APIs
Revision ID: 15326fcec57e
Revises: 77d07dffae64
Create Date: 2023-11-11 20:51:24.228999
"""
from alembic import op
import sqlalchemy as sa
from danswer.configs.constants import DocumentSource
# revision identifiers, used by Alembic.
revision = "15326fcec57e"
down_revision = "77d07dffae64"
branch_labels: None = None
depends_on: None = None
def upgrade() -> None:
op.alter_column("credential", "is_admin", new_column_name="admin_public")
op.add_column(
"document",
sa.Column("from_ingestion_api", sa.Boolean(), nullable=True),
)
op.alter_column(
"connector",
"source",
type_=sa.String(length=50),
existing_type=sa.Enum(DocumentSource, native_enum=False),
existing_nullable=False,
)
def downgrade() -> None:
op.drop_column("document", "from_ingestion_api")
op.alter_column("credential", "admin_public", new_column_name="is_admin")


@@ -1,29 +0,0 @@
"""Port Config Store
Revision ID: 173cae5bba26
Revises: e50154680a5c
Create Date: 2024-03-19 15:30:44.425436
"""
from alembic import op
import sqlalchemy as sa
from sqlalchemy.dialects import postgresql
# revision identifiers, used by Alembic.
revision = "173cae5bba26"
down_revision = "e50154680a5c"
branch_labels: None = None
depends_on: None = None
def upgrade() -> None:
op.create_table(
"key_value_store",
sa.Column("key", sa.String(), nullable=False),
sa.Column("value", postgresql.JSONB(astext_type=sa.Text()), nullable=False),
sa.PrimaryKeyConstraint("key"),
)
def downgrade() -> None:
op.drop_table("key_value_store")


@@ -1,44 +0,0 @@
"""notifications
Revision ID: 213fd978c6d8
Revises: 5fc1f54cc252
Create Date: 2024-08-10 11:13:36.070790
"""
from alembic import op
import sqlalchemy as sa
# revision identifiers, used by Alembic.
revision = "213fd978c6d8"
down_revision = "5fc1f54cc252"
branch_labels: None = None
depends_on: None = None
def upgrade() -> None:
op.create_table(
"notification",
sa.Column("id", sa.Integer(), nullable=False),
sa.Column(
"notif_type",
sa.String(),
nullable=False,
),
sa.Column(
"user_id",
sa.UUID(),
nullable=True,
),
sa.Column("dismissed", sa.Boolean(), nullable=False),
sa.Column("last_shown", sa.DateTime(timezone=True), nullable=False),
sa.Column("first_shown", sa.DateTime(timezone=True), nullable=False),
sa.ForeignKeyConstraint(
["user_id"],
["user.id"],
),
sa.PrimaryKeyConstraint("id"),
)
def downgrade() -> None:
op.drop_table("notification")


@@ -1,86 +0,0 @@
"""remove-feedback-foreignkey-constraint
Revision ID: 23957775e5f5
Revises: bc9771dccadf
Create Date: 2024-06-27 16:04:51.480437
"""
from alembic import op
import sqlalchemy as sa
# revision identifiers, used by Alembic.
revision = "23957775e5f5"
down_revision = "bc9771dccadf"
branch_labels = None # type: ignore
depends_on = None # type: ignore
def upgrade() -> None:
op.drop_constraint(
"chat_feedback__chat_message_fk", "chat_feedback", type_="foreignkey"
)
op.create_foreign_key(
"chat_feedback__chat_message_fk",
"chat_feedback",
"chat_message",
["chat_message_id"],
["id"],
ondelete="SET NULL",
)
op.alter_column(
"chat_feedback", "chat_message_id", existing_type=sa.Integer(), nullable=True
)
op.drop_constraint(
"document_retrieval_feedback__chat_message_fk",
"document_retrieval_feedback",
type_="foreignkey",
)
op.create_foreign_key(
"document_retrieval_feedback__chat_message_fk",
"document_retrieval_feedback",
"chat_message",
["chat_message_id"],
["id"],
ondelete="SET NULL",
)
op.alter_column(
"document_retrieval_feedback",
"chat_message_id",
existing_type=sa.Integer(),
nullable=True,
)
def downgrade() -> None:
op.alter_column(
"chat_feedback", "chat_message_id", existing_type=sa.Integer(), nullable=False
)
op.drop_constraint(
"chat_feedback__chat_message_fk", "chat_feedback", type_="foreignkey"
)
op.create_foreign_key(
"chat_feedback__chat_message_fk",
"chat_feedback",
"chat_message",
["chat_message_id"],
["id"],
)
op.alter_column(
"document_retrieval_feedback",
"chat_message_id",
existing_type=sa.Integer(),
nullable=False,
)
op.drop_constraint(
"document_retrieval_feedback__chat_message_fk",
"document_retrieval_feedback",
type_="foreignkey",
)
op.create_foreign_key(
"document_retrieval_feedback__chat_message_fk",
"document_retrieval_feedback",
"chat_message",
["chat_message_id"],
["id"],
)


@@ -13,8 +13,8 @@ from alembic import op
# revision identifiers, used by Alembic.
revision = "2666d766cb9b"
down_revision = "6d387b3196c2"
branch_labels: None = None
depends_on: None = None
branch_labels = None
depends_on = None
def upgrade() -> None:


@@ -13,8 +13,8 @@ from sqlalchemy.dialects import postgresql
# revision identifiers, used by Alembic.
revision = "27c6ecc08586"
down_revision = "2666d766cb9b"
branch_labels: None = None
depends_on: None = None
branch_labels = None
depends_on = None
def upgrade() -> None:
@@ -160,28 +160,12 @@ def downgrade() -> None:
nullable=False,
),
)
# Check if the constraint exists before dropping
conn = op.get_bind()
inspector = sa.inspect(conn)
constraints = inspector.get_foreign_keys("index_attempt")
if any(
constraint["name"] == "fk_index_attempt_credential_id"
for constraint in constraints
):
op.drop_constraint(
"fk_index_attempt_credential_id", "index_attempt", type_="foreignkey"
)
if any(
constraint["name"] == "fk_index_attempt_connector_id"
for constraint in constraints
):
op.drop_constraint(
"fk_index_attempt_connector_id", "index_attempt", type_="foreignkey"
)
op.drop_constraint(
"fk_index_attempt_credential_id", "index_attempt", type_="foreignkey"
)
op.drop_constraint(
"fk_index_attempt_connector_id", "index_attempt", type_="foreignkey"
)
op.drop_column("index_attempt", "credential_id")
op.drop_column("index_attempt", "connector_id")
op.drop_table("connector_credential_pair")


@@ -11,8 +11,8 @@ import sqlalchemy as sa
# revision identifiers, used by Alembic.
revision = "30c1d5744104"
down_revision = "7f99be1cb9f5"
branch_labels: None = None
depends_on: None = None
branch_labels = None
depends_on = None
def upgrade() -> None:


@@ -1,70 +0,0 @@
"""Add icon_color and icon_shape to Persona
Revision ID: 325975216eb3
Revises: 91ffac7e65b3
Create Date: 2024-07-24 21:29:31.784562
"""
import random
from alembic import op
import sqlalchemy as sa
from sqlalchemy.sql import table, column, select
# revision identifiers, used by Alembic.
revision = "325975216eb3"
down_revision = "91ffac7e65b3"
branch_labels: None = None
depends_on: None = None
colorOptions = [
"#FF6FBF",
"#6FB1FF",
"#B76FFF",
"#FFB56F",
"#6FFF8D",
"#FF6F6F",
"#6FFFFF",
]
# Function to generate a random shape ensuring at least 3 of the middle 4 squares are filled
def generate_random_shape() -> int:
center_squares = [12, 10, 6, 14, 13, 11, 7, 15]
center_fill = random.choice(center_squares)
remaining_squares = [i for i in range(16) if not (center_fill & (1 << i))]
random.shuffle(remaining_squares)
for i in range(10 - bin(center_fill).count("1")):
center_fill |= 1 << remaining_squares[i]
return center_fill
def upgrade() -> None:
op.add_column("persona", sa.Column("icon_color", sa.String(), nullable=True))
op.add_column("persona", sa.Column("icon_shape", sa.Integer(), nullable=True))
op.add_column("persona", sa.Column("uploaded_image_id", sa.String(), nullable=True))
persona = table(
"persona",
column("id", sa.Integer),
column("icon_color", sa.String),
column("icon_shape", sa.Integer),
)
conn = op.get_bind()
personas = conn.execute(select(persona.c.id))
for persona_id in personas:
random_color = random.choice(colorOptions)
random_shape = generate_random_shape()
conn.execute(
persona.update()
.where(persona.c.id == persona_id[0])
.values(icon_color=random_color, icon_shape=random_shape)
)
def downgrade() -> None:
op.drop_column("persona", "icon_shape")
op.drop_column("persona", "uploaded_image_id")
op.drop_column("persona", "icon_color")


@@ -1,45 +0,0 @@
"""Add tool table
Revision ID: 3879338f8ba1
Revises: f1c6478c3fd8
Create Date: 2024-05-11 16:11:23.718084
"""
from alembic import op
import sqlalchemy as sa
# revision identifiers, used by Alembic.
revision = "3879338f8ba1"
down_revision = "f1c6478c3fd8"
branch_labels: None = None
depends_on: None = None
def upgrade() -> None:
op.create_table(
"tool",
sa.Column("id", sa.Integer(), nullable=False),
sa.Column("name", sa.String(), nullable=False),
sa.Column("description", sa.Text(), nullable=True),
sa.Column("in_code_tool_id", sa.String(), nullable=True),
sa.PrimaryKeyConstraint("id"),
)
op.create_table(
"persona__tool",
sa.Column("persona_id", sa.Integer(), nullable=False),
sa.Column("tool_id", sa.Integer(), nullable=False),
sa.ForeignKeyConstraint(
["persona_id"],
["persona.id"],
),
sa.ForeignKeyConstraint(
["tool_id"],
["tool.id"],
),
sa.PrimaryKeyConstraint("persona_id", "tool_id"),
)
def downgrade() -> None:
op.drop_table("persona__tool")
op.drop_table("tool")


@@ -1,41 +0,0 @@
"""Add chat session sharing
Revision ID: 38eda64af7fe
Revises: 776b3bbe9092
Create Date: 2024-03-27 19:41:29.073594
"""
from alembic import op
import sqlalchemy as sa
# revision identifiers, used by Alembic.
revision = "38eda64af7fe"
down_revision = "776b3bbe9092"
branch_labels: None = None
depends_on: None = None
def upgrade() -> None:
op.add_column(
"chat_session",
sa.Column(
"shared_status",
sa.Enum(
"PUBLIC",
"PRIVATE",
name="chatsessionsharedstatus",
native_enum=False,
),
nullable=True,
),
)
op.execute("UPDATE chat_session SET shared_status='PRIVATE'")
op.alter_column(
"chat_session",
"shared_status",
nullable=False,
)
def downgrade() -> None:
op.drop_column("chat_session", "shared_status")

@@ -1,35 +0,0 @@
"""add alternate assistant to chat message
Revision ID: 3a7802814195
Revises: 23957775e5f5
Create Date: 2024-06-05 11:18:49.966333
"""
from alembic import op
import sqlalchemy as sa
# revision identifiers, used by Alembic.
revision = "3a7802814195"
down_revision = "23957775e5f5"
branch_labels: None = None
depends_on: None = None
def upgrade() -> None:
op.add_column(
"chat_message", sa.Column("alternate_assistant_id", sa.Integer(), nullable=True)
)
op.create_foreign_key(
"fk_chat_message_persona",
"chat_message",
"persona",
["alternate_assistant_id"],
["id"],
)
def downgrade() -> None:
op.drop_constraint("fk_chat_message_persona", "chat_message", type_="foreignkey")
op.drop_column("chat_message", "alternate_assistant_id")

@@ -11,8 +11,8 @@ import sqlalchemy as sa
# revision identifiers, used by Alembic.
revision = "3b25685ff73c"
down_revision = "e0a68a81d434"
-branch_labels: None = None
-depends_on: None = None
+branch_labels = None
+depends_on = None
def upgrade() -> None:

@@ -12,8 +12,8 @@ from alembic import op
# revision identifiers, used by Alembic.
revision = "3c5e35aa9af0"
down_revision = "27c6ecc08586"
-branch_labels: None = None
-depends_on: None = None
+branch_labels = None
+depends_on = None
def upgrade() -> None:

@@ -1,49 +0,0 @@
"""Add tables for UI-based LLM configuration
Revision ID: 401c1ac29467
Revises: 703313b75876
Create Date: 2024-04-13 18:07:29.153817
"""
from alembic import op
import sqlalchemy as sa
from sqlalchemy.dialects import postgresql
# revision identifiers, used by Alembic.
revision = "401c1ac29467"
down_revision = "703313b75876"
branch_labels: None = None
depends_on: None = None
def upgrade() -> None:
op.create_table(
"llm_provider",
sa.Column("id", sa.Integer(), nullable=False),
sa.Column("name", sa.String(), nullable=False),
sa.Column("api_key", sa.String(), nullable=True),
sa.Column("api_base", sa.String(), nullable=True),
sa.Column("api_version", sa.String(), nullable=True),
sa.Column(
"custom_config",
postgresql.JSONB(astext_type=sa.Text()),
nullable=True,
),
sa.Column("default_model_name", sa.String(), nullable=False),
sa.Column("fast_default_model_name", sa.String(), nullable=True),
sa.Column("is_default_provider", sa.Boolean(), unique=True, nullable=True),
sa.Column("model_names", postgresql.ARRAY(sa.String()), nullable=True),
sa.PrimaryKeyConstraint("id"),
sa.UniqueConstraint("name"),
)
op.add_column(
"persona",
sa.Column("llm_model_provider_override", sa.String(), nullable=True),
)
def downgrade() -> None:
op.drop_column("persona", "llm_model_provider_override")
op.drop_table("llm_provider")

@@ -1,42 +0,0 @@
"""Rename index_origin to index_recursively
Revision ID: 1d6ad76d1f37
Revises: e1392f05e840
Create Date: 2024-08-01 12:38:54.466081
"""
from alembic import op
# revision identifiers, used by Alembic.
revision = "1d6ad76d1f37"
down_revision = "e1392f05e840"
branch_labels: None = None
depends_on: None = None
def upgrade() -> None:
op.execute(
"""
UPDATE connector
SET connector_specific_config = jsonb_set(
connector_specific_config,
'{index_recursively}',
'true'::jsonb
) - 'index_origin'
WHERE connector_specific_config ? 'index_origin'
"""
)
def downgrade() -> None:
op.execute(
"""
UPDATE connector
SET connector_specific_config = jsonb_set(
connector_specific_config,
'{index_origin}',
connector_specific_config->'index_recursively'
) - 'index_recursively'
WHERE connector_specific_config ? 'index_recursively'
"""
)
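The rename happens in one statement: jsonb_set writes the new key and the trailing - 'index_origin' operator strips the old one. Note the asymmetry, though: the upgrade hard-codes 'true'::jsonb as the new value, so a connector that had index_origin = false comes out with index_recursively = true, while the downgrade copies the stored value back. A value-preserving variant of the upgrade would copy the old key instead, as in this sketch:

# Sketch: value-preserving JSONB key rename (the migration above instead
# forces the new key to true on upgrade).
op.execute(
    """
    UPDATE connector
    SET connector_specific_config = jsonb_set(
        connector_specific_config,
        '{index_recursively}',
        connector_specific_config -> 'index_origin'
    ) - 'index_origin'
    WHERE connector_specific_config ? 'index_origin'
    """
)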

@@ -1,65 +0,0 @@
"""add cloud embedding model and update embedding_model
Revision ID: 44f856ae2a4a
Revises: d716b0791ddd
Create Date: 2024-06-28 20:01:05.927647
"""
from alembic import op
import sqlalchemy as sa
# revision identifiers, used by Alembic.
revision = "44f856ae2a4a"
down_revision = "d716b0791ddd"
branch_labels: None = None
depends_on: None = None
def upgrade() -> None:
# Create embedding_provider table
op.create_table(
"embedding_provider",
sa.Column("id", sa.Integer(), nullable=False),
sa.Column("name", sa.String(), nullable=False),
sa.Column("api_key", sa.LargeBinary(), nullable=True),
sa.Column("default_model_id", sa.Integer(), nullable=True),
sa.PrimaryKeyConstraint("id"),
sa.UniqueConstraint("name"),
)
# Add cloud_provider_id to embedding_model table
op.add_column(
"embedding_model", sa.Column("cloud_provider_id", sa.Integer(), nullable=True)
)
# Add foreign key constraints
op.create_foreign_key(
"fk_embedding_model_cloud_provider",
"embedding_model",
"embedding_provider",
["cloud_provider_id"],
["id"],
)
op.create_foreign_key(
"fk_embedding_provider_default_model",
"embedding_provider",
"embedding_model",
["default_model_id"],
["id"],
)
def downgrade() -> None:
# Remove foreign key constraints
op.drop_constraint(
"fk_embedding_model_cloud_provider", "embedding_model", type_="foreignkey"
)
op.drop_constraint(
"fk_embedding_provider_default_model", "embedding_provider", type_="foreignkey"
)
# Remove cloud_provider_id column
op.drop_column("embedding_model", "cloud_provider_id")
# Drop embedding_provider table
op.drop_table("embedding_provider")

@@ -1,23 +0,0 @@
"""added is_internet to DBDoc
Revision ID: 4505fd7302e1
Revises: c18cdf4b497e
Create Date: 2024-06-18 20:46:09.095034
"""
from alembic import op
import sqlalchemy as sa
# revision identifiers, used by Alembic.
revision = "4505fd7302e1"
down_revision = "c18cdf4b497e"
def upgrade() -> None:
op.add_column("search_doc", sa.Column("is_internet", sa.Boolean(), nullable=True))
op.add_column("tool", sa.Column("display_name", sa.String(), nullable=True))
def downgrade() -> None:
op.drop_column("tool", "display_name")
op.drop_column("search_doc", "is_internet")

@@ -12,8 +12,8 @@ import sqlalchemy as sa
# revision identifiers, used by Alembic.
revision = "465f78d9b7f9"
down_revision = "3c5e35aa9af0"
-branch_labels: None = None
-depends_on: None = None
+branch_labels = None
+depends_on = None
def upgrade() -> None:

@@ -11,8 +11,8 @@ from sqlalchemy import String
# revision identifiers, used by Alembic.
revision = "46625e4745d4"
down_revision = "9d97fecfab7f"
-branch_labels: None = None
-depends_on: None = None
+branch_labels = None
+depends_on = None
def upgrade() -> None:

@@ -1,28 +0,0 @@
"""PG File Store
Revision ID: 4738e4b3bae1
Revises: e91df4e935ef
Create Date: 2024-03-20 18:53:32.461518
"""
from alembic import op
import sqlalchemy as sa
# revision identifiers, used by Alembic.
revision = "4738e4b3bae1"
down_revision = "e91df4e935ef"
branch_labels: None = None
depends_on: None = None
def upgrade() -> None:
op.create_table(
"file_store",
sa.Column("file_name", sa.String(), nullable=False),
sa.Column("lobj_oid", sa.Integer(), nullable=False),
sa.PrimaryKeyConstraint("file_name"),
)
def downgrade() -> None:
op.drop_table("file_store")

@@ -1,49 +0,0 @@
"""Add display_model_names to llm_provider
Revision ID: 473a1a7ca408
Revises: 325975216eb3
Create Date: 2024-07-25 14:31:02.002917
"""
from alembic import op
import sqlalchemy as sa
from sqlalchemy.dialects import postgresql
# revision identifiers, used by Alembic.
revision = "473a1a7ca408"
down_revision = "325975216eb3"
branch_labels: None = None
depends_on: None = None
default_models_by_provider = {
"openai": ["gpt-4", "gpt-4o", "gpt-4o-mini"],
"bedrock": [
"meta.llama3-1-70b-instruct-v1:0",
"meta.llama3-1-8b-instruct-v1:0",
"anthropic.claude-3-opus-20240229-v1:0",
"mistral.mistral-large-2402-v1:0",
"anthropic.claude-3-5-sonnet-20240620-v1:0",
],
"anthropic": ["claude-3-opus-20240229", "claude-3-5-sonnet-20240620"],
}
def upgrade() -> None:
op.add_column(
"llm_provider",
sa.Column("display_model_names", postgresql.ARRAY(sa.String()), nullable=True),
)
connection = op.get_bind()
for provider, models in default_models_by_provider.items():
connection.execute(
sa.text(
"UPDATE llm_provider SET display_model_names = :models WHERE provider = :provider"
),
{"models": models, "provider": provider},
)
def downgrade() -> None:
op.drop_column("llm_provider", "display_model_names")

@@ -11,9 +11,9 @@ from sqlalchemy.dialects import postgresql
# revision identifiers, used by Alembic.
revision = "47433d30de82"
-down_revision: None = None
-branch_labels: None = None
-depends_on: None = None
+down_revision = None
+branch_labels = None
+depends_on = None
def upgrade() -> None:

@@ -1,23 +0,0 @@
"""Add name to api_key
Revision ID: 475fcefe8826
Revises: ecab2b3f1a3b
Create Date: 2024-04-11 11:05:18.414438
"""
from alembic import op
import sqlalchemy as sa
# revision identifiers, used by Alembic.
revision = "475fcefe8826"
down_revision = "ecab2b3f1a3b"
branch_labels: None = None
depends_on: None = None
def upgrade() -> None:
op.add_column("api_key", sa.Column("name", sa.String(), nullable=True))
def downgrade() -> None:
op.drop_column("api_key", "name")

@@ -1,61 +0,0 @@
"""Add support for custom tools
Revision ID: 48d14957fe80
Revises: b85f02ec1308
Create Date: 2024-06-09 14:58:19.946509
"""
from alembic import op
import fastapi_users_db_sqlalchemy
import sqlalchemy as sa
from sqlalchemy.dialects import postgresql
# revision identifiers, used by Alembic.
revision = "48d14957fe80"
down_revision = "b85f02ec1308"
branch_labels: None = None
depends_on: None = None
def upgrade() -> None:
op.add_column(
"tool",
sa.Column(
"openapi_schema",
postgresql.JSONB(astext_type=sa.Text()),
nullable=True,
),
)
op.add_column(
"tool",
sa.Column(
"user_id",
fastapi_users_db_sqlalchemy.generics.GUID(),
nullable=True,
),
)
op.create_foreign_key("tool_user_fk", "tool", "user", ["user_id"], ["id"])
op.create_table(
"tool_call",
sa.Column("id", sa.Integer(), primary_key=True),
sa.Column("tool_id", sa.Integer(), nullable=False),
sa.Column("tool_name", sa.String(), nullable=False),
sa.Column(
"tool_arguments", postgresql.JSONB(astext_type=sa.Text()), nullable=False
),
sa.Column(
"tool_result", postgresql.JSONB(astext_type=sa.Text()), nullable=False
),
sa.Column(
"message_id", sa.Integer(), sa.ForeignKey("chat_message.id"), nullable=False
),
)
def downgrade() -> None:
op.drop_table("tool_call")
op.drop_constraint("tool_user_fk", "tool", type_="foreignkey")
op.drop_column("tool", "user_id")
op.drop_column("tool", "openapi_schema")

@@ -1,80 +0,0 @@
"""Moved status to connector credential pair
Revision ID: 4a951134c801
Revises: 7477a5f5d728
Create Date: 2024-08-10 19:20:34.527559
"""
from alembic import op
import sqlalchemy as sa
# revision identifiers, used by Alembic.
revision = "4a951134c801"
down_revision = "7477a5f5d728"
branch_labels: None = None
depends_on: None = None
def upgrade() -> None:
op.add_column(
"connector_credential_pair",
sa.Column(
"status",
sa.Enum(
"ACTIVE",
"PAUSED",
"DELETING",
name="connectorcredentialpairstatus",
native_enum=False,
),
nullable=True,
),
)
# Update status of connector_credential_pair based on connector's disabled status
op.execute(
"""
UPDATE connector_credential_pair
SET status = CASE
WHEN (
SELECT disabled
FROM connector
WHERE connector.id = connector_credential_pair.connector_id
) = FALSE THEN 'ACTIVE'
ELSE 'PAUSED'
END
"""
)
# Make the status column not nullable after setting values
op.alter_column("connector_credential_pair", "status", nullable=False)
op.drop_column("connector", "disabled")
def downgrade() -> None:
op.add_column(
"connector",
sa.Column("disabled", sa.BOOLEAN(), autoincrement=False, nullable=True),
)
# Update disabled status of connector based on connector_credential_pair's status
op.execute(
"""
UPDATE connector
SET disabled = CASE
WHEN EXISTS (
SELECT 1
FROM connector_credential_pair
WHERE connector_credential_pair.connector_id = connector.id
AND connector_credential_pair.status = 'ACTIVE'
) THEN FALSE
ELSE TRUE
END
"""
)
# Make the disabled column not nullable after setting values
op.alter_column("connector", "disabled", nullable=False)
op.drop_column("connector_credential_pair", "status")

@@ -1,72 +0,0 @@
"""Add type to credentials
Revision ID: 4ea2c93919c1
Revises: 473a1a7ca408
Create Date: 2024-07-18 13:07:13.655895
"""
from alembic import op
import sqlalchemy as sa
# revision identifiers, used by Alembic.
revision = "4ea2c93919c1"
down_revision = "473a1a7ca408"
branch_labels: None = None
depends_on: None = None
def upgrade() -> None:
# Add the new 'source' column to the 'credential' table
op.add_column(
"credential",
sa.Column(
"source",
sa.String(length=100), # Use String instead of Enum
nullable=True, # Initially allow NULL values
),
)
op.add_column(
"credential",
sa.Column(
"name",
sa.String(),
nullable=True,
),
)
# Create a temporary table that maps each credential to a single connector source.
# This is needed because a credential can be associated with multiple connectors,
# but we want to assign a single source to each credential.
# We use DISTINCT ON to ensure we only get one row per credential_id.
op.execute(
"""
CREATE TEMPORARY TABLE temp_connector_credential AS
SELECT DISTINCT ON (cc.credential_id)
cc.credential_id,
c.source AS connector_source
FROM connector_credential_pair cc
JOIN connector c ON cc.connector_id = c.id
"""
)
# Update the 'source' column in the 'credential' table
op.execute(
"""
UPDATE credential cred
SET source = COALESCE(
(SELECT connector_source
FROM temp_connector_credential temp
WHERE cred.id = temp.credential_id),
'NOT_APPLICABLE'
)
"""
)
# If no exception was raised, alter the column
op.alter_column("credential", "source", nullable=True) # TODO modify
# # ### end Alembic commands ###
def downgrade() -> None:
op.drop_column("credential", "source")
op.drop_column("credential", "name")

@@ -1,28 +0,0 @@
"""Add additional retrieval controls to Persona
Revision ID: 50b683a8295c
Revises: 7da0ae5ad583
Create Date: 2023-11-27 17:23:29.668422
"""
from alembic import op
import sqlalchemy as sa
# revision identifiers, used by Alembic.
revision = "50b683a8295c"
down_revision = "7da0ae5ad583"
branch_labels: None = None
depends_on: None = None
def upgrade() -> None:
op.add_column("persona", sa.Column("num_chunks", sa.Integer(), nullable=True))
op.add_column(
"persona",
sa.Column("apply_llm_relevance_filter", sa.Boolean(), nullable=True),
)
def downgrade() -> None:
op.drop_column("persona", "apply_llm_relevance_filter")
op.drop_column("persona", "num_chunks")

@@ -1,27 +0,0 @@
"""Track Danswerbot Explicitly
Revision ID: 570282d33c49
Revises: 7547d982db8f
Create Date: 2024-05-04 17:49:28.568109
"""
from alembic import op
import sqlalchemy as sa
# revision identifiers, used by Alembic.
revision = "570282d33c49"
down_revision = "7547d982db8f"
branch_labels: None = None
depends_on: None = None
def upgrade() -> None:
op.add_column(
"chat_session", sa.Column("danswerbot_flow", sa.Boolean(), nullable=True)
)
op.execute("UPDATE chat_session SET danswerbot_flow = one_shot")
op.alter_column("chat_session", "danswerbot_flow", nullable=False)
def downgrade() -> None:
op.drop_column("chat_session", "danswerbot_flow")

@@ -12,8 +12,8 @@ import sqlalchemy as sa
# revision identifiers, used by Alembic.
revision = "57b53544726e"
down_revision = "800f48024ae9"
-branch_labels: None = None
-depends_on: None = None
+branch_labels = None
+depends_on = None
def upgrade() -> None:

@@ -13,8 +13,8 @@ import sqlalchemy as sa
# revision identifiers, used by Alembic.
revision = "5809c0787398"
down_revision = "d929f0c1c6af"
-branch_labels: None = None
-depends_on: None = None
+branch_labels = None
+depends_on = None
def upgrade() -> None:

@@ -12,8 +12,8 @@ import sqlalchemy as sa
# revision identifiers, used by Alembic.
revision = "5e84129c8be3"
down_revision = "e6a4bbc13fe4"
-branch_labels: None = None
-depends_on: None = None
+branch_labels = None
+depends_on = None
def upgrade() -> None:

@@ -1,27 +0,0 @@
"""add removed documents to index_attempt
Revision ID: 5f4b8568a221
Revises: dbaa756c2ccf
Create Date: 2024-02-16 15:02:03.319907
"""
from alembic import op
import sqlalchemy as sa
# revision identifiers, used by Alembic.
revision = "5f4b8568a221"
down_revision = "8987770549c0"
branch_labels: None = None
depends_on: None = None
def upgrade() -> None:
op.add_column(
"index_attempt",
sa.Column("docs_removed_from_index", sa.Integer()),
)
op.execute("UPDATE index_attempt SET docs_removed_from_index = 0")
def downgrade() -> None:
op.drop_column("index_attempt", "docs_removed_from_index")

@@ -1,25 +0,0 @@
"""hybrid-enum
Revision ID: 5fc1f54cc252
Revises: 1d6ad76d1f37
Create Date: 2024-08-06 15:35:40.278485
"""
from alembic import op
import sqlalchemy as sa
# revision identifiers, used by Alembic.
revision = "5fc1f54cc252"
down_revision = "1d6ad76d1f37"
branch_labels: None = None
depends_on: None = None
def upgrade() -> None:
op.drop_column("persona", "search_type")
def downgrade() -> None:
op.add_column("persona", sa.Column("search_type", sa.String(), nullable=True))
op.execute("UPDATE persona SET search_type = 'SEMANTIC'")
op.alter_column("persona", "search_type", nullable=False)

@@ -1,45 +0,0 @@
"""Add user-configured names to LLMProvider
Revision ID: 643a84a42a33
Revises: 0a98909f2757
Create Date: 2024-05-07 14:54:55.493100
"""
from alembic import op
import sqlalchemy as sa
# revision identifiers, used by Alembic.
revision = "643a84a42a33"
down_revision = "0a98909f2757"
branch_labels: None = None
depends_on: None = None
def upgrade() -> None:
op.add_column("llm_provider", sa.Column("provider", sa.String(), nullable=True))
# move "name" -> "provider" to match the new schema
op.execute("UPDATE llm_provider SET provider = name")
# pretty up display name
op.execute("UPDATE llm_provider SET name = 'OpenAI' WHERE name = 'openai'")
op.execute("UPDATE llm_provider SET name = 'Anthropic' WHERE name = 'anthropic'")
op.execute("UPDATE llm_provider SET name = 'Azure OpenAI' WHERE name = 'azure'")
op.execute("UPDATE llm_provider SET name = 'AWS Bedrock' WHERE name = 'bedrock'")
# update personas to use the new provider names
op.execute(
"UPDATE persona SET llm_model_provider_override = 'OpenAI' WHERE llm_model_provider_override = 'openai'"
)
op.execute(
"UPDATE persona SET llm_model_provider_override = 'Anthropic' WHERE llm_model_provider_override = 'anthropic'"
)
op.execute(
"UPDATE persona SET llm_model_provider_override = 'Azure OpenAI' WHERE llm_model_provider_override = 'azure'"
)
op.execute(
"UPDATE persona SET llm_model_provider_override = 'AWS Bedrock' WHERE llm_model_provider_override = 'bedrock'"
)
def downgrade() -> None:
op.execute("UPDATE llm_provider SET name = provider")
op.drop_column("llm_provider", "provider")

@@ -13,8 +13,8 @@ from sqlalchemy.dialects import postgresql
# revision identifiers, used by Alembic.
revision = "6d387b3196c2"
down_revision = "47433d30de82"
-branch_labels: None = None
-depends_on: None = None
+branch_labels = None
+depends_on = None
def upgrade() -> None:

@@ -1,83 +0,0 @@
"""Add TokenRateLimit Tables
Revision ID: 703313b75876
Revises: fad14119fb92
Create Date: 2024-04-15 01:36:02.952809
"""
import json
from typing import cast
from alembic import op
import sqlalchemy as sa
from danswer.dynamic_configs.factory import get_dynamic_config_store
# revision identifiers, used by Alembic.
revision = "703313b75876"
down_revision = "fad14119fb92"
branch_labels: None = None
depends_on: None = None
def upgrade() -> None:
op.create_table(
"token_rate_limit",
sa.Column("id", sa.Integer(), nullable=False),
sa.Column("enabled", sa.Boolean(), nullable=False),
sa.Column("token_budget", sa.Integer(), nullable=False),
sa.Column("period_hours", sa.Integer(), nullable=False),
sa.Column(
"scope",
sa.String(length=10),
nullable=False,
),
sa.Column(
"created_at",
sa.DateTime(timezone=True),
server_default=sa.text("now()"),
nullable=False,
),
sa.PrimaryKeyConstraint("id"),
)
op.create_table(
"token_rate_limit__user_group",
sa.Column("rate_limit_id", sa.Integer(), nullable=False),
sa.Column("user_group_id", sa.Integer(), nullable=False),
sa.ForeignKeyConstraint(
["rate_limit_id"],
["token_rate_limit.id"],
),
sa.ForeignKeyConstraint(
["user_group_id"],
["user_group.id"],
),
sa.PrimaryKeyConstraint("rate_limit_id", "user_group_id"),
)
try:
settings_json = cast(
str, get_dynamic_config_store().load("token_budget_settings")
)
settings = json.loads(settings_json)
is_enabled = settings.get("enable_token_budget", False)
token_budget = settings.get("token_budget", -1)
period_hours = settings.get("period_hours", -1)
if is_enabled and token_budget > 0 and period_hours > 0:
op.execute(
f"INSERT INTO token_rate_limit \
(enabled, token_budget, period_hours, scope) VALUES \
({is_enabled}, {token_budget}, {period_hours}, 'GLOBAL')"
)
# Delete the dynamic config
get_dynamic_config_store().delete("token_budget_settings")
except Exception:
# Ignore if the dynamic config is not found
pass
def downgrade() -> None:
op.drop_table("token_rate_limit__user_group")
op.drop_table("token_rate_limit")

@@ -1,68 +0,0 @@
"""More Descriptive Filestore
Revision ID: 70f00c45c0f2
Revises: 3879338f8ba1
Create Date: 2024-05-17 17:51:41.926893
"""
from alembic import op
import sqlalchemy as sa
from sqlalchemy.dialects import postgresql
# revision identifiers, used by Alembic.
revision = "70f00c45c0f2"
down_revision = "3879338f8ba1"
branch_labels: None = None
depends_on: None = None
def upgrade() -> None:
op.add_column("file_store", sa.Column("display_name", sa.String(), nullable=True))
op.add_column(
"file_store",
sa.Column(
"file_origin",
sa.String(),
nullable=False,
server_default="connector", # Default to connector
),
)
op.add_column(
"file_store",
sa.Column(
"file_type", sa.String(), nullable=False, server_default="text/plain"
),
)
op.add_column(
"file_store",
sa.Column(
"file_metadata",
postgresql.JSONB(astext_type=sa.Text()),
nullable=True,
),
)
op.execute(
"""
UPDATE file_store
SET file_origin = CASE
WHEN file_name LIKE 'chat__%' THEN 'chat_upload'
ELSE 'connector'
END,
file_name = CASE
WHEN file_name LIKE 'chat__%' THEN SUBSTR(file_name, 7)
ELSE file_name
END,
file_type = CASE
WHEN file_name LIKE 'chat__%' THEN 'image/png'
ELSE 'text/plain'
END
"""
)
def downgrade() -> None:
op.drop_column("file_store", "file_metadata")
op.drop_column("file_store", "file_type")
op.drop_column("file_store", "file_origin")
op.drop_column("file_store", "display_name")

@@ -1,81 +0,0 @@
"""Permission Auto Sync Framework
Revision ID: 72bdc9929a46
Revises: 475fcefe8826
Create Date: 2024-04-14 21:15:28.659634
"""
from alembic import op
import sqlalchemy as sa
# revision identifiers, used by Alembic.
revision = "72bdc9929a46"
down_revision = "475fcefe8826"
branch_labels: None = None
depends_on: None = None
def upgrade() -> None:
op.create_table(
"email_to_external_user_cache",
sa.Column("id", sa.Integer(), nullable=False),
sa.Column("external_user_id", sa.String(), nullable=False),
sa.Column("user_id", sa.UUID(), nullable=True),
sa.Column("user_email", sa.String(), nullable=False),
sa.ForeignKeyConstraint(
["user_id"],
["user.id"],
),
sa.PrimaryKeyConstraint("id"),
)
op.create_table(
"external_permission",
sa.Column("id", sa.Integer(), nullable=False),
sa.Column("user_id", sa.UUID(), nullable=True),
sa.Column("user_email", sa.String(), nullable=False),
sa.Column(
"source_type",
sa.String(),
nullable=False,
),
sa.Column("external_permission_group", sa.String(), nullable=False),
sa.ForeignKeyConstraint(
["user_id"],
["user.id"],
),
sa.PrimaryKeyConstraint("id"),
)
op.create_table(
"permission_sync_run",
sa.Column("id", sa.Integer(), nullable=False),
sa.Column(
"source_type",
sa.String(),
nullable=False,
),
sa.Column("update_type", sa.String(), nullable=False),
sa.Column("cc_pair_id", sa.Integer(), nullable=True),
sa.Column(
"status",
sa.String(),
nullable=False,
),
sa.Column("error_msg", sa.Text(), nullable=True),
sa.Column(
"updated_at",
sa.DateTime(timezone=True),
server_default=sa.text("now()"),
nullable=False,
),
sa.ForeignKeyConstraint(
["cc_pair_id"],
["connector_credential_pair.id"],
),
sa.PrimaryKeyConstraint("id"),
)
def downgrade() -> None:
op.drop_table("permission_sync_run")
op.drop_table("external_permission")
op.drop_table("email_to_external_user_cache")

@@ -1,24 +0,0 @@
"""Added model defaults for users
Revision ID: 7477a5f5d728
Revises: 213fd978c6d8
Create Date: 2024-08-04 19:00:04.512634
"""
from alembic import op
import sqlalchemy as sa
# revision identifiers, used by Alembic.
revision = "7477a5f5d728"
down_revision = "213fd978c6d8"
branch_labels: None = None
depends_on: None = None
def upgrade() -> None:
op.add_column("user", sa.Column("default_model", sa.Text(), nullable=True))
def downgrade() -> None:
op.drop_column("user", "default_model")

@@ -1,51 +0,0 @@
"""Chat Folders
Revision ID: 7547d982db8f
Revises: ef7da92f7213
Create Date: 2024-05-02 15:18:56.573347
"""
from alembic import op
import sqlalchemy as sa
import fastapi_users_db_sqlalchemy
# revision identifiers, used by Alembic.
revision = "7547d982db8f"
down_revision = "ef7da92f7213"
branch_labels: None = None
depends_on: None = None
def upgrade() -> None:
op.create_table(
"chat_folder",
sa.Column("id", sa.Integer(), nullable=False),
sa.Column(
"user_id",
fastapi_users_db_sqlalchemy.generics.GUID(),
nullable=True,
),
sa.Column("name", sa.String(), nullable=True),
sa.Column("display_priority", sa.Integer(), nullable=False),
sa.ForeignKeyConstraint(
["user_id"],
["user.id"],
),
sa.PrimaryKeyConstraint("id"),
)
op.add_column("chat_session", sa.Column("folder_id", sa.Integer(), nullable=True))
op.create_foreign_key(
"chat_session_chat_folder_fk",
"chat_session",
"chat_folder",
["folder_id"],
["id"],
)
def downgrade() -> None:
op.drop_constraint(
"chat_session_chat_folder_fk", "chat_session", type_="foreignkey"
)
op.drop_column("chat_session", "folder_id")
op.drop_table("chat_folder")

@@ -12,8 +12,8 @@ import sqlalchemy as sa
# revision identifiers, used by Alembic.
revision = "767f1c2a00eb"
down_revision = "dba7f71618f5"
-branch_labels: None = None
-depends_on: None = None
+branch_labels = None
+depends_on = None
def upgrade() -> None:

@@ -1,36 +0,0 @@
"""CC-Pair Name not Unique
Revision ID: 76b60d407dfb
Revises: b156fa702355
Create Date: 2023-12-22 21:42:10.018804
"""
from alembic import op
import sqlalchemy as sa
# revision identifiers, used by Alembic.
revision = "76b60d407dfb"
down_revision = "b156fa702355"
branch_labels: None = None
depends_on: None = None
def upgrade() -> None:
op.execute("DELETE FROM connector_credential_pair WHERE name IS NULL")
op.drop_constraint(
"connector_credential_pair__name__key",
"connector_credential_pair",
type_="unique",
)
op.alter_column(
"connector_credential_pair", "name", existing_type=sa.String(), nullable=False
)
def downgrade() -> None:
op.create_unique_constraint(
"connector_credential_pair__name__key", "connector_credential_pair", ["name"]
)
op.alter_column(
"connector_credential_pair", "name", existing_type=sa.String(), nullable=True
)

@@ -1,71 +0,0 @@
"""Remove Remaining Enums
Revision ID: 776b3bbe9092
Revises: 4738e4b3bae1
Create Date: 2024-03-22 21:34:27.629444
"""
from alembic import op
import sqlalchemy as sa
from danswer.db.models import IndexModelStatus
from danswer.search.enums import RecencyBiasSetting
from danswer.search.models import SearchType
# revision identifiers, used by Alembic.
revision = "776b3bbe9092"
down_revision = "4738e4b3bae1"
branch_labels: None = None
depends_on: None = None
def upgrade() -> None:
op.alter_column(
"persona",
"search_type",
type_=sa.String,
existing_type=sa.Enum(SearchType, native_enum=False),
existing_nullable=False,
)
op.alter_column(
"persona",
"recency_bias",
type_=sa.String,
existing_type=sa.Enum(RecencyBiasSetting, native_enum=False),
existing_nullable=False,
)
# Because the indexmodelstatus enum does not have a mapping to a string type
# we need this workaround instead of directly changing the type
op.add_column("embedding_model", sa.Column("temp_status", sa.String))
op.execute("UPDATE embedding_model SET temp_status = status::text")
op.drop_column("embedding_model", "status")
op.alter_column("embedding_model", "temp_status", new_column_name="status")
op.execute("DROP TYPE IF EXISTS searchtype")
op.execute("DROP TYPE IF EXISTS recencybiassetting")
op.execute("DROP TYPE IF EXISTS indexmodelstatus")
def downgrade() -> None:
op.alter_column(
"persona",
"search_type",
type_=sa.Enum(SearchType, native_enum=False),
existing_type=sa.String(length=50),
existing_nullable=False,
)
op.alter_column(
"persona",
"recency_bias",
type_=sa.Enum(RecencyBiasSetting, native_enum=False),
existing_type=sa.String(length=50),
existing_nullable=False,
)
op.alter_column(
"embedding_model",
"status",
type_=sa.Enum(IndexModelStatus, native_enum=False),
existing_type=sa.String(length=50),
existing_nullable=False,
)
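The temp-column shuffle is needed only for embedding_model.status, which was a native Postgres enum; the two persona columns were created with native_enum=False and are already VARCHAR underneath, so a plain alter_column suffices. A one-statement alternative for the enum case is an explicit USING cast, as in this Postgres-only sketch:

# Sketch: convert a native enum column to text in place (Postgres only).
op.execute(
    "ALTER TABLE embedding_model ALTER COLUMN status TYPE varchar USING status::text"
)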

@@ -12,8 +12,8 @@ from sqlalchemy import String
# revision identifiers, used by Alembic.
revision = "77d07dffae64"
down_revision = "d61e513bef0a"
-branch_labels: None = None
-depends_on: None = None
+branch_labels = None
+depends_on = None
def upgrade() -> None:

@@ -11,8 +11,8 @@ import sqlalchemy as sa
# revision identifiers, used by Alembic.
revision = "78dbe7e38469"
down_revision = "7ccea01261f6"
-branch_labels: None = None
-depends_on: None = None
+branch_labels = None
+depends_on = None
def upgrade() -> None:

@@ -1,41 +0,0 @@
"""add_llm_group_permissions_control
Revision ID: 795b20b85b4b
Revises: 05c07bf07c00
Create Date: 2024-07-19 11:54:35.701558
"""
from alembic import op
import sqlalchemy as sa
revision = "795b20b85b4b"
down_revision = "05c07bf07c00"
branch_labels: None = None
depends_on: None = None
def upgrade() -> None:
op.create_table(
"llm_provider__user_group",
sa.Column("llm_provider_id", sa.Integer(), nullable=False),
sa.Column("user_group_id", sa.Integer(), nullable=False),
sa.ForeignKeyConstraint(
["llm_provider_id"],
["llm_provider.id"],
),
sa.ForeignKeyConstraint(
["user_group_id"],
["user_group.id"],
),
sa.PrimaryKeyConstraint("llm_provider_id", "user_group_id"),
)
op.add_column(
"llm_provider",
sa.Column("is_public", sa.Boolean(), nullable=False, server_default="true"),
)
def downgrade() -> None:
op.drop_table("llm_provider__user_group")
op.drop_column("llm_provider", "is_public")

@@ -1,48 +0,0 @@
"""Add api_key table
Revision ID: 79acd316403a
Revises: 904e5138fffb
Create Date: 2024-01-11 17:56:37.934381
"""
from alembic import op
import fastapi_users_db_sqlalchemy
import sqlalchemy as sa
# revision identifiers, used by Alembic.
revision = "79acd316403a"
down_revision = "904e5138fffb"
branch_labels: None = None
depends_on: None = None
def upgrade() -> None:
op.create_table(
"api_key",
sa.Column("id", sa.Integer(), nullable=False),
sa.Column("hashed_api_key", sa.String(), nullable=False),
sa.Column("api_key_display", sa.String(), nullable=False),
sa.Column(
"user_id",
fastapi_users_db_sqlalchemy.generics.GUID(),
nullable=False,
),
sa.Column(
"owner_id",
fastapi_users_db_sqlalchemy.generics.GUID(),
nullable=True,
),
sa.Column(
"created_at",
sa.DateTime(timezone=True),
server_default=sa.text("now()"),
nullable=False,
),
sa.PrimaryKeyConstraint("id"),
sa.UniqueConstraint("api_key_display"),
sa.UniqueConstraint("hashed_api_key"),
)
def downgrade() -> None:
op.drop_table("api_key")

@@ -1,35 +0,0 @@
"""added slack_auto_filter
Revision ID: 7aea705850d5
Revises: 4505fd7302e1
Create Date: 2024-07-10 11:01:23.581015
"""
from alembic import op
import sqlalchemy as sa
revision = "7aea705850d5"
down_revision = "4505fd7302e1"
branch_labels: None = None
depends_on: None = None
def upgrade() -> None:
op.add_column(
"slack_bot_config",
sa.Column("enable_auto_filters", sa.Boolean(), nullable=True),
)
op.execute(
"UPDATE slack_bot_config SET enable_auto_filters = FALSE WHERE enable_auto_filters IS NULL"
)
op.alter_column(
"slack_bot_config",
"enable_auto_filters",
existing_type=sa.Boolean(),
nullable=False,
server_default=sa.false(),
)
def downgrade() -> None:
op.drop_column("slack_bot_config", "enable_auto_filters")

@@ -12,8 +12,8 @@ from sqlalchemy.dialects import postgresql
# revision identifiers, used by Alembic.
revision = "7ccea01261f6"
down_revision = "a570b80a5f20"
-branch_labels: None = None
-depends_on: None = None
+branch_labels = None
+depends_on = None
def upgrade() -> None:

@@ -1,23 +0,0 @@
"""Add description to persona
Revision ID: 7da0ae5ad583
Revises: e86866a9c78a
Create Date: 2023-11-27 00:16:19.959414
"""
from alembic import op
import sqlalchemy as sa
# revision identifiers, used by Alembic.
revision = "7da0ae5ad583"
down_revision = "e86866a9c78a"
branch_labels: None = None
depends_on: None = None
def upgrade() -> None:
op.add_column("persona", sa.Column("description", sa.String(), nullable=True))
def downgrade() -> None:
op.drop_column("persona", "description")

@@ -12,8 +12,8 @@ from sqlalchemy.dialects import postgresql
# revision identifiers, used by Alembic.
revision = "7da543f5672f"
down_revision = "febe9eaa0644"
-branch_labels: None = None
-depends_on: None = None
+branch_labels = None
+depends_on = None
def upgrade() -> None:

@@ -1,26 +0,0 @@
"""Slack Followup
Revision ID: 7f726bad5367
Revises: 79acd316403a
Create Date: 2024-01-15 00:19:55.991224
"""
from alembic import op
import sqlalchemy as sa
# revision identifiers, used by Alembic.
revision = "7f726bad5367"
down_revision = "79acd316403a"
branch_labels: None = None
depends_on: None = None
def upgrade() -> None:
op.add_column(
"chat_feedback",
sa.Column("required_followup", sa.Boolean(), nullable=True),
)
def downgrade() -> None:
op.drop_column("chat_feedback", "required_followup")

@@ -11,8 +11,8 @@ from alembic import op
# revision identifiers, used by Alembic.
revision = "7f99be1cb9f5"
down_revision = "78dbe7e38469"
-branch_labels: None = None
-depends_on: None = None
+branch_labels = None
+depends_on = None
def upgrade() -> None:

@@ -12,8 +12,8 @@ from sqlalchemy.schema import Sequence, CreateSequence
# revision identifiers, used by Alembic.
revision = "800f48024ae9"
down_revision = "767f1c2a00eb"
-branch_labels: None = None
-depends_on: None = None
+branch_labels = None
+depends_on = None
def upgrade() -> None:

@@ -1,36 +0,0 @@
"""Add chat session to query_event
Revision ID: 80696cf850ae
Revises: 15326fcec57e
Create Date: 2023-11-26 02:38:35.008070
"""
from alembic import op
import sqlalchemy as sa
# revision identifiers, used by Alembic.
revision = "80696cf850ae"
down_revision = "15326fcec57e"
branch_labels: None = None
depends_on: None = None
def upgrade() -> None:
op.add_column(
"query_event",
sa.Column("chat_session_id", sa.Integer(), nullable=True),
)
op.create_foreign_key(
"fk_query_event_chat_session_id",
"query_event",
"chat_session",
["chat_session_id"],
["id"],
)
def downgrade() -> None:
op.drop_constraint(
"fk_query_event_chat_session_id", "query_event", type_="foreignkey"
)
op.drop_column("query_event", "chat_session_id")

@@ -1,34 +0,0 @@
"""Add is_visible to Persona
Revision ID: 891cd83c87a8
Revises: 76b60d407dfb
Create Date: 2023-12-21 11:55:54.132279
"""
from alembic import op
import sqlalchemy as sa
# revision identifiers, used by Alembic.
revision = "891cd83c87a8"
down_revision = "76b60d407dfb"
branch_labels: None = None
depends_on: None = None
def upgrade() -> None:
op.add_column(
"persona",
sa.Column("is_visible", sa.Boolean(), nullable=True),
)
op.execute("UPDATE persona SET is_visible = true")
op.alter_column("persona", "is_visible", nullable=False)
op.add_column(
"persona",
sa.Column("display_priority", sa.Integer(), nullable=True),
)
def downgrade() -> None:
op.drop_column("persona", "is_visible")
op.drop_column("persona", "display_priority")

@@ -1,25 +0,0 @@
"""Add full exception stack trace
Revision ID: 8987770549c0
Revises: ec3ec2eabf7b
Create Date: 2024-02-10 19:31:28.339135
"""
from alembic import op
import sqlalchemy as sa
# revision identifiers, used by Alembic.
revision = "8987770549c0"
down_revision = "ec3ec2eabf7b"
branch_labels: None = None
depends_on: None = None
def upgrade() -> None:
op.add_column(
"index_attempt", sa.Column("full_exception_trace", sa.Text(), nullable=True)
)
def downgrade() -> None:
op.drop_column("index_attempt", "full_exception_trace")

@@ -1,103 +0,0 @@
"""associate index attempts with ccpair
Revision ID: 8a87bd6ec550
Revises: 4ea2c93919c1
Create Date: 2024-07-22 15:15:52.558451
"""
from alembic import op
import sqlalchemy as sa
# revision identifiers, used by Alembic.
revision = "8a87bd6ec550"
down_revision = "4ea2c93919c1"
branch_labels: None = None
depends_on: None = None
def upgrade() -> None:
# Add the new connector_credential_pair_id column
op.add_column(
"index_attempt",
sa.Column("connector_credential_pair_id", sa.Integer(), nullable=True),
)
# Create a foreign key constraint to the connector_credential_pair table
op.create_foreign_key(
"fk_index_attempt_connector_credential_pair_id",
"index_attempt",
"connector_credential_pair",
["connector_credential_pair_id"],
["id"],
)
# Populate the new connector_credential_pair_id column using existing connector_id and credential_id
op.execute(
"""
UPDATE index_attempt ia
SET connector_credential_pair_id =
CASE
WHEN ia.credential_id IS NULL THEN
(SELECT id FROM connector_credential_pair
WHERE connector_id = ia.connector_id
LIMIT 1)
ELSE
(SELECT id FROM connector_credential_pair
WHERE connector_id = ia.connector_id
AND credential_id = ia.credential_id)
END
WHERE ia.connector_id IS NOT NULL
"""
)
# Make the new connector_credential_pair_id column non-nullable
op.alter_column("index_attempt", "connector_credential_pair_id", nullable=False)
# Drop the old connector_id and credential_id columns
op.drop_column("index_attempt", "connector_id")
op.drop_column("index_attempt", "credential_id")
# Update the index to use connector_credential_pair_id
op.create_index(
"ix_index_attempt_latest_for_connector_credential_pair",
"index_attempt",
["connector_credential_pair_id", "time_created"],
)
def downgrade() -> None:
# Add back the old connector_id and credential_id columns
op.add_column(
"index_attempt", sa.Column("connector_id", sa.Integer(), nullable=True)
)
op.add_column(
"index_attempt", sa.Column("credential_id", sa.Integer(), nullable=True)
)
# Populate the old connector_id and credential_id columns using the connector_credential_pair_id
op.execute(
"""
UPDATE index_attempt ia
SET connector_id = ccp.connector_id, credential_id = ccp.credential_id
FROM connector_credential_pair ccp
WHERE ia.connector_credential_pair_id = ccp.id
"""
)
# Make the old connector_id and credential_id columns non-nullable
op.alter_column("index_attempt", "connector_id", nullable=False)
op.alter_column("index_attempt", "credential_id", nullable=False)
# Drop the new connector_credential_pair_id column
op.drop_constraint(
"fk_index_attempt_connector_credential_pair_id",
"index_attempt",
type_="foreignkey",
)
op.drop_column("index_attempt", "connector_credential_pair_id")
op.create_index(
"ix_index_attempt_latest_for_connector_credential_pair",
"index_attempt",
["connector_id", "credential_id", "time_created"],
)
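The backfill CASE above resolves legacy rows whose credential_id is NULL by taking an arbitrary pair for the connector (LIMIT 1 with no ORDER BY); any index_attempt row that matches no pair at all stays NULL, and the subsequent NOT NULL alter then aborts the migration. A defensive preflight sketch, to run just before that alter_column:

# Sketch: count unresolved rows before tightening the constraint, so a
# failure is an explicit message rather than a NOT NULL violation.
conn = op.get_bind()
orphaned = conn.execute(
    sa.text(
        "SELECT COUNT(*) FROM index_attempt "
        "WHERE connector_credential_pair_id IS NULL"
    )
).scalar()
if orphaned:
    raise RuntimeError(f"{orphaned} index_attempt rows match no cc pair")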

@@ -12,8 +12,8 @@ from sqlalchemy.dialects import postgresql
# revision identifiers, used by Alembic.
revision = "8aabb57f3b49"
down_revision = "5e84129c8be3"
-branch_labels: None = None
-depends_on: None = None
+branch_labels = None
+depends_on = None
def upgrade() -> None:

@@ -12,8 +12,8 @@ import sqlalchemy as sa
# revision identifiers, used by Alembic.
revision = "8e26726b7683"
down_revision = "5809c0787398"
-branch_labels: None = None
-depends_on: None = None
+branch_labels = None
+depends_on = None
def upgrade() -> None:

@@ -12,8 +12,8 @@ from sqlalchemy.dialects import postgresql
# revision identifiers, used by Alembic.
revision = "904451035c9b"
down_revision = "3b25685ff73c"
-branch_labels: None = None
-depends_on: None = None
+branch_labels = None
+depends_on = None
def upgrade() -> None:

@@ -1,61 +0,0 @@
"""Tags
Revision ID: 904e5138fffb
Revises: 891cd83c87a8
Create Date: 2024-01-01 10:44:43.733974
"""
from alembic import op
import sqlalchemy as sa
from sqlalchemy.dialects import postgresql
# revision identifiers, used by Alembic.
revision = "904e5138fffb"
down_revision = "891cd83c87a8"
branch_labels: None = None
depends_on: None = None
def upgrade() -> None:
op.create_table(
"tag",
sa.Column("id", sa.Integer(), nullable=False),
sa.Column("tag_key", sa.String(), nullable=False),
sa.Column("tag_value", sa.String(), nullable=False),
sa.Column("source", sa.String(), nullable=False),
sa.PrimaryKeyConstraint("id"),
sa.UniqueConstraint(
"tag_key", "tag_value", "source", name="_tag_key_value_source_uc"
),
)
op.create_table(
"document__tag",
sa.Column("document_id", sa.String(), nullable=False),
sa.Column("tag_id", sa.Integer(), nullable=False),
sa.ForeignKeyConstraint(
["document_id"],
["document.id"],
),
sa.ForeignKeyConstraint(
["tag_id"],
["tag.id"],
),
sa.PrimaryKeyConstraint("document_id", "tag_id"),
)
op.add_column(
"search_doc",
sa.Column(
"doc_metadata",
postgresql.JSONB(astext_type=sa.Text()),
nullable=True,
),
)
op.execute("UPDATE search_doc SET doc_metadata = '{}' WHERE doc_metadata IS NULL")
op.alter_column("search_doc", "doc_metadata", nullable=False)
def downgrade() -> None:
op.drop_table("document__tag")
op.drop_table("tag")
op.drop_column("search_doc", "doc_metadata")

@@ -1,36 +0,0 @@
"""Remove DocumentSource from Tag
Revision ID: 91fd3b470d1a
Revises: 173cae5bba26
Create Date: 2024-03-21 12:05:23.956734
"""
from alembic import op
import sqlalchemy as sa
from danswer.configs.constants import DocumentSource
# revision identifiers, used by Alembic.
revision = "91fd3b470d1a"
down_revision = "173cae5bba26"
branch_labels: None = None
depends_on: None = None
def upgrade() -> None:
op.alter_column(
"tag",
"source",
type_=sa.String(length=50),
existing_type=sa.Enum(DocumentSource, native_enum=False),
existing_nullable=False,
)
def downgrade() -> None:
op.alter_column(
"tag",
"source",
type_=sa.Enum(DocumentSource, native_enum=False),
existing_type=sa.String(length=50),
existing_nullable=False,
)

@@ -1,26 +0,0 @@
"""add expiry time
Revision ID: 91ffac7e65b3
Revises: bc9771dccadf
Create Date: 2024-06-24 09:39:56.462242
"""
from alembic import op
import sqlalchemy as sa
# revision identifiers, used by Alembic.
revision = "91ffac7e65b3"
down_revision = "795b20b85b4b"
branch_labels: None = None
depends_on: None = None
def upgrade() -> None:
op.add_column(
"user", sa.Column("oidc_expiry", sa.DateTime(timezone=True), nullable=True)
)
def downgrade() -> None:
op.drop_column("user", "oidc_expiry")

@@ -12,8 +12,8 @@ from sqlalchemy.dialects import postgresql
# revision identifiers, used by Alembic.
revision = "9d97fecfab7f"
down_revision = "ffc707a226b4"
-branch_labels: None = None
-depends_on: None = None
+branch_labels = None
+depends_on = None
def upgrade() -> None:

@@ -1,27 +0,0 @@
"""Add chosen_assistants to User table
Revision ID: a3bfd0d64902
Revises: ec85f2b3c544
Create Date: 2024-05-26 17:22:24.834741
"""
from alembic import op
import sqlalchemy as sa
from sqlalchemy.dialects import postgresql
# revision identifiers, used by Alembic.
revision = "a3bfd0d64902"
down_revision = "ec85f2b3c544"
branch_labels: None = None
depends_on: None = None
def upgrade() -> None:
op.add_column(
"user",
sa.Column("chosen_assistants", postgresql.ARRAY(sa.Integer()), nullable=True),
)
def downgrade() -> None:
op.drop_column("user", "chosen_assistants")

@@ -12,8 +12,8 @@ import sqlalchemy as sa
# revision identifiers, used by Alembic.
revision = "a570b80a5f20"
down_revision = "904451035c9b"
-branch_labels: None = None
-depends_on: None = None
+branch_labels = None
+depends_on = None
def upgrade() -> None:

@@ -12,8 +12,8 @@ import sqlalchemy as sa
# revision identifiers, used by Alembic.
revision = "ae62505e3acc"
down_revision = "7da543f5672f"
-branch_labels: None = None
-depends_on: None = None
+branch_labels = None
+depends_on = None
def upgrade() -> None:

@@ -11,11 +11,12 @@ from sqlalchemy.dialects import postgresql
# revision identifiers, used by Alembic.
revision = "b082fec533f0"
down_revision = "df0c7ad8a076"
-branch_labels: None = None
-depends_on: None = None
+branch_labels = None
+depends_on = None
def upgrade() -> None:
# ### commands auto generated by Alembic - please adjust! ###
op.alter_column(
"connector_credential_pair",
"last_attempt_status",
@@ -28,9 +29,11 @@ def upgrade() -> None:
),
nullable=True,
)
# ### end Alembic commands ###
def downgrade() -> None:
# ### commands auto generated by Alembic - please adjust! ###
op.alter_column(
"connector_credential_pair",
"last_attempt_status",
@@ -43,3 +46,4 @@ def downgrade() -> None:
),
nullable=False,
)
# ### end Alembic commands ###

@@ -1,520 +0,0 @@
"""Chat Reworked
Revision ID: b156fa702355
Revises: baf71f781b9e
Create Date: 2023-12-12 00:57:41.823371
"""
import fastapi_users_db_sqlalchemy
from alembic import op
import sqlalchemy as sa
from sqlalchemy.dialects import postgresql
from sqlalchemy.dialects.postgresql import ENUM
from danswer.configs.constants import DocumentSource
# revision identifiers, used by Alembic.
revision = "b156fa702355"
down_revision = "baf71f781b9e"
branch_labels: None = None
depends_on: None = None
searchtype_enum = ENUM(
"KEYWORD", "SEMANTIC", "HYBRID", name="searchtype", create_type=True
)
recencybiassetting_enum = ENUM(
"FAVOR_RECENT",
"BASE_DECAY",
"NO_DECAY",
"AUTO",
name="recencybiassetting",
create_type=True,
)
def upgrade() -> None:
bind = op.get_bind()
searchtype_enum.create(bind)
recencybiassetting_enum.create(bind)
# This is irrecoverable, whatever
op.execute("DELETE FROM chat_feedback")
op.execute("DELETE FROM document_retrieval_feedback")
op.create_table(
"search_doc",
sa.Column("id", sa.Integer(), nullable=False),
sa.Column("document_id", sa.String(), nullable=False),
sa.Column("chunk_ind", sa.Integer(), nullable=False),
sa.Column("semantic_id", sa.String(), nullable=False),
sa.Column("link", sa.String(), nullable=True),
sa.Column("blurb", sa.String(), nullable=False),
sa.Column("boost", sa.Integer(), nullable=False),
sa.Column(
"source_type",
sa.Enum(DocumentSource, native=False),
nullable=False,
),
sa.Column("hidden", sa.Boolean(), nullable=False),
sa.Column("score", sa.Float(), nullable=False),
sa.Column("match_highlights", postgresql.ARRAY(sa.String()), nullable=False),
sa.Column("updated_at", sa.DateTime(timezone=True), nullable=True),
sa.Column("primary_owners", postgresql.ARRAY(sa.String()), nullable=True),
sa.Column("secondary_owners", postgresql.ARRAY(sa.String()), nullable=True),
sa.PrimaryKeyConstraint("id"),
)
op.create_table(
"prompt",
sa.Column("id", sa.Integer(), nullable=False),
sa.Column(
"user_id",
fastapi_users_db_sqlalchemy.generics.GUID(),
nullable=True,
),
sa.Column("name", sa.String(), nullable=False),
sa.Column("description", sa.String(), nullable=False),
sa.Column("system_prompt", sa.Text(), nullable=False),
sa.Column("task_prompt", sa.Text(), nullable=False),
sa.Column("include_citations", sa.Boolean(), nullable=False),
sa.Column("datetime_aware", sa.Boolean(), nullable=False),
sa.Column("default_prompt", sa.Boolean(), nullable=False),
sa.Column("deleted", sa.Boolean(), nullable=False),
sa.ForeignKeyConstraint(
["user_id"],
["user.id"],
),
sa.PrimaryKeyConstraint("id"),
)
op.create_table(
"persona__prompt",
sa.Column("persona_id", sa.Integer(), nullable=False),
sa.Column("prompt_id", sa.Integer(), nullable=False),
sa.ForeignKeyConstraint(
["persona_id"],
["persona.id"],
),
sa.ForeignKeyConstraint(
["prompt_id"],
["prompt.id"],
),
sa.PrimaryKeyConstraint("persona_id", "prompt_id"),
)
# Changes to persona first so chat_sessions can have the right persona
# The empty persona will be overwritten on server startup
op.add_column(
"persona",
sa.Column(
"user_id",
fastapi_users_db_sqlalchemy.generics.GUID(),
nullable=True,
),
)
op.add_column(
"persona",
sa.Column(
"search_type",
searchtype_enum,
nullable=True,
),
)
op.execute("UPDATE persona SET search_type = 'HYBRID'")
op.alter_column("persona", "search_type", nullable=False)
op.add_column(
"persona",
sa.Column("llm_relevance_filter", sa.Boolean(), nullable=True),
)
op.execute("UPDATE persona SET llm_relevance_filter = TRUE")
op.alter_column("persona", "llm_relevance_filter", nullable=False)
op.add_column(
"persona",
sa.Column("llm_filter_extraction", sa.Boolean(), nullable=True),
)
op.execute("UPDATE persona SET llm_filter_extraction = TRUE")
op.alter_column("persona", "llm_filter_extraction", nullable=False)
op.add_column(
"persona",
sa.Column(
"recency_bias",
recencybiassetting_enum,
nullable=True,
),
)
op.execute("UPDATE persona SET recency_bias = 'BASE_DECAY'")
op.alter_column("persona", "recency_bias", nullable=False)
op.alter_column("persona", "description", existing_type=sa.VARCHAR(), nullable=True)
op.execute("UPDATE persona SET description = ''")
op.alter_column("persona", "description", nullable=False)
op.create_foreign_key("persona__user_fk", "persona", "user", ["user_id"], ["id"])
op.drop_column("persona", "datetime_aware")
op.drop_column("persona", "tools")
op.drop_column("persona", "hint_text")
op.drop_column("persona", "apply_llm_relevance_filter")
op.drop_column("persona", "retrieval_enabled")
op.drop_column("persona", "system_text")
# Need to create a persona row so fk can work
result = bind.execute(sa.text("SELECT 1 FROM persona WHERE id = 0"))
exists = result.fetchone()
if not exists:
op.execute(
sa.text(
"""
INSERT INTO persona (
id, user_id, name, description, search_type, num_chunks,
llm_relevance_filter, llm_filter_extraction, recency_bias,
llm_model_version_override, default_persona, deleted
) VALUES (
0, NULL, '', '', 'HYBRID', NULL,
TRUE, TRUE, 'BASE_DECAY', NULL, TRUE, FALSE
)
"""
)
)
delete_statement = sa.text(
"""
DELETE FROM persona
WHERE name = 'Danswer' AND default_persona = TRUE AND id != 0
"""
)
bind.execute(delete_statement)
op.add_column(
"chat_feedback",
sa.Column("chat_message_id", sa.Integer(), nullable=False),
)
op.drop_constraint(
"chat_feedback_chat_message_chat_session_id_chat_message_me_fkey",
"chat_feedback",
type_="foreignkey",
)
op.drop_column("chat_feedback", "chat_message_edit_number")
op.drop_column("chat_feedback", "chat_message_chat_session_id")
op.drop_column("chat_feedback", "chat_message_message_number")
op.add_column(
"chat_message",
sa.Column(
"id",
sa.Integer(),
primary_key=True,
autoincrement=True,
nullable=False,
unique=True,
),
)
op.add_column(
"chat_message",
sa.Column("parent_message", sa.Integer(), nullable=True),
)
op.add_column(
"chat_message",
sa.Column("latest_child_message", sa.Integer(), nullable=True),
)
op.add_column(
"chat_message", sa.Column("rephrased_query", sa.Text(), nullable=True)
)
op.add_column("chat_message", sa.Column("prompt_id", sa.Integer(), nullable=True))
op.add_column(
"chat_message",
sa.Column("citations", postgresql.JSONB(astext_type=sa.Text()), nullable=True),
)
op.add_column("chat_message", sa.Column("error", sa.Text(), nullable=True))
op.drop_constraint("fk_chat_message_persona_id", "chat_message", type_="foreignkey")
op.create_foreign_key(
"chat_message__prompt_fk", "chat_message", "prompt", ["prompt_id"], ["id"]
)
op.drop_column("chat_message", "parent_edit_number")
op.drop_column("chat_message", "persona_id")
op.drop_column("chat_message", "reference_docs")
op.drop_column("chat_message", "edit_number")
op.drop_column("chat_message", "latest")
op.drop_column("chat_message", "message_number")
op.add_column("chat_session", sa.Column("one_shot", sa.Boolean(), nullable=True))
op.execute("UPDATE chat_session SET one_shot = TRUE")
op.alter_column("chat_session", "one_shot", nullable=False)
op.alter_column(
"chat_session",
"persona_id",
existing_type=sa.INTEGER(),
nullable=True,
)
op.execute("UPDATE chat_session SET persona_id = 0")
op.alter_column("chat_session", "persona_id", nullable=False)
op.add_column(
"document_retrieval_feedback",
sa.Column("chat_message_id", sa.Integer(), nullable=False),
)
op.drop_constraint(
"document_retrieval_feedback_qa_event_id_fkey",
"document_retrieval_feedback",
type_="foreignkey",
)
op.create_foreign_key(
"document_retrieval_feedback__chat_message_fk",
"document_retrieval_feedback",
"chat_message",
["chat_message_id"],
["id"],
)
op.drop_column("document_retrieval_feedback", "qa_event_id")
# Relation table must be created after the other tables are correct
op.create_table(
"chat_message__search_doc",
sa.Column("chat_message_id", sa.Integer(), nullable=False),
sa.Column("search_doc_id", sa.Integer(), nullable=False),
sa.ForeignKeyConstraint(
["chat_message_id"],
["chat_message.id"],
),
sa.ForeignKeyConstraint(
["search_doc_id"],
["search_doc.id"],
),
sa.PrimaryKeyConstraint("chat_message_id", "search_doc_id"),
)
# Needs to be created after chat_message id field is added
op.create_foreign_key(
"chat_feedback__chat_message_fk",
"chat_feedback",
"chat_message",
["chat_message_id"],
["id"],
)
op.drop_table("query_event")
def downgrade() -> None:
op.drop_constraint(
"chat_feedback__chat_message_fk", "chat_feedback", type_="foreignkey"
)
op.drop_constraint(
"document_retrieval_feedback__chat_message_fk",
"document_retrieval_feedback",
type_="foreignkey",
)
op.drop_constraint("persona__user_fk", "persona", type_="foreignkey")
op.drop_constraint("chat_message__prompt_fk", "chat_message", type_="foreignkey")
op.drop_constraint(
"chat_message__search_doc_chat_message_id_fkey",
"chat_message__search_doc",
type_="foreignkey",
)
op.add_column(
"persona",
sa.Column("system_text", sa.TEXT(), autoincrement=False, nullable=True),
)
op.add_column(
"persona",
sa.Column(
"retrieval_enabled",
sa.BOOLEAN(),
autoincrement=False,
nullable=True,
),
)
op.execute("UPDATE persona SET retrieval_enabled = TRUE")
op.alter_column("persona", "retrieval_enabled", nullable=False)
op.add_column(
"persona",
sa.Column(
"apply_llm_relevance_filter",
sa.BOOLEAN(),
autoincrement=False,
nullable=True,
),
)
op.add_column(
"persona",
sa.Column("hint_text", sa.TEXT(), autoincrement=False, nullable=True),
)
op.add_column(
"persona",
sa.Column(
"tools",
postgresql.JSONB(astext_type=sa.Text()),
autoincrement=False,
nullable=True,
),
)
op.add_column(
"persona",
sa.Column("datetime_aware", sa.BOOLEAN(), autoincrement=False, nullable=True),
)
op.execute("UPDATE persona SET datetime_aware = TRUE")
op.alter_column("persona", "datetime_aware", nullable=False)
op.alter_column("persona", "description", existing_type=sa.VARCHAR(), nullable=True)
op.drop_column("persona", "recency_bias")
op.drop_column("persona", "llm_filter_extraction")
op.drop_column("persona", "llm_relevance_filter")
op.drop_column("persona", "search_type")
op.drop_column("persona", "user_id")
op.add_column(
"document_retrieval_feedback",
sa.Column("qa_event_id", sa.INTEGER(), autoincrement=False, nullable=False),
)
op.drop_column("document_retrieval_feedback", "chat_message_id")
op.alter_column(
"chat_session", "persona_id", existing_type=sa.INTEGER(), nullable=True
)
op.drop_column("chat_session", "one_shot")
op.add_column(
"chat_message",
sa.Column(
"message_number",
sa.INTEGER(),
autoincrement=False,
nullable=False,
primary_key=True,
),
)
op.add_column(
"chat_message",
sa.Column("latest", sa.BOOLEAN(), autoincrement=False, nullable=False),
)
op.add_column(
"chat_message",
sa.Column(
"edit_number",
sa.INTEGER(),
autoincrement=False,
nullable=False,
primary_key=True,
),
)
op.add_column(
"chat_message",
sa.Column(
"reference_docs",
postgresql.JSONB(astext_type=sa.Text()),
autoincrement=False,
nullable=True,
),
)
op.add_column(
"chat_message",
sa.Column("persona_id", sa.INTEGER(), autoincrement=False, nullable=True),
)
op.add_column(
"chat_message",
sa.Column(
"parent_edit_number",
sa.INTEGER(),
autoincrement=False,
nullable=True,
),
)
op.create_foreign_key(
"fk_chat_message_persona_id",
"chat_message",
"persona",
["persona_id"],
["id"],
)
op.drop_column("chat_message", "error")
op.drop_column("chat_message", "citations")
op.drop_column("chat_message", "prompt_id")
op.drop_column("chat_message", "rephrased_query")
op.drop_column("chat_message", "latest_child_message")
op.drop_column("chat_message", "parent_message")
op.drop_column("chat_message", "id")
op.add_column(
"chat_feedback",
sa.Column(
"chat_message_message_number",
sa.INTEGER(),
autoincrement=False,
nullable=False,
),
)
op.add_column(
"chat_feedback",
sa.Column(
"chat_message_chat_session_id",
sa.INTEGER(),
autoincrement=False,
nullable=False,
primary_key=True,
),
)
op.add_column(
"chat_feedback",
sa.Column(
"chat_message_edit_number",
sa.INTEGER(),
autoincrement=False,
nullable=False,
),
)
op.drop_column("chat_feedback", "chat_message_id")
op.create_table(
"query_event",
sa.Column("id", sa.INTEGER(), autoincrement=True, nullable=False),
sa.Column("query", sa.VARCHAR(), autoincrement=False, nullable=False),
sa.Column(
"selected_search_flow",
sa.VARCHAR(),
autoincrement=False,
nullable=True,
),
sa.Column("llm_answer", sa.VARCHAR(), autoincrement=False, nullable=True),
sa.Column("feedback", sa.VARCHAR(), autoincrement=False, nullable=True),
sa.Column("user_id", sa.UUID(), autoincrement=False, nullable=True),
sa.Column(
"time_created",
postgresql.TIMESTAMP(timezone=True),
server_default=sa.text("now()"),
autoincrement=False,
nullable=False,
),
sa.Column(
"retrieved_document_ids",
postgresql.ARRAY(sa.VARCHAR()),
autoincrement=False,
nullable=True,
),
sa.Column("chat_session_id", sa.INTEGER(), autoincrement=False, nullable=True),
sa.ForeignKeyConstraint(
["chat_session_id"],
["chat_session.id"],
name="fk_query_event_chat_session_id",
),
sa.ForeignKeyConstraint(
["user_id"], ["user.id"], name="query_event_user_id_fkey"
),
sa.PrimaryKeyConstraint("id", name="query_event_pkey"),
)
op.drop_table("chat_message__search_doc")
op.drop_table("persona__prompt")
op.drop_table("prompt")
op.drop_table("search_doc")
op.create_unique_constraint(
"uq_chat_message_combination",
"chat_message",
["chat_session_id", "message_number", "edit_number"],
)
op.create_foreign_key(
"chat_feedback_chat_message_chat_session_id_chat_message_me_fkey",
"chat_feedback",
"chat_message",
[
"chat_message_chat_session_id",
"chat_message_message_number",
"chat_message_edit_number",
],
["chat_session_id", "message_number", "edit_number"],
)
op.create_foreign_key(
"document_retrieval_feedback_qa_event_id_fkey",
"document_retrieval_feedback",
"query_event",
["qa_event_id"],
["id"],
)
op.execute("DROP TYPE IF EXISTS searchtype")
op.execute("DROP TYPE IF EXISTS recencybiassetting")
op.execute("DROP TYPE IF EXISTS documentsource")

@@ -1,28 +0,0 @@
"""fix-file-type-migration
Revision ID: b85f02ec1308
Revises: a3bfd0d64902
Create Date: 2024-05-31 18:09:26.658164
"""
from alembic import op
# revision identifiers, used by Alembic.
revision = "b85f02ec1308"
down_revision = "a3bfd0d64902"
branch_labels: None = None
depends_on: None = None
def upgrade() -> None:
op.execute(
"""
UPDATE file_store
SET file_origin = UPPER(file_origin)
"""
)
def downgrade() -> None:
# Let's not break anything on purpose :)
pass

@@ -1,23 +0,0 @@
"""backfill is_internet data to False
Revision ID: b896bbd0d5a7
Revises: 44f856ae2a4a
Create Date: 2024-07-16 15:21:05.718571
"""
from alembic import op
# revision identifiers, used by Alembic.
revision = "b896bbd0d5a7"
down_revision = "44f856ae2a4a"
branch_labels: None = None
depends_on: None = None
def upgrade() -> None:
op.execute("UPDATE search_doc SET is_internet = FALSE WHERE is_internet IS NULL")
def downgrade() -> None:
pass

@@ -1,26 +0,0 @@
"""Add llm_model_version_override to Persona
Revision ID: baf71f781b9e
Revises: 50b683a8295c
Create Date: 2023-12-06 21:56:50.286158
"""
from alembic import op
import sqlalchemy as sa
# revision identifiers, used by Alembic.
revision = "baf71f781b9e"
down_revision = "50b683a8295c"
branch_labels: None = None
depends_on: None = None
def upgrade() -> None:
op.add_column(
"persona",
sa.Column("llm_model_version_override", sa.String(), nullable=True),
)
def downgrade() -> None:
op.drop_column("persona", "llm_model_version_override")

Some files were not shown because too many files have changed in this diff.