Release Khoj version 1.11.1

Support customization of the OpenAI base URL in admin settings (#725)
- Allow self-hosted users to customize their OpenAI base URL. This allows you to easily use a proxy service and extend support for other models.
- This also includes a migration that associates any existing OpenAI chat model configuration with an OpenAI processor configuration
- Make changing model a paid/subscriber feature
- Removes usage of langchain's OpenAI wrapper for better control over parsing input/output
2026-05-13 21:41:41 +00:00 · 2024-04-27 18:42:24 +05:30 · 2024-04-27 18:24:35 +05:30 · 2024-04-27 17:07:21 +05:30 · 2024-04-27 09:56:58 +05:30 · 2024-04-26 11:55:22 +05:30
461 changed files with 76153 additions and 7246 deletions
--- a/.dockerignore
+++ b/.dockerignore
@@ -6,4 +6,5 @@ docs/
 tests/
 build/
 dist/
+scripts/
 *.egg-info/
--- a/.gitattributes
+++ b/.gitattributes
@@ -0,0 +1,2 @@
+# Exclude test data files from programming language stats on GitHub
+tests/data/** linguist-vendored
--- a/.github/ISSUE_TEMPLATE/bug-report.md
+++ b/.github/ISSUE_TEMPLATE/bug-report.md
@@ -0,0 +1,42 @@
+---
+name: Bug Report
+about: Create a bug to help fix something that might not be working correctly
+title: "[FIX]"
+labels: fix
+assignees: ''
+
+---
+
+## Describe the bug
+A clear and concise description of what the bug is. Please include what you were expecting to happen vs. what actually happened.
+
+## To Reproduce
+Steps to reproduce the behavior:
+
+## Screenshots
+If applicable, add screenshots to help explain your problem.
+
+## Platform
+- Server:
+    - [ ] Cloud-Hosted (https://app.khoj.dev)
+    - [ ] Self-Hosted Docker
+    - [ ] Self-Hosted Python package
+    - [ ] Self-Hosted source code
+- Client:
+    - [ ] Obsidian
+    - [ ] Emacs
+    - [ ] Desktop app
+    - [ ] Web browser
+    - [ ] WhatsApp
+- OS:
+    - [ ] Windows
+    - [ ] macOS
+    - [ ] Linux
+    - [ ] Android
+    - [ ] iOS
+
+### If self-hosted
+- Server Version [e.g. 1.0.1]:
+
+## Additional context
+Add any other context about the problem here.
--- a/.github/ISSUE_TEMPLATE/feature-request.md
+++ b/.github/ISSUE_TEMPLATE/feature-request.md
@@ -0,0 +1,11 @@
+---
+name: Feature Request
+about: Suggest an idea to help make Khoj a better tool
+title: "[IDEA]"
+labels: "upgrade"
+assignees: ''
+
+---
+
+## Describe the feature you'd like
+A clear and concise description of what you want to happen. Include any relevant links or screenshots or inspiration.
--- a/.github/workflows/build.yml
+++ b/.github/workflows/build.yml
@@ -1,45 +0,0 @@
-name: build
-
-on:
-  push:
-    branches:
-      - master
-    paths:
-      - src/**
-      - config/**
-      - setup.py
-      - Dockerfile
-      - docker-compose.yml
-      - .github/workflows/build.yml
-  workflow_dispatch:
-
-env:
-  DOCKER_IMAGE_TAG: ${{ github.ref == 'refs/heads/master' && 'latest' || github.ref_name }}
-
-jobs:
-  build:
-    name: Build Docker Image, Push to Container Registry
-    runs-on: ubuntu-latest
-    steps:
-      - name: Checkout Code
-        uses: actions/checkout@v2
-
-      - name: Set up Docker Buildx
-        uses: docker/setup-buildx-action@v1
-
-      - name: Login to GitHub Container Registry
-        uses: docker/login-action@v1
-        with:
-          registry: ghcr.io
-          username: ${{ github.repository_owner }}
-          password: ${{ secrets.PAT }}
-
-      - name: Build and Push Docker Image
-        uses: docker/build-push-action@v2
-        with:
-          context: .
-          file: Dockerfile
-          push: true
-          tags: ghcr.io/${{ github.repository }}:${{ env.DOCKER_IMAGE_TAG }}
-          build-args: |
-            PORT=8000
--- a/.github/workflows/build_khoj_el.yml
+++ b/.github/workflows/build_khoj_el.yml
@@ -0,0 +1,39 @@
+# melpa quality checks like checkdoc, byte-compile, package-lint for khoj.el
+# using melpazoid: https://github.com/riscy/melpazoid
+
+name: build khoj.el
+on:
+  push:
+    branches:
+      - 'master'
+    paths:
+      - src/interface/emacs/*.el
+      - .github/workflows/build_khoj_el.yml
+  pull_request:
+    branches:
+      - 'master'
+    paths:
+      - src/interface/emacs/*.el
+      - .github/workflows/build_khoj_el.yml
+
+jobs:
+  build:
+    runs-on: ubuntu-latest
+    steps:
+    - uses: actions/checkout@v2
+    - name: Set up Python 3.11
+      uses: actions/setup-python@v1
+      with: { python-version: 3.11 }
+    - name: ⏬️ Install Dependencies
+      run: |
+        python -m pip install --upgrade pip
+        sudo apt-get install emacs && emacs --version
+        git clone https://github.com/riscy/melpazoid.git ~/melpazoid
+        pip install ~/melpazoid
+    - name: 🌡️ Validate Khoj.el
+      env:
+        # Khoj recipe from https://github.com/melpa/melpa/pull/8321/files
+        RECIPE: (khoj :fetcher github :repo "khoj-ai/khoj" :files ("src/interface/emacs/*.el"))
+        EXIST_OK: true
+        LOCAL_REPO: ${{ github.workspace }}
+      run: echo $GITHUB_REF && make -C ~/melpazoid
--- a/.github/workflows/desktop.yml
+++ b/.github/workflows/desktop.yml
@@ -0,0 +1,99 @@
+name: desktop
+
+on:
+  push:
+    tags:
+      - "*"
+    branches:
+      - 'master'
+    paths:
+      - src/interface/desktop/**
+      - .github/workflows/desktop.yml
+
+jobs:
+  build:
+    name: 🖥️ Build, Release Desktop App
+    runs-on: ubuntu-latest
+    env:
+      TODESKTOP_ACCESS_TOKEN: ${{ secrets.TODESKTOP_ACCESS_TOKEN }}
+      TODESKTOP_EMAIL: ${{ secrets.TODESKTOP_EMAIL }}
+    defaults:
+      run:
+        shell: bash
+        working-directory: src/interface/desktop
+    steps:
+      - name: ⬇️ Checkout Code
+        uses: actions/checkout@v3
+        with:
+          fetch-depth: 0
+
+      - name: ⤵️ Install Node
+        uses: actions/setup-node@v3
+        with:
+          node-version: "lts/*"
+
+      - name: ⚙️ Setup Desktop Build
+        run: |
+          yarn
+          npm install -g @todesktop/cli
+          sed -i "s/\"id\": \"\"/\"id\": \"${{ secrets.TODESKTOP_ID }}\"/g" todesktop.json
+
+      - name: ⚙️ Build Desktop App
+        run: |
+          npx todesktop build
+
+      - name: 📦 Release Desktop App
+        if: startsWith(github.ref, 'refs/tags/')
+        run: |
+          npx todesktop release --latest --force
+
+      - name: ⤵️ Get Desktop Apps
+        if: startsWith(github.ref, 'refs/tags/')
+        run: |
+          build_no=`npx todesktop builds --latest | tail -n 1 | awk -F'/' '{print $NF}'`
+          sleep 900  # wait for 15 minutes for the build to be available
+          wget https://download.khoj.dev/builds/$build_no/mac/dmg/arm64 -O khoj-${{ github.ref_name }}-arm64.dmg
+          wget https://download.khoj.dev/builds/$build_no/mac/dmg/x64 -O khoj-${{ github.ref_name }}-x64.dmg
+          wget https://download.khoj.dev/builds/$build_no/windows/nsis/x64 -O khoj-${{ github.ref_name }}-x64.exe
+          wget https://download.khoj.dev/builds/$build_no/linux/deb/x64 -O khoj-${{ github.ref_name }}-x64.deb
+          wget https://download.khoj.dev/builds/$build_no/linux/appImage/x64 -O khoj-${{ github.ref_name }}-x64.AppImage
+
+      - name: ⏫ Upload Mac ARM App
+        if: startsWith(github.ref, 'refs/tags/')
+        uses: actions/upload-artifact@v3
+        with:
+          if-no-files-found: warn
+          name: khoj-${{ github.ref_name }}-arm64.dmg
+          path: src/interface/desktop/khoj-${{ github.ref_name }}-arm64.dmg
+
+      - name: ⏫ Upload Mac x64 App
+        if: startsWith(github.ref, 'refs/tags/')
+        uses: actions/upload-artifact@v3
+        with:
+          if-no-files-found: warn
+          name: khoj-${{ github.ref_name }}-x64.dmg
+          path: src/interface/desktop/khoj-${{ github.ref_name }}-x64.dmg
+
+      - name: ⏫ Upload Windows App
+        if: startsWith(github.ref, 'refs/tags/')
+        uses: actions/upload-artifact@v3
+        with:
+          if-no-files-found: warn
+          name: khoj-${{ github.ref_name }}-x64.exe
+          path: src/interface/desktop/khoj-${{ github.ref_name }}-x64.exe
+
+      - name: ⏫ Upload Debian App
+        if: startsWith(github.ref, 'refs/tags/')
+        uses: actions/upload-artifact@v3
+        with:
+          if-no-files-found: warn
+          name: khoj-${{ github.ref_name }}-x64.deb
+          path: src/interface/desktop/khoj-${{ github.ref_name }}-x64.deb
+
+      - name: ⏫ Upload Linux App Image
+        if: startsWith(github.ref, 'refs/tags/')
+        uses: actions/upload-artifact@v3
+        with:
+          if-no-files-found: warn
+          name: khoj-${{ github.ref_name }}-x64.AppImage
+          path: src/interface/desktop/khoj-${{ github.ref_name }}-x64.AppImage
--- a/.github/workflows/dockerize.yml
+++ b/.github/workflows/dockerize.yml
@@ -0,0 +1,98 @@
+name: dockerize
+
+on:
+  push:
+    tags:
+      - "*"
+    branches:
+      - master
+    paths:
+      - src/khoj/**
+      - pyproject.toml
+      - Dockerfile
+      - prod.Dockerfile
+      - docker-compose.yml
+      - .github/workflows/dockerize.yml
+  workflow_dispatch:
+    inputs:
+      tag:
+        description: 'Docker image tag'
+        default: 'dev'
+      khoj:
+        description: 'Build Khoj docker image'
+        type: boolean
+        default: true
+      khoj-cloud:
+        description: 'Build Khoj cloud docker image'
+        type: boolean
+        default: true
+
+env:
+  # Tag Image with tag name on release
+  # else with user specified tag (default 'dev') if triggered via workflow
+  # else with 'pre' (if push to master)
+  DOCKER_IMAGE_TAG: ${{ github.ref_type == 'tag' && github.ref_name || github.event_name == 'workflow_dispatch' && github.event.inputs.tag || 'pre' }}
+
+jobs:
+  build:
+    name: Publish Khoj Docker Images
+    runs-on: ubuntu-latest
+    strategy:
+      fail-fast: false
+      matrix:
+        image:
+          - 'local'
+          - 'cloud'
+    steps:
+      - name: Checkout Code
+        uses: actions/checkout@v3
+        with:
+          # Get all history to correctly infer Khoj version using hatch
+          fetch-depth: 0
+
+      - name: Set up Docker Buildx
+        uses: docker/setup-buildx-action@v2
+
+      - name: Login to GitHub Container Registry
+        uses: docker/login-action@v2
+        with:
+          registry: ghcr.io
+          username: ${{ github.repository_owner }}
+          password: ${{ secrets.PAT }}
+
+      - name: Get App Version
+        id: hatch
+        run: echo "version=$(pipx run hatch version)" >> $GITHUB_OUTPUT
+
+      - name: 🧹 Delete huge unnecessary tools folder
+        run: rm -rf /opt/hostedtoolcache
+
+      - name: 📦 Build and Push Docker Image
+        uses: docker/build-push-action@v2
+        if: (matrix.image == 'local' && github.event_name == 'workflow_dispatch') && github.event.inputs.khoj == 'true' || (matrix.image == 'local' && github.event_name == 'push')
+        with:
+          context: .
+          file: Dockerfile
+          platforms: linux/amd64, linux/arm64
+          push: true
+          tags: |
+            ghcr.io/${{ github.repository }}:${{ env.DOCKER_IMAGE_TAG }}
+            ${{ github.ref_type == 'tag' && format('ghcr.io/{0}:latest', github.repository) || '' }}
+          build-args: |
+            VERSION=${{ steps.hatch.outputs.version }}
+            PORT=42110
+
+      - name: 📦️⛅️ Build and Push Cloud Docker Image
+        uses: docker/build-push-action@v2
+        if: (matrix.image == 'cloud' && github.event_name == 'workflow_dispatch') && github.event.inputs.khoj-cloud == 'true' || (matrix.image == 'cloud' && github.event_name == 'push')
+        with:
+          context: .
+          file: prod.Dockerfile
+          platforms: linux/amd64
+          push: true
+          tags: |
+            ghcr.io/${{ github.repository }}-cloud:${{ env.DOCKER_IMAGE_TAG }}
+            ${{ github.ref_type == 'tag' && format('ghcr.io/{0}-cloud:latest', github.repository) || '' }}
+          build-args: |
+            VERSION=${{ steps.hatch.outputs.version }}
+            PORT=42110
--- a/.github/workflows/dockerize_telemetry_server.yml
+++ b/.github/workflows/dockerize_telemetry_server.yml
@@ -0,0 +1,47 @@
+name: dockerize telemetry server
+
+on:
+  push:
+    branches:
+      - master
+    paths:
+      - src/telemetry/**
+      - .github/workflows/dockerize_telemetry_server.yml
+  pull_request:
+    branches:
+      - master
+    paths:
+      - src/telemetry/**
+      - .github/workflows/dockerize_telemetry_server.yml
+  workflow_dispatch:
+
+env:
+  DOCKER_IMAGE_TAG: ${{ github.ref == 'refs/heads/master' && 'latest' || github.event.pull_request.number || github.sha }}  # master: latest, PR: PR number, otherwise commit SHA so the tag is never empty
+
+jobs:
+  build:
+    name: Build Docker Image, Push to Container Registry
+    runs-on: ubuntu-latest
+    steps:
+      - name: Checkout Code
+        uses: actions/checkout@v3
+
+      - name: Set up Docker Buildx
+        uses: docker/setup-buildx-action@v2
+
+      - name: Login to GitHub Container Registry
+        uses: docker/login-action@v2
+        with:
+          registry: ghcr.io
+          username: ${{ github.repository_owner }}
+          password: ${{ secrets.PAT }}
+
+      - name: 📦 Build and Push Docker Image
+        uses: docker/build-push-action@v2
+        with:
+          context: src/telemetry
+          file: src/telemetry/Dockerfile
+          push: true
+          tags: ghcr.io/${{ github.repository }}-telemetry:${{ env.DOCKER_IMAGE_TAG }}
+          secrets: |
+            "POSTHOG_API_KEY=${{ secrets.POSTHOG_API_KEY }}"
--- a/.github/workflows/github_pages_deploy.yml
+++ b/.github/workflows/github_pages_deploy.yml
@@ -0,0 +1,46 @@
+name: build and deploy github pages for documentation
+on:
+  push:
+    branches:
+      - 'master'
+
+permissions:
+  contents: read
+  pages: write
+  id-token: write
+
+jobs:
+    deploy:
+      environment:
+        name: github-pages
+        url: https://docs.khoj.dev
+      runs-on: ubuntu-latest
+      steps:
+        - name: Checkout
+          uses: actions/checkout@v3
+        # 👇 Build steps
+        - name: Set up Node.js
+          uses: actions/setup-node@v3
+          with:
+            node-version: 18.x
+            cache: yarn
+            cache-dependency-path: documentation/yarn.lock
+        - name: Install dependencies
+          run: |
+            cd documentation
+            yarn install --frozen-lockfile --non-interactive
+        - name: Build
+          run: |
+            cd documentation
+            yarn build
+        # 👆 Build steps
+        - name: Setup Pages
+          uses: actions/configure-pages@v3
+        - name: Upload artifact
+          uses: actions/upload-pages-artifact@v2
+          with:
+            # 👇 Specify build output path
+            path: documentation/build
+        - name: Deploy to GitHub Pages
+          id: deployment
+          uses: actions/deploy-pages@v2
--- a/.github/workflows/pre-commit.yml
+++ b/.github/workflows/pre-commit.yml
@@ -0,0 +1,48 @@
+name: pre-commit
+
+on:
+  pull_request:
+    paths:
+      - src/**
+      - tests/**
+      - config/**
+      - pyproject.toml
+      - .pre-commit-config.yaml  # hook config file in this repo uses the .yaml extension
+      - .github/workflows/pre-commit.yml  # re-run when this workflow itself changes
+  push:
+    branches:
+      - master
+    paths:
+      - src/khoj/**
+      - tests/**
+      - config/**
+      - pyproject.toml
+      - .pre-commit-config.yaml  # hook config file in this repo uses the .yaml extension
+      - .github/workflows/pre-commit.yml  # re-run when this workflow itself changes
+
+jobs:
+  test:
+    name: Run Tests
+    runs-on: ubuntu-latest
+    strategy:
+      fail-fast: false
+    steps:
+      - uses: actions/checkout@v3
+        with:
+          fetch-depth: 0
+
+      - name: Set up Python 3.11
+        uses: actions/setup-python@v4
+        with:
+          python-version: 3.11
+
+      - name: ⏬️ Install Dependencies
+        run: |
+          sudo apt update && sudo apt install -y libegl1
+          python -m pip install --upgrade pip
+
+      - name: ⬇️ Install Application
+        run: pip install --upgrade .[dev]
+
+      - name: 🌡️ Validate Application
+        run: pre-commit run --hook-stage manual --all
--- a/.github/workflows/publish.yml
+++ b/.github/workflows/publish.yml
@@ -1,95 +0,0 @@
-name: publish
-
-on:
-  push:
-    tags:
-      - "*"
-    branches:
-      - 'master'
-    paths:
-      - src/**
-      - setup.py
-      - .github/workflows/publish.yml
-  pull_request:
-    branches:
-      - 'master'
-    paths:
-      - src/**
-      - setup.py
-      - .github/workflows/publish.yml
-
-jobs:
-  publish:
-    name: Publish App to PyPI
-    runs-on: ubuntu-latest
-    steps:
-      - uses: actions/checkout@v3
-
-      - name: Set up Python 3.10
-        uses: actions/setup-python@v4
-        with:
-          python-version: '3.10'
-
-      - name: Install Dependencies
-        run: |
-          python -m pip install --upgrade pip
-          pip install build twine
-
-      - name: Install Application
-        run: |
-          pip install --upgrade .
-
-      - name: Publish Release to PyPI
-        if: startsWith(github.ref, 'refs/tags')
-        env:
-          TWINE_USERNAME: __token__
-          TWINE_PASSWORD: ${{ secrets.PYPI_API_KEY }}
-        run: |
-          # Setup Environment for Reproducible Builds
-          export PYTHONHASHSEED=42
-          export SOURCE_DATE_EPOCH=$(git log -1 --pretty=%ct)
-
-          # Build and Upload PyPi Package
-          rm -rf dist
-          python -m build
-          twine check dist/*
-          twine upload dist/*
-
-      - name: Publish Master to PyPI
-        if: github.ref == 'refs/heads/master'
-        env:
-          TWINE_USERNAME: __token__
-          TWINE_PASSWORD: ${{ secrets.PYPI_API_KEY }}
-        run: |
-          # Set Pre-Release Version
-          sed -E -i "s/version=(.*)',/version=\1a$(date +%s)',/g" setup.py
-
-          # Setup Environment for Reproducible Builds
-          export PYTHONHASHSEED=42
-          export SOURCE_DATE_EPOCH=$(git log -1 --pretty=%ct)
-
-          # Build and Upload PyPi Package
-          rm -rf dist
-          python -m build
-          twine check dist/*
-          twine upload dist/*
-
-      - name: Publish PR to Test PyPI
-        if: github.event_name == 'pull_request'
-        env:
-          TWINE_USERNAME: __token__
-          TWINE_PASSWORD: ${{ secrets.TEST_PYPI_API_KEY }}
-          PULL_REQUEST_NUMBER: ${{ github.event.number }}
-        run: |
-          # Set Development Release Version
-          sed -E -i "s/version=(.*)',/version=\1.dev$PULL_REQUEST_NUMBER$(date +%s)',/g" setup.py
-
-          # Setup Environment for Reproducible Builds
-          export PYTHONHASHSEED=42
-          export SOURCE_DATE_EPOCH=$(git log -1 --pretty=%ct)
-
-          # Build and Upload PyPi Package
-          rm -rf dist
-          python -m build
-          twine check dist/*
-          twine upload -r testpypi dist/*
--- a/.github/workflows/pypi.yml
+++ b/.github/workflows/pypi.yml
@@ -0,0 +1,64 @@
+name: pypi
+
+on:
+  push:
+    tags:
+      - "*"
+    branches:
+      - 'master'
+    paths:
+      - src/khoj/**
+      - pyproject.toml
+      - .github/workflows/pypi.yml
+  pull_request:
+    branches:
+      - 'master'
+    paths:
+      - src/khoj/**
+      - pyproject.toml
+      - .github/workflows/pypi.yml
+
+jobs:
+  publish:
+    name: Publish Python Package to PyPI
+    runs-on: ubuntu-latest
+    permissions:
+      id-token: write
+    steps:
+      - uses: actions/checkout@v3
+        with:
+          fetch-depth: 0
+
+      - name: Set up Python 3.11
+        uses: actions/setup-python@v4
+        with:
+          python-version: '3.11'
+
+      - name: ⬇️ Install Application
+        run: python -m pip install --upgrade pip && pip install --upgrade .
+
+      - name: ⚙️ Build Python Package
+        run: |
+          # Setup Environment for Reproducible Builds
+          export PYTHONHASHSEED=42
+          export SOURCE_DATE_EPOCH=$(git log -1 --pretty=%ct)
+          rm -rf dist
+
+          # Build PyPi Package
+          pipx run build
+
+      - name: 🌡️ Validate Python Package
+        run: |
+          # Validate PyPi Package
+          pipx run check-wheel-contents dist/*.whl --ignore W004
+          pipx run twine check dist/*
+
+      - name: ⏫ Upload Python Package Artifacts
+        uses: actions/upload-artifact@v3
+        with:
+          name: khoj-assistant
+          path: dist/*.whl
+
+      - name: 📦 Publish Python Package to PyPI
+        if: startsWith(github.ref, 'refs/tags') || github.ref == 'refs/heads/master'
+        uses: pypa/gh-action-pypi-publish@v1.8.14
--- a/.github/workflows/release.yml
+++ b/.github/workflows/release.yml
@@ -12,106 +12,55 @@ on:
        type: string

 jobs:
-  publish:
-    strategy:
-      matrix:
-        include:
-        - os: ubuntu-latest
-          extension: deb
-        - os: macos-latest
-          extension: dmg
-        - os: windows-latest
-          extension: exe
-    runs-on: ${{ matrix.os }}
+  publish_obsidian_plugin:
+    name: 💎 Publish Obsidian Plugin
+    runs-on: ubuntu-latest
+    permissions:
+      contents: write
+    defaults:
+      run:
+        shell: bash
+        working-directory: src/interface/obsidian
    steps:
      - uses: actions/checkout@v3

-      - name: Set up Python 3.9
-        uses: actions/setup-python@v4
+      - name: Install Node
+        uses: actions/setup-node@v3
        with:
-          python-version: '3.9'
+          node-version: "lts/*"

-      - name: Install Dependencies
-        shell: bash
+      - name: ⚙️ Build Obsidian Plugin
        run: |
-          if [ "$RUNNER_OS" == "Linux" ]; then
-            sudo apt install libegl1 libxcb-xinerama0 python3-tk -y
-          fi
-          python -m pip install --upgrade pip
-          pip install pyinstaller
+          yarn
+          yarn run build --if-present

-      - name: Install Khoj App
-        run: |
-          pip install --upgrade .
-
-      - name: Package Khoj App
-        shell: bash
-        run: |
-          # Setup Environment for Reproducible Builds
-          export PYTHONHASHSEED=42
-          export SOURCE_DATE_EPOCH=$(git log -1 --pretty=%ct)
-
-          pyinstaller --noconfirm Khoj.spec
-          if [ "$RUNNER_OS" == "Windows" ]; then
-            mv dist/Khoj.exe dist/khoj_"$GITHUB_REF_NAME"_amd64.exe
-          fi
-
-      - name: Create Mac App DMG
-        if: matrix.os == 'macos-latest'
-        run: |
-         # Install Mac DMG Creator
-          brew install create-dmg
-          # Copy app to separate dmg folder
-          mkdir -p dist/dmg && cp -r dist/Khoj.app dist/dmg
-          # Create disk image with the app
-          create-dmg \
-            --volname "Khoj" \
-            --volicon "src/interface/web/assets/icons/favicon.icns" \
-            --window-pos 200 120 \
-            --window-size 600 300 \
-            --icon-size 100 \
-            --icon "Khoj.app" 175 120 \
-            --hide-extension "Khoj.app" \
-            --app-drop-link 425 120 \
-            "dist/khoj_"$GITHUB_REF_NAME"_amd64.dmg" \
-            "dist/dmg/"
-
-      - uses: ruby/setup-ruby@v1
-        if: matrix.os == 'ubuntu-latest'
+      - name: ⏫ Upload Obsidian Plugin main.js
+        uses: actions/upload-artifact@v3
        with:
-          ruby-version: '3.0'
-      - name: Create Debian Package
-        if: matrix.os == 'ubuntu-latest'
-        shell: bash
-        env:
-          DEBIAN_PACKAGE_VERSION: ${{ inputs.version }}
-        run: |
-          # Install Debian Packager
-          gem install fpm
+          if-no-files-found: error
+          name: main.js
+          path: src/interface/obsidian/main.js

-          # Copy app files into expected output directory structure
-          mkdir -p package/opt package/usr/share/applications package/usr/share/icons/hicolor/128x128/apps
-          cp -r dist/Khoj package/opt/Khoj
-          cp src/interface/web/assets/icons/favicon-128x128.png package/usr/share/icons/hicolor/128x128/apps/Khoj.png
-          cp Khoj.desktop package/usr/share/applications
-
-          # Fix permissions to be usable by non-root users
-          find package/usr/share -type f -exec chmod 644 -- {} +
-          chmod 755 package/opt/Khoj
-
-          # Package the app
-          if [ -z "$DEBIAN_PACKAGE_VERSION" ]; then
-            DEBIAN_PACKAGE_VERSION=$(echo $GITHUB_REF_NAME | sed -E 's/v(.*)/\1/g')
-          fi
-          fpm -C package -s dir -t deb -n Khoj --version $DEBIAN_PACKAGE_VERSION -p dist/khoj_"$GITHUB_REF_NAME"_amd64.deb
-
-      - uses: actions/upload-artifact@v3
+      - name: ⏫ Upload Obsidian Plugin manifest.json
+        uses: actions/upload-artifact@v3
        with:
-          name: khoj_${{github.ref_name}}_amd64.${{matrix.extension}}
-          path: dist/khoj_${{github.ref_name}}_amd64.${{matrix.extension}}
+          if-no-files-found: error
+          name: manifest.json
+          path: src/interface/obsidian/manifest.json

-      - name: Release
+      - name: ⏫ Upload Obsidian Plugin styles.css
+        uses: actions/upload-artifact@v3
+        with:
+          if-no-files-found: error
+          name: styles.css
+          path: src/interface/obsidian/styles.css
+
+      - name: 🌈 Create Release
        uses: softprops/action-gh-release@v1
        if: startsWith(github.ref, 'refs/tags/')
        with:
-          files: dist/khoj_${{github.ref_name}}_amd64.${{matrix.extension}}
+          generate_release_notes: true
+          files: |
+            src/interface/obsidian/main.js
+            src/interface/obsidian/manifest.json
+            src/interface/obsidian/styles.css
--- a/.github/workflows/test.yml
+++ b/.github/workflows/test.yml
@@ -2,46 +2,89 @@ name: test

 on:
  pull_request:
-    branches:
-      - 'master'
    paths:
-      - src/**
+      - src/khoj/**
      - tests/**
      - config/**
-      - setup.py
+      - pyproject.toml
+      - .pre-commit-config.yaml  # hook config file in this repo uses the .yaml extension
      - .github/workflows/test.yml
  push:
    branches:
-      - 'master'
+      - master
    paths:
-      - src/**
+      - src/khoj/**
      - tests/**
      - config/**
-      - setup.py
+      - pyproject.toml
+      - .pre-commit-config.yaml  # hook config file in this repo uses the .yaml extension
      - .github/workflows/test.yml

 jobs:
  test:
    name: Run Tests
    runs-on: ubuntu-latest
+    container: ubuntu:jammy
+    strategy:
+      fail-fast: false
+      matrix:
+        python_version:
+          - '3.9'
+          - '3.10'
+          - '3.11'
+          - '3.12'
+
+    services:
+      postgres:
+        image: ankane/pgvector
+        env:
+          POSTGRES_PASSWORD: postgres
+          POSTGRES_USER: postgres
+        ports:
+          - 5432:5432
+        options: --health-cmd pg_isready --health-interval 10s --health-timeout 5s --health-retries 5
+
    steps:
      - uses: actions/checkout@v3
+        with:
+          fetch-depth: 0

-      - name: Set up Python 3.10
+      - name: Set up Python
        uses: actions/setup-python@v4
        with:
-          python-version: '3.10'
+          python-version: ${{ matrix.python_version }}

-      - name: Install Dependencies
+      - name: Install Git
        run: |
-          sudo apt install libegl1 -y
+          apt update && apt install -y git
+
+      - name: ⏬️ Install Dependencies
+        env:
+          DEBIAN_FRONTEND: noninteractive
+        run: |
+          apt update && apt install -y libegl1 sqlite3 libsqlite3-dev libsqlite3-0 ffmpeg libsm6 libxext6
+
+      - name: ⬇️ Install Postgres
+        env:
+          DEBIAN_FRONTEND: noninteractive  # keep apt from prompting during the unattended install
+        run: |
+          apt install -y postgresql postgresql-client && apt install -y postgresql-server-dev-14
+
+      - name: ⬇️ Install pip
+        run: |
+          apt install -y python3-pip
+          python -m ensurepip --upgrade
          python -m pip install --upgrade pip
-          pip install pytest

-      - name: Install Application
-        run: |
-          pip install --upgrade .
+      - name: ⬇️ Install Application
+        run: sed -i 's/dynamic = \["version"\]/version = "0.0.0"/' pyproject.toml && pip install --upgrade .[dev]

-      - name: Test Application
-        run: |
-          pytest 
+      - name: 🧪 Test Application
+        env:
+          POSTGRES_HOST: postgres
+          POSTGRES_PORT: 5432
+          POSTGRES_USER: postgres
+          POSTGRES_PASSWORD: postgres
+          POSTGRES_DB: postgres
+        run: pytest
+        timeout-minutes: 10
--- a/.github/workflows/test_khoj_el.yml
+++ b/.github/workflows/test_khoj_el.yml
@@ -0,0 +1,52 @@
+name: test khoj.el
+
+on:
+  push:
+    branches:
+      - 'master'
+    paths:
+      - src/interface/emacs/*.el
+      - src/interface/emacs/tests/*.el
+      - .github/workflows/test_khoj_el.yml
+  pull_request:
+    branches:
+      - 'master'
+    paths:
+      - src/interface/emacs/*.el
+      - src/interface/emacs/tests/*.el
+      - .github/workflows/test_khoj_el.yml
+
+jobs:
+  test:
+    runs-on: ubuntu-latest
+    strategy:
+      fail-fast: false
+      matrix:
+        emacs_version:
+          - 27.1
+          - 27.2
+          - 28.1
+          - 28.2
+          - snapshot
+    steps:
+      - uses: purcell/setup-emacs@master
+        with:
+          version: ${{ matrix.emacs_version }}
+      - uses: actions/checkout@v3
+      - name: 🧪 Test Khoj.el
+        run: |
+           # Run ERT tests on khoj.el
+           emacs -batch \
+           --eval "(progn \
+                    (require 'package) \
+                    (push '(\"melpa\" . \"https://melpa.org/packages/\") package-archives) \
+                    (package-initialize) \
+                    (unless package-archive-contents (package-refresh-contents)) \
+                    (unless (package-installed-p 'transient) (package-install 'transient)) \
+                    (unless (package-installed-p 'dash) (package-install 'dash)) \
+                    (unless (package-installed-p 'org) (package-install 'org)) \
+                   )" \
+           -l ert \
+           -l ./src/interface/emacs/khoj.el \
+           -l ./src/interface/emacs/tests/khoj-tests.el \
+           -f ert-run-tests-batch-and-exit
--- a/.gitignore
+++ b/.gitignore
@@ -1,7 +1,6 @@
 # Khoj artifacts
 *.gz
 *.pt
-src/.data
 tests/data/models
 tests/data/embeddings

@@ -11,15 +10,19 @@ __pycache__
 .emacs.desktop*
 *.py[cod]
 .vscode
+.env
+.venv/*
+todesktop.json

 # Build artifacts
-/src/interface/web/images
+/src/khoj/interface/web/images
 /build/
 /dist/
-/khoj_assistant.egg-info/
+khoj_assistant.egg-info
 /config/khoj*.yml
 .pytest_cache
-khoj.log
+*.log
+static

 # Obsidian plugin artifacts
 # ---
@@ -28,7 +31,7 @@ node_modules

 # Don't include the compiled obsidian main.js file in the repo.
 # They should be uploaded to GitHub releases instead.
-main.js
+src/interface/obsidian/main.js

 # Exclude sourcemaps
 *.map
--- a/.mypy.ini
+++ b/.mypy.ini
@@ -1,13 +0,0 @@
-[mypy]
-strict_optional = False
-ignore_missing_imports = True
-install_types = True
-non_interactive = True
-show_error_codes = True
-exclude = (?x)(
-    src/interface/desktop/main_window.py
-    | src/interface/desktop/file_browser.py
-    | src/interface/desktop/system_tray.py
-    | build/*
-    | tests/*
-  )
--- a/.pre-commit-config.yaml
+++ b/.pre-commit-config.yaml
@@ -0,0 +1,32 @@
+repos:
+- repo: https://github.com/psf/black
+  rev: 23.1.0
+  hooks:
+  - id: black
+
+- repo: https://github.com/pre-commit/pre-commit-hooks
+  rev: v4.4.0
+  hooks:
+  - id: end-of-file-fixer
+  - id: trailing-whitespace
+    # Exclude elisp files to not clear page breaks
+    exclude: \.el$
+  - id: check-json
+  - id: check-toml
+  - id: check-yaml
+
+- repo: https://github.com/pycqa/isort
+  rev: 5.12.0
+  hooks:
+  - id: isort
+    name: isort (python)
+    args: ["--profile", "black", "--filter-files"]
+
+- repo: https://github.com/pre-commit/mirrors-mypy
+  rev: v1.0.0
+  hooks:
+    - id: mypy
+      stages: [push, manual]
+      pass_filenames: false
+      args:
+      - --config-file=pyproject.toml
--- a/Dockerfile
+++ b/Dockerfile
@@ -1,22 +1,28 @@
 # syntax=docker/dockerfile:1
-FROM python:3.10-slim-bullseye
-LABEL org.opencontainers.image.source https://github.com/debanjum/khoj
+FROM ubuntu:jammy
+LABEL org.opencontainers.image.source https://github.com/khoj-ai/khoj

 # Install System Dependencies
-RUN apt-get update -y && \
-    apt-get -y install python3-pyqt5
+RUN apt update -y && apt -y install python3-pip swig

-# Copy Application to Container
-COPY . /app
 WORKDIR /app

-# Install Python Dependencies
-RUN pip install --upgrade pip && \
-    pip install --upgrade .
+# Install Application
+COPY pyproject.toml .
+COPY README.md .
+ARG VERSION=0.0.0
+RUN sed -i "s/dynamic = \\[\"version\"\\]/version = \"$VERSION\"/" pyproject.toml && \
+    pip install --no-cache-dir .
+
+# Copy Source Code
+COPY . .
+
+# Set the PYTHONPATH environment variable so that Python can find the Django app.
+ENV PYTHONPATH=/app/src:$PYTHONPATH

 # Run the Application
 # There are more arguments required for the application to run,
 # but these should be passed in through the docker-compose.yml file.
 ARG PORT
 EXPOSE ${PORT}
-ENTRYPOINT ["khoj"]
+ENTRYPOINT ["python3", "src/khoj/main.py"]
--- a/Khoj.desktop
+++ b/Khoj.desktop
@@ -1,7 +0,0 @@
-[Desktop Entry]
-Type=Application
-Name=Khoj
-Comment=A natural language search engine for your personal notes, transactions and images.
-Path=/opt
-Exec=/opt/Khoj
-Icon=Khoj
--- a/Khoj.spec
+++ b/Khoj.spec
@@ -1,115 +0,0 @@
-# -*- mode: python ; coding: utf-8 -*-
-from os.path import join
-from platform import system
-from PyInstaller.utils.hooks import copy_metadata
-import sysconfig
-
-datas = [
-    ('src/interface/web', 'src/interface/web'),
-    (f'{sysconfig.get_paths()["purelib"]}/transformers', 'transformers')
-]
-datas += copy_metadata('tqdm')
-datas += copy_metadata('regex')
-datas += copy_metadata('requests')
-datas += copy_metadata('packaging')
-datas += copy_metadata('filelock')
-datas += copy_metadata('numpy')
-datas += copy_metadata('tokenizers')
-
-block_cipher = None
-
-a = Analysis(
-    ['src/main.py'],
-    pathex=[],
-    binaries=[],
-    datas=datas,
-    hiddenimports=['huggingface_hub.repository'],
-    hookspath=[],
-    hooksconfig={},
-    runtime_hooks=[],
-    excludes=[],
-    win_no_prefer_redirects=False,
-    win_private_assemblies=False,
-    cipher=block_cipher,
-    noarchive=False,
-)
-
-# Filter out unused and/or duplicate shared libs
-torch_lib_paths = {
-    join('torch', 'lib', 'libtorch_cuda.so'),
-    join('torch', 'lib', 'libtorch_cpu.so'),
-}
-a.datas = [entry for entry in a.datas if not entry[0] in torch_lib_paths]
-
-os_path_separator = '\\' if system() == 'Windows' else '/'
-a.datas = [entry for entry in a.datas if not f'torch{os_path_separator}_C.cp' in entry[0]]
-a.datas = [entry for entry in a.datas if not f'torch{os_path_separator}_dl.cp' in entry[0]]
-
-pyz = PYZ(a.pure, a.zipped_data, cipher=block_cipher)
-
-if system() != 'Darwin':
-    # Add Splash screen to show on app launch
-    splash = Splash(
-        'src/interface/web/assets/icons/favicon-144x144.png',
-        binaries=a.binaries,
-        datas=a.datas,
-        text_pos=(10, 160),
-        text_size=12,
-        text_color='black',
-        minify_script=True,
-        always_on_top=True
-    )
-
-    exe = EXE(
-        pyz,
-        a.scripts,
-        a.binaries,
-        a.zipfiles,
-        a.datas,
-        splash,
-        splash.binaries,
-        [],
-        name='Khoj',
-        debug=False,
-        bootloader_ignore_signals=False,
-        strip=False,
-        upx=True,
-        upx_exclude=[],
-        runtime_tmpdir=None,
-        console=False,
-        disable_windowed_traceback=False,
-        argv_emulation=False,
-        target_arch='x86_64',
-        codesign_identity=None,
-        entitlements_file=None,
-        icon='src/interface/web/assets/icons/favicon-144x144.ico',
-    )
-else:
-    exe = EXE(
-        pyz,
-        a.scripts,
-        a.binaries,
-        a.zipfiles,
-        a.datas,
-        [],
-        name='Khoj',
-        debug=False,
-        bootloader_ignore_signals=False,
-        strip=False,
-        upx=True,
-        upx_exclude=[],
-        runtime_tmpdir=None,
-        console=False,
-        disable_windowed_traceback=False,
-        argv_emulation=False,
-        target_arch='x86_64',
-        codesign_identity=None,
-        entitlements_file=None,
-        icon='src/interface/web/assets/icons/favicon.icns',
-    )
-    app = BUNDLE(
-        exe,
-        name='Khoj.app',
-        icon='src/interface/web/assets/icons/favicon.icns',
-        bundle_identifier=None,
-    )
--- a/151
+++ b/151
@@ -1,23 +1,21 @@
-                    GNU GENERAL PUBLIC LICENSE
-                       Version 3, 29 June 2007
+                    GNU AFFERO GENERAL PUBLIC LICENSE
+                       Version 3, 19 November 2007

- Copyright (C) 2007 Free Software Foundation, Inc. <http://fsf.org/>
+ Copyright (C) 2007 Free Software Foundation, Inc. <https://fsf.org/>
 Everyone is permitted to copy and distribute verbatim copies
 of this license document, but changing it is not allowed.

                            Preamble

-  The GNU General Public License is a free, copyleft license for
-software and other kinds of works.
+  The GNU Affero General Public License is a free, copyleft license for
+software and other kinds of works, specifically designed to ensure
+cooperation with the community in the case of network server software.

  The licenses for most software and other practical works are designed
 to take away your freedom to share and change the works.  By contrast,
-the GNU General Public License is intended to guarantee your freedom to
+our General Public Licenses are intended to guarantee your freedom to
 share and change all versions of a program--to make sure it remains free
-software for all its users.  We, the Free Software Foundation, use the
-GNU General Public License for most of our software; it applies also to
-any other work released this way by its authors.  You can apply it to
-your programs, too.
+software for all its users.

  When we speak of free software, we are referring to freedom, not
 price.  Our General Public Licenses are designed to make sure that you
@@ -26,44 +24,34 @@ them if you wish), that you receive source code or can get it if you
 want it, that you can change the software or use pieces of it in new
 free programs, and that you know you can do these things.

-  To protect your rights, we need to prevent others from denying you
-these rights or asking you to surrender the rights.  Therefore, you have
-certain responsibilities if you distribute copies of the software, or if
-you modify it: responsibilities to respect the freedom of others.
+  Developers that use our General Public Licenses protect your rights
+with two steps: (1) assert copyright on the software, and (2) offer
+you this License which gives you legal permission to copy, distribute
+and/or modify the software.

-  For example, if you distribute copies of such a program, whether
-gratis or for a fee, you must pass on to the recipients the same
-freedoms that you received.  You must make sure that they, too, receive
-or can get the source code.  And you must show them these terms so they
-know their rights.
+  A secondary benefit of defending all users' freedom is that
+improvements made in alternate versions of the program, if they
+receive widespread use, become available for other developers to
+incorporate.  Many developers of free software are heartened and
+encouraged by the resulting cooperation.  However, in the case of
+software used on network servers, this result may fail to come about.
+The GNU General Public License permits making a modified version and
+letting the public access it on a server without ever releasing its
+source code to the public.

-  Developers that use the GNU GPL protect your rights with two steps:
-(1) assert copyright on the software, and (2) offer you this License
-giving you legal permission to copy, distribute and/or modify it.
+  The GNU Affero General Public License is designed specifically to
+ensure that, in such cases, the modified source code becomes available
+to the community.  It requires the operator of a network server to
+provide the source code of the modified version running there to the
+users of that server.  Therefore, public use of a modified version, on
+a publicly accessible server, gives the public access to the source
+code of the modified version.

-  For the developers' and authors' protection, the GPL clearly explains
-that there is no warranty for this free software.  For both users' and
-authors' sake, the GPL requires that modified versions be marked as
-changed, so that their problems will not be attributed erroneously to
-authors of previous versions.
-
-  Some devices are designed to deny users access to install or run
-modified versions of the software inside them, although the manufacturer
-can do so.  This is fundamentally incompatible with the aim of
-protecting users' freedom to change the software.  The systematic
-pattern of such abuse occurs in the area of products for individuals to
-use, which is precisely where it is most unacceptable.  Therefore, we
-have designed this version of the GPL to prohibit the practice for those
-products.  If such problems arise substantially in other domains, we
-stand ready to extend this provision to those domains in future versions
-of the GPL, as needed to protect the freedom of users.
-
-  Finally, every program is threatened constantly by software patents.
-States should not allow patents to restrict development and use of
-software on general-purpose computers, but in those that do, we wish to
-avoid the special danger that patents applied to a free program could
-make it effectively proprietary.  To prevent this, the GPL assures that
-patents cannot be used to render the program non-free.
+  An older license, called the Affero General Public License and
+published by Affero, was designed to accomplish similar goals.  This is
+a different license, not a version of the Affero GPL, but Affero has
+released a new version of the Affero GPL which permits relicensing under
+this license.

  The precise terms and conditions for copying, distribution and
 modification follow.
@@ -72,7 +60,7 @@ modification follow.

  0. Definitions.

-  "This License" refers to version 3 of the GNU General Public License.
+  "This License" refers to version 3 of the GNU Affero General Public License.

  "Copyright" also means copyright-like laws that apply to other kinds of
 works, such as semiconductor masks.
@@ -549,35 +537,45 @@ to collect a royalty for further conveying from those to whom you convey
 the Program, the only way you could satisfy both those terms and this
 License would be to refrain entirely from conveying the Program.

-  13. Use with the GNU Affero General Public License.
+  13. Remote Network Interaction; Use with the GNU General Public License.
+
+  Notwithstanding any other provision of this License, if you modify the
+Program, your modified version must prominently offer all users
+interacting with it remotely through a computer network (if your version
+supports such interaction) an opportunity to receive the Corresponding
+Source of your version by providing access to the Corresponding Source
+from a network server at no charge, through some standard or customary
+means of facilitating copying of software.  This Corresponding Source
+shall include the Corresponding Source for any work covered by version 3
+of the GNU General Public License that is incorporated pursuant to the
+following paragraph.

  Notwithstanding any other provision of this License, you have
 permission to link or combine any covered work with a work licensed
-under version 3 of the GNU Affero General Public License into a single
+under version 3 of the GNU General Public License into a single
 combined work, and to convey the resulting work.  The terms of this
 License will continue to apply to the part which is the covered work,
-but the special requirements of the GNU Affero General Public License,
-section 13, concerning interaction through a network will apply to the
-combination as such.
+but the work with which it is combined will remain governed by version
+3 of the GNU General Public License.

  14. Revised Versions of this License.

  The Free Software Foundation may publish revised and/or new versions of
-the GNU General Public License from time to time.  Such new versions will
-be similar in spirit to the present version, but may differ in detail to
+the GNU Affero General Public License from time to time.  Such new versions
+will be similar in spirit to the present version, but may differ in detail to
 address new problems or concerns.

  Each version is given a distinguishing version number.  If the
-Program specifies that a certain numbered version of the GNU General
+Program specifies that a certain numbered version of the GNU Affero General
 Public License "or any later version" applies to it, you have the
 option of following the terms and conditions either of that numbered
 version or of any later version published by the Free Software
 Foundation.  If the Program does not specify a version number of the
-GNU General Public License, you may choose any version ever published
+GNU Affero General Public License, you may choose any version ever published
 by the Free Software Foundation.

  If the Program specifies that a proxy can decide which future
-versions of the GNU General Public License can be used, that proxy's
+versions of the GNU Affero General Public License can be used, that proxy's
 public statement of acceptance of a version permanently authorizes you
 to choose that version for the Program.

@@ -620,3 +618,44 @@ copy of the Program in return for a fee.

                     END OF TERMS AND CONDITIONS

+            How to Apply These Terms to Your New Programs
+
+  If you develop a new program, and you want it to be of the greatest
+possible use to the public, the best way to achieve this is to make it
+free software which everyone can redistribute and change under these terms.
+
+  To do so, attach the following notices to the program.  It is safest
+to attach them to the start of each source file to most effectively
+state the exclusion of warranty; and each file should have at least
+the "copyright" line and a pointer to where the full notice is found.
+
+    <one line to give the program's name and a brief idea of what it does.>
+    Copyright (C) <year>  <name of author>
+
+    This program is free software: you can redistribute it and/or modify
+    it under the terms of the GNU Affero General Public License as published
+    by the Free Software Foundation, either version 3 of the License, or
+    (at your option) any later version.
+
+    This program is distributed in the hope that it will be useful,
+    but WITHOUT ANY WARRANTY; without even the implied warranty of
+    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+    GNU Affero General Public License for more details.
+
+    You should have received a copy of the GNU Affero General Public License
+    along with this program.  If not, see <https://www.gnu.org/licenses/>.
+
+Also add information on how to contact you by electronic and paper mail.
+
+  If your software can interact with users remotely through a computer
+network, you should also make sure that it provides a way for users to
+get its source.  For example, if your program is a web application, its
+interface could display a "Source" link that leads users to an archive
+of the code.  There are many ways you could offer source, and different
+solutions will be better for different programs; see section 13 for the
+specific requirements.
+
+  You should also get your employer (if you work as a programmer) or school,
+if any, to sign a "copyright disclaimer" for the program, if necessary.
+For more information on this, and how to apply and follow the GNU AGPL, see
+<https://www.gnu.org/licenses/>.
--- a/MANIFEST.in
+++ b/MANIFEST.in
@@ -1,5 +0,0 @@
-include Readme.md
-graft src/interface/*
-prune src/interface/web/images*
-prune docs*
-global-exclude .DS_Store *.py[cod]
--- a/README.md
+++ b/README.md
@@ -0,0 +1,78 @@
+<p align="center"><img src="src/khoj/interface/web/assets/icons/khoj-logo-sideways-500.png" width="230" alt="Khoj Logo"></p>
+
+<div align="center">
+
+[![test](https://github.com/khoj-ai/khoj/actions/workflows/test.yml/badge.svg)](https://github.com/khoj-ai/khoj/actions/workflows/test.yml)
+[![dockerize](https://github.com/khoj-ai/khoj/actions/workflows/dockerize.yml/badge.svg)](https://github.com/khoj-ai/khoj/pkgs/container/khoj)
+[![pypi](https://github.com/khoj-ai/khoj/actions/workflows/pypi.yml/badge.svg)](https://pypi.org/project/khoj-assistant/)
+![Discord](https://img.shields.io/discord/1112065956647284756?style=plastic&label=discord)
+
+</div>
+
+<div align="center">
+<b>The open-source, personal AI for your digital brain</b>
+</div>
+
+<br />
+
+<div align="center">
+
+[🤖 Read Docs](https://docs.khoj.dev)
+<span>&nbsp;&nbsp;•&nbsp;&nbsp;</span>
+[🏮 Khoj Cloud](https://khoj.dev)
+<span>&nbsp;&nbsp;•&nbsp;&nbsp;</span>
+[💬 Get Involved](https://discord.gg/BDgyabRM6e)
+<span>&nbsp;&nbsp;•&nbsp;&nbsp;</span>
+[📚 Read Blog](https://blog.khoj.dev)
+
+</div>
+
+<div align="left">
+
+***
+
+Khoj is an application that creates always-available, personal AI agents for you to extend your capabilities.
+- You can share your notes and documents to extend your digital brain.
+- Your AI agents have access to the internet, allowing you to incorporate realtime information.
+- Khoj is accessible on Desktop, Emacs, Obsidian, Web and WhatsApp.
+- You can share PDF, Markdown, Org-mode, Notion files and GitHub repositories.
+- You'll get fast, accurate semantic search on top of your docs.
+- Your agents can create deeply personal images and understand your speech.
+- Khoj is open-source, self-hostable. Always.
+
+***
+
+</div>
+
+## See it in action
+
+<img src="https://github.com/khoj-ai/khoj/blob/master/documentation/assets/img/using_khoj_for_studying.gif?raw=true" alt="Khoj Demo">
+
+Go to https://app.khoj.dev to see Khoj live.
+
+## Full feature list
+You can see the full feature list [here](https://docs.khoj.dev/category/features).
+
+## Self-Host
+
+To get started with self-hosting Khoj, [read the docs](https://docs.khoj.dev/get-started/setup).
+
+## Contributors
+Cheers to our awesome contributors! 🎉
+
+<a href="https://github.com/khoj-ai/khoj/graphs/contributors">
+  <img src="https://contrib.rocks/image?repo=khoj-ai/khoj" />
+</a>
+
+Made with [contrib.rocks](https://contrib.rocks).
+
+### Interested in Contributing?
+
+We are always looking for contributors to help us build new features, improve the project documentation, or fix bugs. If you're interested, please see our [Contributing Guidelines](https://docs.khoj.dev/contributing/development) and check out our [Contributors Project Board](https://github.com/orgs/khoj-ai/projects/4).
+
+## [Sponsors](https://github.com/sponsors/khoj-ai)
+Shout out to our brilliant sponsors! 🌈
+
+<a href="http://github.com/beekeeb">
+  <img src="https://raw.githubusercontent.com/beekeeb/piantor/main/docs/beekeeb.png" width="250" alt="Beekeeb logo" />
+</a>
--- a/Readme.md
+++ b/Readme.md
@@ -1,321 +0,0 @@
-# Khoj 🦅
-[![build](https://github.com/debanjum/khoj/actions/workflows/build.yml/badge.svg)](https://github.com/debanjum/khoj/actions/workflows/build.yml)
-[![test](https://github.com/debanjum/khoj/actions/workflows/test.yml/badge.svg)](https://github.com/debanjum/khoj/actions/workflows/test.yml)
-[![publish](https://github.com/debanjum/khoj/actions/workflows/publish.yml/badge.svg)](https://github.com/debanjum/khoj/actions/workflows/publish.yml)
-
-*A natural language search engine for your personal notes, transactions and images*
-
-## Table of Contents
-
- [Features](#Features)
- [Demos](#Demos)
-  - [Khoj in Obsidian](#khoj-in-obsidian)
-  - [Khoj in Emacs, Browser](#khoj-in-emacs-browser)
-  - [Interfaces](#Interfaces)
- [Architecture](#Architecture)
- [Setup](#Setup)
-  - [Install](#1-Install)
-  - [Configure](#2-Configure)
-  - [Run](#3-Run)
- [Use](#Use)
-  - [Interfaces](#Interfaces-1)
-  - [Query Filters](#Query-filters)
- [Upgrade](#Upgrade)
-  - [Khoj Server](#upgrade-khoj-server)
-  - [Khoj.el](#upgrade-khoj-on-emacs)
-  - [Khoj Obsidian](#upgrade-khoj-on-obsidian)
- [Troubleshoot](#Troubleshoot)
- [Advanced Usage](#advanced-usage)
-  - [Access Khoj on Mobile](#access-khoj-on-mobile)
- [Miscellaneous](#Miscellaneous)
- [Performance](#Performance)
-  - [Query Performance](#Query-performance)
-  - [Indexing Performance](#Indexing-performance)
-  - [Miscellaneous](#Miscellaneous-1)
- [Development](#Development)
-  - [Setup](#Setup)
-    - [Using Pip](#Using-Pip)
-    - [Using Docker](#Using-Docker)
-    - [Using Conda](#Test)
-  - [Test](#Test)
- [Credits](#Credits)
-
-## Features
-
- **Natural**: Advanced natural language understanding using Transformer based ML Models
- **Local**: Your personal data stays local. All search, indexing is done on your machine[\*](https://github.com/debanjum/khoj#miscellaneous)
- **Incremental**: Incremental search for a fast, search-as-you-type experience
- **Pluggable**: Modular architecture makes it easy to plug in new data sources, frontends and ML models
- **Multiple Sources**: Search your Org-mode and Markdown notes, Beancount transactions and Photos
- **Multiple Interfaces**: Search using a [Web Browser](./src/interface/web/index.html), [Emacs](./src/interface/emacs/khoj.el) or the [API](http://localhost:8000/docs)
-
-## Demos
-### Khoj in Obsidian
-https://user-images.githubusercontent.com/6413477/210486007-36ee3407-e6aa-4185-8a26-b0bfc0a4344f.mp4
-
-<details><summary>Description</summary>
-
- Install Khoj via `pip` and start Khoj backend in non-gui mode
- Install Khoj plugin via Community Plugins settings pane on Obsidian app
- Check the new Khoj plugin settings
- Let Khoj backend index the markdown files in the current Vault
- Open Khoj plugin on Obsidian via Search button on Left Pane
- Search \"*Announce plugin to folks*\" in the [Obsidian Plugin docs](https://marcus.se.net/obsidian-plugin-docs/)
- Jump to the [search result](https://marcus.se.net/obsidian-plugin-docs/publishing/submit-your-plugin)
-</details>
-
-### Khoj in Emacs, Browser
-https://user-images.githubusercontent.com/6413477/184735169-92c78bf1-d827-4663-9087-a1ea194b8f4b.mp4
-
-<details><summary>Description</summary>
-
- Install Khoj via pip
- Start Khoj app
- Add this readme and [khoj.el readme](https://github.com/debanjum/khoj/tree/master/src/interface/emacs) as org-mode for Khoj to index
- Search \"*Setup editor*\" on the Web and Emacs. Re-rank the results for better accuracy
- Top result is what we are looking for, the [section to Install Khoj.el on Emacs](https://github.com/debanjum/khoj/tree/master/src/interface/emacs#installation)
-</details>
-
-<details><summary>Analysis</summary>
-
- The results do not have any words used in the query
-  - *Based on the top result it seems the re-ranking model understands that Emacs is an editor?*
- The results incrementally update as the query is entered
- The results are re-ranked, for better accuracy, once user hits enter
-</details>
-
-### Interfaces
-
-![](https://github.com/debanjum/khoj/blob/master/docs/interfaces.png)
-
-## Architecture
-
-![](https://github.com/debanjum/khoj/blob/master/docs/khoj_architecture.png)
-
-## Setup
-These are the general setup instructions for Khoj.
-
-Check the [Khoj Obsidian Readme](https://github.com/debanjum/khoj/tree/master/src/interface/obsidian#Setup) to setup Khoj with the Obsidian Plugin. Its simpler as it can skip the configure step below.
-
-### 1. Install
-
-```shell
-pip install khoj-assistant
-```
-
-### 2. Start App
-
-```shell
-khoj
-```
-
-### 3. Configure
-
-1. Enable content types and point to files to search in the First Run Screen that pops up on app start
-2. Click `Configure` and wait. The app will download ML models and index the content for search
-
-## Use
-### Interfaces
-
- **Khoj via Obsidian**
-  - [Install](https://github.com/debanjum/khoj/tree/master/src/interface/obsidian#2-Setup-Plugin) the Khoj Obsidian plugin
-  - Click the *Khoj search* icon 🔎 on the [Ribbon](https://help.obsidian.md/User+interface/Workspace/Ribbon) or Search for *Khoj: Search* in the [Command Palette](https://help.obsidian.md/Plugins/Command+palette)
- **Khoj via Emacs**
-  - [Install](https://github.com/debanjum/khoj/tree/master/src/interface/emacs#installation) [khoj.el](./src/interface/emacs/khoj.el)
-  - Run `M-x khoj <user-query>`
- **Khoj via Web**
-  - Open <http://localhost:8000/> via desktop interface or directly
- **Khoj via API**
-  - See the Khoj FastAPI [Swagger Docs](http://localhost:8000/docs), [ReDocs](http://localhost:8000/redocs)
-
-### Query Filters
-Use structured query syntax to filter the natural language search results
- **Word Filter**: Get entries that include/exclude a specified term
-  - Entries that contain term_to_include: `+"term_to_include"`
-  - Entries that contain term_to_exclude: `-"term_to_exclude"`
- **Date Filter**: Get entries containing dates in YYYY-MM-DD format from specified date (range)
-  - Entries from April 1st 1984: `dt:"1984-04-01"`
-  - Entries after March 31st 1984: `dt>="1984-04-01"`
-  - Entries before April 2nd 1984 : `dt<="1984-04-01"`
- **File Filter**: Get entries from a specified file
-  - Entries from incoming.org file: `file:"incoming.org"`
- Combined Example
-  - `what is the meaning of life? file:"1984.org" dt>="1984-01-01" dt<="1985-01-01" -"big" -"brother"`
-  - Adds all filters to the natural language query. It should return entries
-    - from the file *1984.org*
-    - containing dates from the year *1984*
-    - excluding words *"big"* and *"brother"*
-    - that best match the natural language query *"what is the meaning of life?"*
-
-## Upgrade
-### Upgrade Khoj Server
-```shell
-pip install --upgrade khoj-assistant
-```
-
-### Upgrade Khoj on Emacs
- Use your Emacs Package Manager to Upgrade
- See [khoj.el readme](https://github.com/debanjum/khoj/tree/master/src/interface/emacs#Upgrade) for details
-
-### Upgrade Khoj on Obsidian
- Upgrade via the Community plugins tab on the settings pane in the Obsidian app
- See the [khoj plugin readme](https://github.com/debanjum/khoj/tree/master/src/interface/obsidian#2-Setup-Plugin) for details
-
-## Troubleshoot
-
- Symptom: Errors out complaining about Tensors mismatch, null etc
-  - Mitigation: Disable `image` search using the desktop GUI
- Symptom: Errors out with \"Killed\" in error message in Docker
-  - Fix: Increase RAM available to Docker Containers in Docker Settings
-  - Refer: [StackOverflow Solution](https://stackoverflow.com/a/50770267), [Configure Resources on Docker for Mac](https://docs.docker.com/desktop/mac/#resources)
-
-# Advanced Usage
-## Access Khoj on Mobile
-1. [Setup Khoj](#Setup) on your personal server. This can be any always-on machine, i.e an old computer, RaspberryPi(?) etc
-2. [Install](https://tailscale.com/kb/installation/) [Tailscale](tailscale.com/) on your personal server and phone
-3. Open the Khoj web interface of the server from your phone browser. It should be `http://tailscale-url-of-server:8000` or `http://name-of-server:8000` if you've setup [MagicDNS](https://tailscale.com/kb/1081/magicdns/)
-4. Click the [Install/Add to Homescreen](https://developer.mozilla.org/en-US/docs/Web/Progressive_web_apps/Add_to_home_screen) button
-5. Enjoy exploring your notes, transactions and images from your phone!
-
-![](https://github.com/debanjum/khoj/blob/master/docs/khoj_pwa_android.png)
-
-## Miscellaneous
-
- The beta [chat](http://localhost:8000/api/beta/chat) and [search](http://localhost:8000/api/beta/search) API endpoints use [OpenAI API](https://openai.com/api/)
-  - It is disabled by default
-  - To use it add your `openai-api-key` via the app configure screen
-  - Warning: *If you use the above beta APIs, your query and top result(s) will be sent to OpenAI for processing*
-
-## Performance
-
-### Query performance
-
- Semantic search using the bi-encoder is fairly fast at \<50 ms
- Reranking using the cross-encoder is slower at \<2s on 15 results. Tweak `top_k` to tradeoff speed for accuracy of results
- Filters in query (e.g by file, word or date) usually add \<20ms to query latency
-
-### Indexing performance
-
- Indexing is more strongly impacted by the size of the source data
- Indexing 100K+ line corpus of notes takes about 10 minutes
- Indexing 4000+ images takes about 15 minutes and more than 8Gb of RAM
- Note: *It should only take this long on the first run* as the index is incrementally updated
-
-### Miscellaneous
-
- Testing done on a Mac M1 and a \>100K line corpus of notes
- Search, indexing on a GPU has not been tested yet
-
-## Development
-### Setup
-#### Using Pip
-##### 1. Install
-
-```shell
-git clone https://github.com/debanjum/khoj && cd khoj
-python3 -m venv .venv && source .venv/bin/activate
-pip install -e .
-```
-
-##### 2. Configure
-
- Copy the `config/khoj_sample.yml` to `~/.khoj/khoj.yml`
- Set `input-files` or `input-filter` in each relevant `content-type` section of `~/.khoj/khoj.yml`
-  - Set `input-directories` field in `image` `content-type` section
- Delete `content-type` and `processor` sub-section(s) irrelevant for your use-case
-
-##### 3. Run
-
-```shell
-khoj -vv
-```
-Load ML model, generate embeddings and expose API to query notes, images, transactions etc specified in config YAML
-
-##### 4. Upgrade
-
-```shell
-# To Upgrade To Latest Stable Release
-# Maps to the latest tagged version of khoj on master branch
-pip install --upgrade khoj-assistant
-
-# To Upgrade To Latest Pre-Release
-# Maps to the latest commit on the master branch
-pip install --upgrade --pre khoj-assistant
-
-# To Upgrade To Specific Development Release.
-# Useful to test, review a PR.
-# Note: khoj-assistant is published to test PyPi on creating a PR
-pip install -i https://test.pypi.org/simple/ khoj-assistant==0.1.5.dev57166025766
-```
-
-#### Using Docker
-##### 1. Clone
-
-```shell
-git clone https://github.com/debanjum/khoj && cd khoj
-```
-
-##### 2. Configure
-
- **Required**: Update [docker-compose.yml](./docker-compose.yml) to mount your images, (org-mode or markdown) notes and beancount directories
- **Optional**: Edit application configuration in [khoj_docker.yml](./config/khoj_docker.yml)
-
-##### 3. Run
-
-```shell
-docker-compose up -d
-```
-
-*Note: The first run will take time. Let it run, it\'s mostly not hung, just generating embeddings*
-
-##### 4. Upgrade
-
-```shell
-docker-compose build --pull
-```
-
-#### Using Conda
-##### 1. Install Dependencies
- [Install Conda](https://docs.conda.io/projects/conda/en/latest/user-guide/install/index.html)
-
-##### 2. Install Khoj
-```shell
-git clone https://github.com/debanjum/khoj && cd khoj
-conda env create -f config/environment.yml
-conda activate khoj
-python3 -m pip install pyqt6  # As conda does not support pyqt6 yet
-```
-
-##### 3. Configure
- Copy the `config/khoj_sample.yml` to `~/.khoj/khoj.yml`
- Set `input-files` or `input-filter` in each relevant `content-type` section of `~/.khoj/khoj.yml`
-  - Set `input-directories` field in `image` `content-type` section
- Delete `content-type`, `processor` sub-sections irrelevant for your use-case
-
-##### 4. Run
-```shell
-python3 -m src.main -vv
-```
-  Load ML model, generate embeddings and expose API to query notes, images, transactions etc specified in config YAML
-
-##### 5. Upgrade
-```shell
-cd khoj
-git pull origin master
-conda deactivate khoj
-conda env update -f config/environment.yml
-conda activate khoj
-```
-
-### Test
-```shell
-pytest
-```
-
-## Credits
-
- [Multi-QA MiniLM Model](https://huggingface.co/sentence-transformers/multi-qa-MiniLM-L6-cos-v1), [All MiniLM Model](https://huggingface.co/sentence-transformers/all-MiniLM-L6-v2) for Text Search. See [SBert Documentation](https://www.sbert.net/examples/applications/retrieve_rerank/README.html)
- [OpenAI CLIP Model](https://github.com/openai/CLIP) for Image Search. See [SBert Documentation](https://www.sbert.net/examples/applications/image-search/README.html)
- Charles Cave for [OrgNode Parser](http://members.optusnet.com.au/~charles57/GTD/orgnode.html)
- [Org.js](https://mooz.github.io/org-js/) to render Org-mode results on the Web interface
- [Markdown-it](https://github.com/markdown-it/markdown-it) to render Markdown results on the Web interface
--- a/config/environment.yml
+++ b/config/environment.yml
@@ -1,21 +0,0 @@
-name: khoj
-channels:
-  - conda-forge
-dependencies:
-  - python=3.8.*
-  - numpy=1.22.4
-  - pytorch=1.11.0
-  - transformers=4.19.4
-  - sentence-transformers=2.1.0
-  - fastapi=0.77.1
-  - uvicorn=0.17.6
-  - pyyaml=6.0
-  - pytest=7.1.2
-  - pillow=8.4.0
-  - torchvision=0.12.0
-  - openai=0.20.0
-  - pydantic=1.9.1
-  - jinja2=3.1.2
-  - aiofiles=0.8.0
-  - huggingface_hub=0.8.1
-  - dateparser=1.1.1
--- a/config/environment_osx-arm64.yml
+++ b/config/environment_osx-arm64.yml
@@ -1,116 +0,0 @@
-name: khoj
-channels:
-  - conda-forge
-dependencies:
-  - aiofiles=0.8.0=pyhd8ed1ab_0
-  - asgiref=3.4.1=pyhd8ed1ab_0
-  - attrs=21.2.0=pyhd8ed1ab_0
-  - brotlipy=0.7.0=py39h5161555_1001
-  - ca-certificates=2022.6.15=h4653dfc_0
-  - certifi=2022.6.15=py39h2804cbe_0
-  - cffi=1.14.6=py39hda8b47f_0
-  - chardet=4.0.0=py39h2804cbe_1
-  - charset-normalizer=2.0.0=pyhd8ed1ab_0
-  - click=8.0.1=py39h2804cbe_0
-  - colorama=0.4.4=pyh9f0ad1d_0
-  - cryptography=3.4.7=py39h73257c9_0
-  - dataclasses=0.8=pyhc8e2a94_3
-  - dateparser=1.1.1=pyhd8ed1ab_0
-  - et_xmlfile=1.0.1=py_1001
-  - fastapi=0.68.2=pyhd8ed1ab_0
-  - filelock=3.0.12=pyh9f0ad1d_0
-  - freetype=2.10.4=h17b34a0_1
-  - future=0.18.2=py39h2804cbe_3
-  - h11=0.12.0=pyhd8ed1ab_0
-  - huggingface_hub=0.2.1=pyhd8ed1ab_0
-  - idna=3.1=pyhd3deb0d_0
-  - importlib-metadata=4.6.4=py39h2804cbe_0
-  - importlib_metadata=4.6.4=hd8ed1ab_0
-  - iniconfig=1.1.1=pyh9f0ad1d_0
-  - jbig=2.1=h3422bc3_2003
-  - jinja2=3.0.3=pyhd8ed1ab_0
-  - joblib=1.0.1=pyhd8ed1ab_0
-  - jpeg=9d=h27ca646_0
-  - lcms2=2.12=had6a04f_0
-  - lerc=2.2.1=h9f76cd9_0
-  - libblas=3.9.0=11_osxarm64_openblas
-  - libcblas=3.9.0=11_osxarm64_openblas
-  - libcxx=12.0.1=h168391b_0
-  - libdeflate=1.7=h27ca646_5
-  - libffi=3.3=h9f76cd9_2
-  - libgfortran=5.0.0.dev0=11_0_1_hf114ba7_23
-  - libgfortran5=11.0.1.dev0=hf114ba7_23
-  - liblapack=3.9.0=11_osxarm64_openblas
-  - libopenblas=0.3.17=openmp_h5dd58f0_1
-  - libpng=1.6.37=hf7e6567_2
-  - libprotobuf=3.16.0=hccf11d3_0
-  - libtiff=4.3.0=hc6122e1_1
-  - libwebp-base=1.2.1=h3422bc3_0
-  - llvm-openmp=12.0.1=hf3c4609_1
-  - lz4-c=1.9.3=hbdafb3b_1
-  - markupsafe=2.0.1=py39h5161555_1
-  - more-itertools=8.8.0=pyhd8ed1ab_0
-  - ncurses=6.2=h9aa5885_4
-  - ninja=1.10.2=h4d860bb_0
-  - nltk=3.6.2=pyhd8ed1ab_0
-  - numpy=1.21.4=py39h1f3b974_0
-  - olefile=0.46=pyh9f0ad1d_1
-  - openai=0.11.4=py39h2804cbe_0
-  - openjpeg=2.4.0=h062765e_1
-  - openpyxl=3.0.9=pyhd8ed1ab_0
-  - openssl=1.1.1q=ha287fd2_0
-  - packaging=21.0=pyhd8ed1ab_0
-  - pandas=1.3.4=py39h7f752ed_1
-  - pandas-stubs=1.2.0.38=py39h2804cbe_0
-  - pillow=8.3.2=py39ha74c66e_0
-  - pip=21.2.4=pyhd8ed1ab_0
-  - pluggy=0.13.1=py39h2804cbe_4
-  - py=1.10.0=pyhd3deb0d_0
-  - pycparser=2.20=pyh9f0ad1d_2
-  - pydantic=1.8.2=py39h5161555_2
-  - pyopenssl=20.0.1=pyhd8ed1ab_0
-  - pyparsing=2.4.7=pyh9f0ad1d_0
-  - pysocks=1.7.1=py39h2804cbe_3
-  - pytest=6.2.5=py39h2804cbe_1
-  - python=3.9.7=h54d631c_3_cpython
-  - python-dateutil=2.8.2=pyhd8ed1ab_0
-  - python-tzdata=2022.1=pyhd8ed1ab_0
-  - python_abi=3.9=2_cp39
-  - pytorch=1.9.0=cpu_py39he8fdc14_2
-  - pytorch-cpu=1.9.0=cpu_py39hd610c6a_2
-  - pytz=2021.3=pyhd8ed1ab_0
-  - pytz-deprecation-shim=0.1.0.post0=py39h2804cbe_2
-  - pyyaml=5.4.1=py39h5161555_1
-  - readline=8.1=hedafd6a_0
-  - regex=2021.8.21=py39h5161555_0
-  - requests=2.26.0=pyhd8ed1ab_0
-  - sacremoses=0.0.43=pyh9f0ad1d_0
-  - scikit-learn=0.24.2=py39hef7049f_1
-  - scipy=1.7.0=py39h5060c3b_0
-  - sentence-transformers=2.1.0=pyhd8ed1ab_0
-  - sentencepiece=0.1.95=py39h4d2d688_1
-  - setuptools=57.4.0=py39h2804cbe_0
-  - six=1.16.0=pyh6c4a22f_0
-  - sleef=3.5.1=h27ca646_1
-  - sqlite=3.36.0=h72a2b83_0
-  - starlette=0.14.2=pyhd8ed1ab_0
-  - threadpoolctl=2.2.0=pyh8a188c0_0
-  - tk=8.6.11=he1e0b03_0
-  - tokenizers=0.10.3=py39hab32027_1
-  - toml=0.10.2=pyhd8ed1ab_0
-  - torchvision=0.10.1=py39h0a40b5a_0_cpu
-  - tqdm=4.62.1=pyhd8ed1ab_0
-  - transformers=4.14.1=pyhd8ed1ab_0
-  - typing-extensions=3.10.0.0=hd8ed1ab_0
-  - typing_extensions=3.10.0.0=pyha770c72_0
-  - tzdata=2021a=he74cb21_1
-  - tzlocal=4.2=py39h2804cbe_1
-  - urllib3=1.26.6=pyhd8ed1ab_0
-  - uvicorn=0.16.0=py39h2804cbe_0
-  - wheel=0.37.0=pyhd8ed1ab_1
-  - xz=5.2.5=h642e427_1
-  - yaml=0.2.5=h642e427_0
-  - zipp=3.5.0=pyhd8ed1ab_0
-  - zlib=1.2.11=h31e879b_1009
-  - zstd=1.5.0=h861e0a7_0
-prefix: /opt/homebrew/Caskroom/miniforge/base/envs/khoj
--- a/config/khoj_docker.yml
+++ b/config/khoj_docker.yml
@@ -1,54 +0,0 @@
-content-type:
-  # The /data/folder/ prefix to the folders is here because this is
-  # the directory to which the local files are copied in the docker-compose.
-  # If changing, the docker-compose volumes should also be changed to match.
-  org:
-    input-files: null
-    input-filter: "/data/org/*.org"
-    compressed-jsonl: "/data/embeddings/notes.jsonl.gz"
-    embeddings-file: "/data/embeddings/note_embeddings.pt"
-    index_heading_entries: false
-
-  markdown:
-    input-files: null
-    input-filter: "/data/markdown/*.md"
-    compressed-jsonl: "/data/embeddings/markdown.jsonl.gz"
-    embeddings-file: "/data/embeddings/markdown_embeddings.pt"
-
-  ledger:
-    input-files: null
-    input-filter: /data/ledger/*.beancount
-    compressed-jsonl: /data/embeddings/transactions.jsonl.gz
-    embeddings-file: /data/embeddings/transaction_embeddings.pt
-
-  image:
-    input-directories: ["/data/images/"]
-    embeddings-file: "/data/embeddings/image_embeddings.pt"
-    batch-size: 50
-    use-xmp-metadata: false
-
-  music:
-    input-files: ["/data/music/music.org"]
-    input-filter: null
-    compressed-jsonl: "/data/embeddings/songs.jsonl.gz"
-    embeddings-file: "/data/embeddings/song_embeddings.pt"
-
-search-type:
-  symmetric:
-    encoder: "sentence-transformers/all-MiniLM-L6-v2"
-    cross-encoder: "cross-encoder/ms-marco-MiniLM-L-6-v2"
-    model_directory: "/data/models/symmetric"
-
-  asymmetric:
-    encoder: "sentence-transformers/multi-qa-MiniLM-L6-cos-v1"
-    cross-encoder: "cross-encoder/ms-marco-MiniLM-L-6-v2"
-    model_directory: "/data/models/asymmetric"
-
-  image:
-    encoder: "sentence-transformers/clip-ViT-B-32"
-    model_directory: "/data/models/image_encoder"
-
-processor:
-  #conversation:
-  #  openai-api-key: null
-  #  conversation-logfile: "/data/embeddings/conversation_logs.json"
--- a/config/khoj_sample.yml
+++ b/config/khoj_sample.yml
@@ -1,52 +0,0 @@
-content-type:
-  org:
-    input-files:  # ["/path/to/org-file.org"]  REQUIRED IF input-filter IS NOT SET OR
-    input-filter: # /path/to/org/*.org         REQUIRED IF input-files IS NOT SET
-    compressed-jsonl: "~/.khoj/content/org/org.jsonl.gz"
-    embeddings-file: "~/.khoj/content/org/org_embeddings.pt"
-    index_heading_entries: false  # Set to true to index entries with empty body
-
-  markdown:
-    input-files:  # ["/path/to/markdown-file.md"]  REQUIRED IF input-filter IS NOT SET OR
-    input-filter: # "/path/to/markdown/*.md"       REQUIRED IF input-files IS NOT SET
-    compressed-jsonl: "~/.khoj/content/markdown/markdown.jsonl.gz"
-    embeddings-file: "~/.khoj/content/markdown/markdown_embeddings.pt"
-
-  ledger:
-    input-files:  # ["/path/to/ledger-file.beancount"]  REQUIRED IF input-filter is not set OR
-    input-filter: # /path/to/ledger/*.beancount         REQUIRED IF input-files is not set
-    compressed-jsonl: "~/.khoj/content/ledger/ledger.jsonl.gz"
-    embeddings-file: "~/.khoj/content/ledger/ledger_embeddings.pt"
-
-  image:
-    input-directories: # ["/path/to/images/"]   REQUIRED IF input-filter IS NOT SET OR
-    input-filter:      # /path/to/images/*.jpg  REQUIRED IF input-directories IS NOT SET
-    embeddings-file: "~/.khoj/content/image/image_embeddings.pt"
-    batch-size: 50
-    use-xmp-metadata: false
-
-  music:
-    input-files:  # ["/path/to/music-file.org"] REQUIRED IF input-filter IS NOT SET OR
-    input-filter: # /path/to/music/*.org        REQUIRED IF input-files IS NOT SET
-    compressed-jsonl: "~/.khoj/content/music/music.jsonl.gz"
-    embeddings-file: "~/.khoj/content/music/music_embeddings.pt"
-
-search-type:
-  symmetric:
-    encoder: "sentence-transformers/all-MiniLM-L6-v2"
-    cross-encoder: "cross-encoder/ms-marco-MiniLM-L-6-v2"
-    model_directory: "~/.khoj/search/symmetric/"
-
-  asymmetric:
-    encoder: "sentence-transformers/multi-qa-MiniLM-L6-cos-v1"
-    cross-encoder: "cross-encoder/ms-marco-MiniLM-L-6-v2"
-    model_directory: "~/.khoj/search/asymmetric/"
-
-  image:
-    encoder: "sentence-transformers/clip-ViT-B-32"
-    model_directory: "~/.khoj/search/image/"
-
-processor:
-  conversation:
-    openai-api-key: # "YOUR_OPENAI_API_KEY"
-    conversation-logfile: "~/.khoj/processor/conversation/conversation_logs.json"
--- a/docker-compose.yml
+++ b/docker-compose.yml
@@ -1,29 +1,54 @@
 version: "3.9"
 services:
+  database:
+    image: ankane/pgvector
+    ports:
+      - "5432:5432"
+    environment:
+      POSTGRES_USER: postgres
+      POSTGRES_PASSWORD: postgres
+      POSTGRES_DB: postgres
+    volumes:
+      - khoj_db:/var/lib/postgresql/data/
+    healthcheck:
+      test: ["CMD-SHELL", "pg_isready -U postgres"]
+      interval: 30s
+      timeout: 10s
+      retries: 5
  server:
-    image: ghcr.io/debanjum/khoj:latest
+    depends_on:
+      database:
+        condition: service_healthy
+    # Use the following line to use the latest version of khoj. Otherwise, it will build from source.
+    image: ghcr.io/khoj-ai/khoj:latest
+    # Uncomment the following line to build from source. This will take a few minutes. Comment the next two lines out if you want to use the official image.
+    # build:
+      # context: .
    ports:
      # If changing the local port (left hand side), no other changes required.
-      # If changing the remote port (right hand side), 
-      #   change the port in the args in the build section, 
+      # If changing the remote port (right hand side),
+      #   change the port in the args in the build section,
      #   as well as the port in the command section to match
-      - "8000:8000"
+      - "42110:42110"
    working_dir: /app
    volumes:
-      - .:/app
-      # These mounted volumes hold the raw data that should be indexed for search. 
-      # The path in your local directory (left hand side)
-      #   points to the files you want to index.
-      # The path of the mounted directory (right hand side),
-      #   must match the path prefix in your config file.
-      - ./tests/data/org/:/data/org/
-      - ./tests/data/images/:/data/images/
-      - ./tests/data/ledger/:/data/ledger/
-      - ./tests/data/music/:/data/music/
-      - ./tests/data/markdown/:/data/markdown/
-      # Embeddings and models are populated after the first run
-      # You can set these volumes to point to empty directories on host
-      - ./tests/data/embeddings/:/data/embeddings/
-      - ./tests/data/models/:/data/models/
+      - khoj_config:/root/.khoj/
+      - khoj_models:/root/.cache/torch/sentence_transformers
    # Use 0.0.0.0 to explicitly set the host ip for the service on the container. https://pythonspeed.com/articles/docker-connection-refused/
-    command: --no-gui --host="0.0.0.0" --port=8000 -c=config/khoj_docker.yml -vv
+    environment:
+      - POSTGRES_DB=postgres
+      - POSTGRES_USER=postgres
+      - POSTGRES_PASSWORD=postgres
+      - POSTGRES_HOST=database
+      - POSTGRES_PORT=5432
+      - KHOJ_DJANGO_SECRET_KEY=secret
+      - KHOJ_DEBUG=False
+      - KHOJ_ADMIN_EMAIL=username@example.com
+      - KHOJ_ADMIN_PASSWORD=password
+    command: --host="0.0.0.0" --port=42110 -vv --anonymous-mode
+
+
+volumes:
+  khoj_config:
+  khoj_db:
+  khoj_models:
--- a/docs/interfaces.png
+++ b/docs/interfaces.png
--- a/docs/khoj_pwa_android.png
+++ b/docs/khoj_pwa_android.png
--- a/documentation/.gitignore
+++ b/documentation/.gitignore
@@ -0,0 +1,20 @@
+# Dependencies
+/node_modules
+
+# Production
+/build
+
+# Generated files
+.docusaurus
+.cache-loader
+
+# Misc
+.DS_Store
+.env.local
+.env.development.local
+.env.test.local
+.env.production.local
+
+npm-debug.log*
+yarn-debug.log*
+yarn-error.log*
--- a/documentation/README.md
+++ b/documentation/README.md
@@ -0,0 +1,41 @@
+# Website
+
+This website is built using [Docusaurus](https://docusaurus.io/), a modern static website generator.
+
+### Installation
+
+```
+$ yarn
+```
+
+### Local Development
+
+```
+$ yarn start
+```
+
+This command starts a local development server and opens up a browser window. Most changes are reflected live without having to restart the server.
+
+### Build
+
+```
+$ yarn build
+```
+
+This command generates static content into the `build` directory and can be served using any static contents hosting service.
+
+### Deployment
+
+Using SSH:
+
+```
+$ USE_SSH=true yarn deploy
+```
+
+Not using SSH:
+
+```
+$ GIT_USER=<Your GitHub username> yarn deploy
+```
+
+If you are using GitHub pages for hosting, this command is a convenient way to build the website and push to the `gh-pages` branch.
--- a/documentation/assets/.nojekyll
+++ b/documentation/assets/.nojekyll
--- a/documentation/assets/img/agents_demo.gif
+++ b/documentation/assets/img/agents_demo.gif
--- a/documentation/assets/img/dream_house.png
+++ b/documentation/assets/img/dream_house.png
--- a/documentation/assets/img/favicon-128x128.ico
+++ b/documentation/assets/img/favicon-128x128.ico
--- a/documentation/assets/img/khoj-logo-sideways-200.png
+++ b/documentation/assets/img/khoj-logo-sideways-200.png
--- a/documentation/assets/img/khoj-logo-sideways-500.png
+++ b/documentation/assets/img/khoj-logo-sideways-500.png
--- a/documentation/assets/img/khoj-logo-sideways.svg
+++ b/documentation/assets/img/khoj-logo-sideways.svg
--- a/documentation/assets/img/khoj_architecture.png
+++ b/documentation/assets/img/khoj_architecture.png
--- a/documentation/assets/img/khoj_chat_on_desktop.png
+++ b/documentation/assets/img/khoj_chat_on_desktop.png
--- a/documentation/assets/img/khoj_chat_on_emacs.png
+++ b/documentation/assets/img/khoj_chat_on_emacs.png
--- a/documentation/assets/img/khoj_chat_on_obsidian.png
+++ b/documentation/assets/img/khoj_chat_on_obsidian.png
--- a/documentation/assets/img/khoj_chat_on_web.png
+++ b/documentation/assets/img/khoj_chat_on_web.png
--- a/documentation/assets/img/khoj_clients.svg
+++ b/documentation/assets/img/khoj_clients.svg
--- a/documentation/assets/img/khoj_codebase_visualization_0.2.1.png
+++ b/documentation/assets/img/khoj_codebase_visualization_0.2.1.png
--- a/documentation/assets/img/khoj_datasources.svg
+++ b/documentation/assets/img/khoj_datasources.svg
--- a/documentation/assets/img/khoj_emacs_menu.png
+++ b/documentation/assets/img/khoj_emacs_menu.png
--- a/documentation/assets/img/khoj_obsidian_codebase_visualization_0.2.1.png
+++ b/documentation/assets/img/khoj_obsidian_codebase_visualization_0.2.1.png
--- a/documentation/assets/img/khoj_pwa_android.png
+++ b/documentation/assets/img/khoj_pwa_android.png
--- a/documentation/assets/img/khoj_search_on_desktop.png
+++ b/documentation/assets/img/khoj_search_on_desktop.png
--- a/documentation/assets/img/khoj_search_on_emacs.png
+++ b/documentation/assets/img/khoj_search_on_emacs.png
--- a/documentation/assets/img/khoj_search_on_obsidian.png
+++ b/documentation/assets/img/khoj_search_on_obsidian.png
--- a/documentation/assets/img/khoj_search_on_web.png
+++ b/documentation/assets/img/khoj_search_on_web.png
--- a/documentation/assets/img/logo.svg
+++ b/documentation/assets/img/logo.svg
--- a/documentation/assets/img/notion_integration.gif
+++ b/documentation/assets/img/notion_integration.gif
--- a/documentation/assets/img/plants_i_got.png
+++ b/documentation/assets/img/plants_i_got.png
--- a/documentation/assets/img/pwa_install_1.png
+++ b/documentation/assets/img/pwa_install_1.png
--- a/documentation/assets/img/pwa_install_2.png
+++ b/documentation/assets/img/pwa_install_2.png
--- a/documentation/assets/img/pwa_install_3.png
+++ b/documentation/assets/img/pwa_install_3.png
--- a/documentation/assets/img/using_khoj_for_studying.gif
+++ b/documentation/assets/img/using_khoj_for_studying.gif
--- a/documentation/babel.config.js
+++ b/documentation/babel.config.js
@@ -0,0 +1,3 @@
+module.exports = {
+  presets: [require.resolve('@docusaurus/core/lib/babel/preset')],
+};
--- a/documentation/docs/clients/_category_.json
+++ b/documentation/docs/clients/_category_.json
@@ -0,0 +1,8 @@
+{
+  "label": "Clients",
+  "position": 4,
+  "link": {
+    "type": "generated-index",
+    "description": "Different ways for indexing data with the Khoj backend. To see online data sources, go to https://docs.khoj.dev/category/data-sources"
+  }
+}
--- a/documentation/docs/clients/desktop.md
+++ b/documentation/docs/clients/desktop.md
@@ -0,0 +1,32 @@
+---
+sidebar_position: 1
+---
+
+# Desktop
+
+> Query your Second Brain from your machine
+
+Use the Desktop app to chat and search with Khoj.
+You can also sync any relevant files with Khoj using the app.
+Khoj will use these files to provide contextual responses when you search or chat.
+
+## Features
+- **Chat**
+  - **Faster answers**: Find answers quickly, from your private notes or the public internet
+  - **Assisted creativity**: Smoothly weave across retrieving answers and generating content
+  - **Iterative discovery**: Iteratively explore and re-discover your notes
+- **Search**
+  - **Natural**: Advanced natural language understanding using Transformer based ML Models
+  - **Incremental**: Incremental search for a fast, search-as-you-type experience
+
+## Setup
+
+1. Install the [Khoj Desktop app](https://khoj.dev/downloads) for your OS
+2. Generate an API key on the [Khoj Web App](https://app.khoj.dev/config#clients)
+3. Set your Khoj API Key on the *Settings* page of the Khoj Desktop app
+4. [Optional] Add any files, folders you'd like Khoj to be aware of on the *Settings* page and Click *Save*
+
+## Interface
+| Chat | Search |
+|:----:|:------:|
+| ![](/img/khoj_chat_on_desktop.png) | ![](/img/khoj_search_on_desktop.png) |
--- a/documentation/docs/clients/emacs.md
+++ b/documentation/docs/clients/emacs.md
@@ -0,0 +1,137 @@
+---
+sidebar_position: 2
+---
+
+# Emacs
+
+<img src="https://stable.melpa.org/packages/khoj-badge.svg" width="130" alt="Melpa Stable Badge" />
+<img src="https://melpa.org/packages/khoj-badge.svg" width="150" alt="Melpa Badge" />
+
+<img src="https://github.com/khoj-ai/khoj/actions/workflows/build_khoj_el.yml/badge.svg" width="150" alt="Build Badge" />
+<img src="https://github.com/khoj-ai/khoj/actions/workflows/test_khoj_el.yml/badge.svg" width="150" alt="Test Badge" />
+
+<br />
+<br />
+> Query your Second Brain from Emacs
+
+## Features
+- **Chat**
+  - **Faster answers**: Find answers quickly, from your private notes or the public internet
+  - **Assisted creativity**: Smoothly weave across retrieving answers and generating content
+  - **Iterative discovery**: Iteratively explore and re-discover your notes
+- **Search**
+  - **Natural**: Advanced natural language understanding using Transformer based ML Models
+  - **Incremental**: Incremental search for a fast, search-as-you-type experience
+
+## Interface
+
+| Search | Chat |
+|:------:|:----:|
+| ![khoj search on emacs](/img/khoj_search_on_emacs.png) | ![khoj chat on emacs](/img/khoj_chat_on_emacs.png) |
+
+## Setup
+1. Generate an API key on the [Khoj Web App](https://app.khoj.dev/config#clients)
+2. Add below snippet to your Emacs config file, usually at `~/.emacs.d/init.el`
+
+
+#### **Direct Install**
+*Khoj will index your org-agenda files, by default*
+
+```elisp
+;; Install Khoj.el
+M-x package-install khoj
+
+; Set your Khoj API key
+(setq khoj-api-key "YOUR_KHOJ_CLOUD_API_KEY")
+```
+
+#### **Minimal Install**
+*Khoj will index your org-agenda files, by default*
+
+```elisp
+;; Install Khoj client from MELPA Stable
+(use-package khoj
+  :ensure t
+  :pin melpa-stable
+  :bind ("C-c s" . 'khoj)
+  :config (setq khoj-api-key "YOUR_KHOJ_CLOUD_API_KEY"))
+```
+
+#### **Standard Install**
+*Configures the specified org files, directories to be indexed by Khoj*
+
+```elisp
+;; Install Khoj client from MELPA Stable
+(use-package khoj
+  :ensure t
+  :pin melpa-stable
+  :bind ("C-c s" . 'khoj)
+  :config (setq khoj-api-key "YOUR_KHOJ_CLOUD_API_KEY"
+                khoj-org-directories '("~/docs/org-roam" "~/docs/notes")
+                khoj-org-files '("~/docs/todo.org" "~/docs/work.org")))
+```
+
+#### **Straight.el**
+*Configures the specified org files, directories to be indexed by Khoj*
+
+```elisp
+;; Install Khoj client using Straight.el
+(use-package khoj
+  :after org
+  :straight (khoj :type git :host github :repo "khoj-ai/khoj" :files (:defaults "src/interface/emacs/khoj.el"))
+  :bind ("C-c s" . 'khoj)
+  :config (setq khoj-api-key "YOUR_KHOJ_CLOUD_API_KEY"
+                khoj-org-directories '("~/docs/org-roam" "~/docs/notes")
+                khoj-org-files '("~/docs/todo.org" "~/docs/work.org")))
+```
+
+## Use
+### Search
+See [Khoj Search](/features/search) for details
+1. Hit  `C-c s s` (or `M-x khoj RET s`) to open khoj search
+2. Enter your query in natural language<br/>
+  E.g *"What is the meaning of life?"*, *"My life goals for 2023"*
+
+### Chat
+See [Khoj Chat](/features/chat) for details
+1. Hit `C-c s c` (or `M-x khoj RET c`) to open khoj chat
+2. Ask questions in a natural, conversational style<br/>
+  E.g *"When did I file my taxes last year?"*
+
+### Find Similar Entries
+This feature finds entries similar to the one you are currently on.
+1. Move cursor to the org-mode entry, markdown section or text paragraph you want to find similar entries for
+2. Hit `C-c s f` (or `M-x khoj RET f`) to find similar entries
+
+### Advanced Usage
+- Add [query filters](https://github.com/khoj-ai/khoj/#query-filters) during search to narrow down results further
+  e.g `What is the meaning of life? -"god" +"none" dt>"last week"`
+
+- Use `C-c C-o 2` to open the current result at cursor in its source org file
+  - This calls `M-x org-open-at-point` on the current entry and opens the second link in the entry.
+  - The second link is the entry's [org-id](https://orgmode.org/manual/Handling-Links.html#FOOT28), if set, or the heading text.
+    The first link is the line number of the entry in the source file. This link is less robust to file changes.
+  - Note: If you have [speed keys](https://orgmode.org/manual/Speed-Keys.html) enabled, `o 2` will also work
+
+### Khoj Menu
+![](/img/khoj_emacs_menu.png)
+Hit `C-c s` (or `M-x khoj`) to open the khoj menu above. Then:
+- Hit `t` until your preferred content type is selected in the khoj menu
+  `Content Type` specifies the content to perform `Search`, `Update` or `Find Similar` actions on
+- Hit `n` twice and then enter number of results you want to see
+  `Results Count` is used by the `Search` and `Find Similar` actions
+- Hit `-f u` to `force` update the khoj content index
+  The `Force Update` switch is only used by the `Update` action
+
+## Upgrade
+Use your Emacs package manager to upgrade `khoj.el`
+<!-- tabs:start -->
+
+#### **With MELPA**
+1. Run `M-x package-refresh-contents`
+2. Run `M-x package-reinstall khoj`
+
+#### **With Straight.el**
+- Run `M-x straight-pull-package khoj`
+
+<!-- tabs:end -->
--- a/documentation/docs/clients/obsidian.md
+++ b/documentation/docs/clients/obsidian.md
@@ -0,0 +1,59 @@
+---
+sidebar_position: 3
+---
+
+# Obsidian
+
+> Query your Second Brain from Obsidian
+
+## Features
+- **Chat**
+  - **Faster answers**: Find answers quickly, from your private notes or the public internet
+  - **Assisted creativity**: Smoothly weave across retrieving answers and generating content
+  - **Iterative discovery**: Iteratively explore and re-discover your notes
+- **Search**
+  - **Natural**: Advanced natural language understanding using Transformer based ML Models
+  - **Incremental**: Incremental search for a fast, search-as-you-type experience
+
+## Interface
+
+| Search | Chat |
+|:------:|:----:|
+| ![](/img/khoj_search_on_obsidian.png) | ![](/img/khoj_chat_on_obsidian.png) |
+
+
+## Setup
+
+  1. Open [Khoj](https://obsidian.md/plugins?id=khoj) from the *Community plugins* tab in Obsidian settings panel
+  2. Click *Install*, then *Enable* on the Khoj plugin page in Obsidian
+  3. Generate an API key on the [Khoj Web App](https://app.khoj.dev/config#clients)
+  4. Set your Khoj API Key in the Khoj plugin settings in Obsidian
+
+See the official [Obsidian Plugin Docs](https://help.obsidian.md/Extending+Obsidian/Community+plugins) for more details on installing Obsidian plugins.
+
+## Use
+### Chat
+Click the *Khoj chat* icon 💬 on the [Ribbon](https://help.obsidian.md/User+interface/Workspace/Ribbon) or run *Khoj: Chat* from the [Command Palette](https://help.obsidian.md/Plugins/Command+palette) and ask questions in a natural, conversational style.<br />
+E.g *"When did I file my taxes last year?"*
+
+See [Khoj Chat](/features/chat) for more details
+
+### Find Similar Notes
+To see other notes similar to the current one, run *Khoj: Find Similar Notes* from the [Command Palette](https://help.obsidian.md/Plugins/Command+palette)
+
+### Search
+Run *Khoj: Search* from the [Command Palette](https://help.obsidian.md/Plugins/Command+palette)
+
+See [Khoj Search](/features/search) for more details. Use [query filters](/miscellaneous/advanced#query-filters) to limit entries to search
+
+[search_demo](https://user-images.githubusercontent.com/6413477/218801155-cd67e8b4-a770-404a-8179-d6b61caa0f93.mp4 ':include :type=mp4')
+
+## Upgrade
+  1. Open *Community plugins* tab in Obsidian settings
+  2. Click the *Check for updates* button
+  3. Click the *Update* button next to Khoj, if available
+
+## Troubleshooting
+  - Open the Khoj plugin settings pane, to configure Khoj
+  - Toggle Enable/Disable Khoj, if setting changes have not applied
+  - Click *Update* button to force index to refresh, if results are failing or stale
--- a/documentation/docs/clients/web.md
+++ b/documentation/docs/clients/web.md
@@ -0,0 +1,45 @@
+---
+sidebar_position: 4
+---
+
+# Web
+
+> Query your Second Brain from your Web Browser
+
+Without any desktop clients, you can start chatting with Khoj on the web. Bear in mind you do need one of the desktop clients in order to share and sync your data with Khoj.
+
+## Features
+- **Chat**
+  - **Faster answers**: Find answers quickly, from your private notes or the public internet
+  - **Assisted creativity**: Smoothly weave across retrieving answers and generating content
+  - **Iterative discovery**: Iteratively explore and re-discover your notes
+- **Search**
+  - **Natural**: Advanced natural language understanding using Transformer based ML Models
+  - **Incremental**: Incremental search for a fast, search-as-you-type experience
+
+## Setup
+No setup required. The Khoj web app is the default Khoj client. You can access it from any web browser. Try it on [Khoj Cloud](https://app.khoj.dev)
+
+## Upload Documents
+You can upload documents to Khoj from the web interface, one at a time. This is useful for uploading documents from your phone or tablet. To upload a document:
+1. You can drag and drop the document into the chat window.
+2. Or click the paperclip icon in the chat window and select the document from your file system.
+
+![demo of dragging and dropping a file](https://khoj-web-bucket.s3.amazonaws.com/drag_drop_file.gif)
+
+### Install on Phone
+You can optionally install Khoj as a [Progressive Web App (PWA)](https://web.dev/learn/pwa/installation). This makes it quick and easy to access Khoj on your phone.
+1. Login to [Khoj Cloud](https://app.khoj.dev) or your self-hosted Khoj server from the web browser (prefer Chrome/Edge) on your phone
+2. Open the 3 dot menu on the browser and click the "Add to Home screen" option
+3. Click "Install" on the next screen to add the Khoj icon to your phone Home screen
+
+**Process via Screenshots**
+| Step 1 | Step 2 | Step 3|
+|:---:|:---:|:---:|
+| ![](/img/pwa_install_1.png) | ![](/img/pwa_install_2.png) | ![](/img/pwa_install_3.png) |
+
+## Interface
+
+| Search | Chat |
+|:------:|:----:|
+| ![](/img/khoj_search_on_web.png) | ![](/img/khoj_chat_on_web.png) |
--- a/documentation/docs/clients/whatsapp.md
+++ b/documentation/docs/clients/whatsapp.md
@@ -0,0 +1,28 @@
+---
+sidebar_position: 5
+---
+
+# WhatsApp
+
+> Query your Second Brain from WhatsApp
+
+Text [+1 (848) 800 4242](https://wa.me/18488004242) or scan [this QR code](https://khoj.dev/whatsapp) on your phone to chat with Khoj on WhatsApp.
+
+Without any desktop clients, you can start chatting with Khoj on WhatsApp. Bear in mind you do need one of the desktop clients in order to share and sync your data with Khoj. The WhatsApp AI bot will work right away for answering generic queries and using Khoj in default mode.
+
+In order to use Khoj on WhatsApp with your own data, you need to setup a Khoj Cloud account and connect your WhatsApp account to it. This is a one time setup and you can do it from the [Khoj Cloud config page](https://app.khoj.dev/config).
+
+If you hit usage limits for the WhatsApp bot, upgrade to [a paid plan](https://khoj.dev/pricing) on Khoj Cloud.
+
+## Features
+
+- **Slash Commands**: Use slash commands to quickly access Khoj features
+    - `/online`: Get responses from Khoj powered by online search.
+    - `/dream`: Generate an image in response to your prompt.
+    - `/notes`: Explicitly force Khoj to retrieve context from your notes. Note: You'll need to connect your WhatsApp account to a Khoj Cloud account for this to work.
+
+We have more commands under development, including `/share` to upload documents directly to your Khoj account from WhatsApp, and `/speak` to get a speech response from Khoj. Feel free to [raise an issue](https://github.com/khoj-ai/flint/issues) if you have any suggestions for new commands.
+
+## Nerdy Details
+
+You can find all of the code for the WhatsApp bot in the [flint repository](https://github.com/khoj-ai/flint). Like all of our code, it is open source and you can contribute to it.
--- a/documentation/docs/contributing/_category_.json
+++ b/documentation/docs/contributing/_category_.json
@@ -0,0 +1,8 @@
+{
+  "label": "Contributing",
+  "position": 2,
+  "link": {
+    "type": "generated-index",
+    "description": "Development Setup"
+  }
+}
--- a/documentation/docs/contributing/development.mdx
+++ b/documentation/docs/contributing/development.mdx
@@ -0,0 +1,181 @@
+---
+sidebar_position: 0
+---
+
+# Development
+
+Welcome to the development docs of Khoj! Thanks for your interest in being a contributor ❤️. Open source contributors are a cornerstone of the Khoj community. We welcome all contributions, big or small.
+
+To get started with contributing, check out the official GitHub docs on [contributing to an open-source project](https://docs.github.com/en/get-started/exploring-projects-on-github/contributing-to-a-project).
+
+Join the [Discord](https://discord.gg/WaxF3SkFPU) server and click the ✅ for the question "Are you interested in becoming a contributor?" in the `#welcome-and-rules` channel. This will give you access to the `#contributors` channel where you can ask questions and get help from other contributors.
+
+If you're looking for a place to get started, check out the list of [Github Issues](https://github.com/khoj-ai/khoj/issues) with the tag `good first issue` to find issues that are good for first-time contributors.
+
+## Local Server Installation
+### Using Pip
+#### 1. Install
+```mdx-code-block
+import Tabs from '@theme/Tabs';
+import TabItem from '@theme/TabItem';
+```
+
+```mdx-code-block
+  <Tabs>
+    <TabItem value="macos" label="MacOS">
+    ```shell
+# Get Khoj Code
+git clone https://github.com/khoj-ai/khoj && cd khoj
+
+# Create, Activate Virtual Environment
+python3 -m venv .venv && source .venv/bin/activate
+
+# For MacOS or zsh users run this
+pip install -e '.[dev]'
+    ```
+    </TabItem>
+    <TabItem value="win" label="Windows">
+    ```shell
+# Get Khoj Code
+git clone https://github.com/khoj-ai/khoj && cd khoj
+
+# Create, Activate Virtual Environment
+python3 -m venv .venv && .venv\Scripts\activate
+
+# Install Khoj for Development
+pip install -e .[dev]
+      ```
+    </TabItem>
+    <TabItem value="unix" label="Linux">
+      ```shell
+    # Get Khoj Code
+git clone https://github.com/khoj-ai/khoj && cd khoj
+
+# Create, Activate Virtual Environment
+python3 -m venv .venv && source .venv/bin/activate
+
+# Install Khoj for Development
+pip install -e .[dev]
+      ```
+    </TabItem>
+  </Tabs>
+```
+
+
+#### 2. Run
+1. Start Khoj
+   ```bash
+   khoj -vv
+   ```
+2. Configure Khoj
+   - **Via the Desktop application**: Add files, directories to index using the settings page of your desktop application. Click "Save" to immediately trigger indexing.
+
+  Note: After configuration, wait for Khoj to load the ML model, generate embeddings and expose the API to query notes, images, documents, etc. specified in the config YAML.
+
+### Using Docker
+
+Make sure you install the latest version of [Docker](https://docs.docker.com/get-docker/) and [Docker Compose](https://docs.docker.com/compose/install/).
+
+#### 1. Clone
+
+```shell
+git clone https://github.com/khoj-ai/khoj && cd khoj
+```
+
+#### 2. Configure
+
+1. Update [docker-compose.yml](https://github.com/khoj-ai/khoj/blob/master/docker-compose.yml) to use relevant environment variables.
+2. Comment out the `image` line and uncomment the `build` line in the `server` service
+
+#### 3. Run
+
+This will start the Khoj server, and the database.
+
+```shell
+docker-compose up -d
+```
+
+#### 4. Upgrade
+
+If you've made changes to the codebase, you'll need to rebuild the Docker image before running the container again.
+
+```shell
+docker-compose build --no-cache
+```
+
+## Update clients
+In whichever clients you're using for testing, you'll need to update the server URL to point to your local server. By default, the local server URL should be `http://127.0.0.1:42110`.
+
+## Validate
+### Before Making Changes
+1. Install Git Hooks for Validation
+   ```shell
+   pre-commit install -t pre-push -t pre-commit
+   ```
+   - This ensures standard code formatting fixes and other checks run automatically on every commit and push
+   - Note 1: If [pre-commit](https://pre-commit.com/#intro) didn't already get installed, [install it](https://pre-commit.com/#install) via `pip install pre-commit`
+   - Note 2: To run the pre-commit changes manually, use `pre-commit run --hook-stage manual --all` before creating PR
+
+### Before Creating PR
+
+:::tip[Note]
+You should be in an active virtual environment for Khoj in order to run the unit tests and linter.
+:::
+
+1. Ensure that you have a [Github Issue](https://github.com/khoj-ai/khoj/issues) that can be linked to the PR. If not, create one. Make sure you've tagged one of the maintainers to the issue. This will ensure that the maintainers are notified of the PR and can review it. It's best to discuss the code design on an existing issue or Discord thread before creating a PR. This helps get your PR merged faster.
+1. Run unit tests.
+   ```shell
+   pytest
+   ```
+2. Run the linter.
+   ```shell
+   mypy
+   ```
+4. Think about how to add unit tests to verify the functionality you're adding in the PR. If you're not sure how to do this, ask for help in the Github issue or on Discord's `#contributors` channel.
+
+### After Creating PR
+1. Automated [validation workflows](https://github.com/khoj-ai/khoj/tree/master/.github/workflows) should run for every PR. Tag one of the maintainers in the PR to trigger it.
+
+## Obsidian Plugin Development
+### Plugin development setup
+The core code for the Obsidian plugin is under `src/interface/obsidian`. The file `main.ts` is a good place to start.
+
+1. In your CLI, go to the directory `src/interface/obsidian` in the Khoj repository.
+2. Run `yarn install` to install the dependencies.
+3. Run `yarn dev` to start the development server. This will continually rebuild the plugin as you make changes to the code.
+    - Your code changes will be outputted to a file called `main.js` in the `obsidian` directory.
+
+### Loading your development plugin in Obsidian
+1. Make sure you have the Khoj plugin installed in Obsidian. [See the plugin page](https://publish.obsidian.md/hub/02+-+Community+Expansions/02.05+All+Community+Expansions/Plugins/khoj).
+1. Open Obsidian and go to your settings (gear icon in the bottom left corner)
+2. Click on 'Community Plugins' in the left panel
+3. Next to the 'Installed Plugins' heading, click on the folder icon to open the folder with the plugin's source code.
+4. Open the `khoj` folder in the file explorer that opens. You'll see a file called `main.js` in this folder. To test your changes, replace this file with the `main.js` file that was generated by the development server in the previous section.
+
+## Create Khoj Release (Only for Maintainers)
+Follow the steps below to [release](https://github.com/debanjum/khoj/releases/) Khoj. This will create a stable release of Khoj on [Pypi](https://pypi.org/project/khoj-assistant/), [Melpa](https://stable.melpa.org/#/khoj) and [Obsidian](https://obsidian.md/plugins?id=khoj). It will also create desktop apps of Khoj and attach them to the latest release.
+
+1. Create and tag release commit by running the bump_version script. The release commit sets version number in required metadata files.
+  ```shell
+  ./scripts/bump_version.sh -c "<release_version>"
+  ```
+2. Push commit and then the tag to trigger the release workflow to create Release with auto generated release notes.
+  ```shell
+  git push origin master  # push release commit to khoj repository
+  git push origin <release_version>  # push release tag to khoj repository
+  ```
+3. [Optional] Update the Release Notes to highlight new features, fixes and updates
+
+## Architecture
+
+![](/img/khoj_architecture.png)
+
+## Visualize Codebase
+
+*[Interactive Visualization](https://mango-dune-07a8b7110.1.azurestaticapps.net/?repo=debanjum%2Fkhoj)*
+
+![](/img/khoj_codebase_visualization_0.2.1.png)
+
+## Visualize Khoj Obsidian Plugin Codebase
+
+![](/img/khoj_obsidian_codebase_visualization_0.2.1.png)
--- a/documentation/docs/features/_category_.json
+++ b/documentation/docs/features/_category_.json
@@ -0,0 +1,8 @@
+{
+  "label": "Features",
+  "position": 3,
+  "link": {
+    "type": "generated-index",
+    "description": "Features supported by Khoj"
+  }
+}
--- a/documentation/docs/features/agents.md
+++ b/documentation/docs/features/agents.md
@@ -0,0 +1,15 @@
+---
+sidebar_position: 4
+---
+
+# Agents
+
+You can use agents to set up custom system prompts with Khoj. The server host can set up their own agents, which are accessible to all users. You can see ours at https://app.khoj.dev/agents.
+
+![Demo](/img/agents_demo.gif)
+
+## Creating an Agent (Self-Hosted)
+
+Go to `server/admin/database/agent` on your server and click `Add Agent` to create a new one. You have to set it to `public` in order for it to be accessible to all the users on your server. To limit access to a specific user, do not set the `public` flag and add the user in the `Creator` field.
+
+Set your custom prompt in the `personality` field.
--- a/documentation/docs/features/all_features.md
+++ b/documentation/docs/features/all_features.md
@@ -0,0 +1,34 @@
+---
+sidebar_position: 1
+---
+
+# Overview
+
+Khoj supports a variety of features, including search and chat with a wide range of data sources and interfaces.
+
+#### [Search](/features/search)
+  - **Local**: Your personal data stays local. All search and indexing is done on your machine when you [self-host](/get-started/setup)
+  - **Incremental**: Incremental search for a fast, search-as-you-type experience
+
+#### [Chat](/features/chat)
+  - **Faster answers**: Find answers faster, smoother than search. No need to manually scan through your notes to find answers.
+  - **Iterative discovery**: Iteratively explore and (re-)discover your notes
+  - **Assisted creativity**: Smoothly weave across answers retrieval and content generation
+  - **Works online or offline**: Chat using online or offline AI chat models
+
+#### General
+  - **Cloud or Self-Host**: Use [cloud](https://app.khoj.dev/login) to use Khoj anytime from anywhere or [self-host](/get-started/setup) for privacy
+  - **Natural**: Advanced natural language understanding using Transformer based ML Models
+  - **Pluggable**: Modular architecture makes it easy to plug in new data sources, frontends and ML models
+  - **Multiple Sources**: Index your Org-mode, Markdown, PDF, plaintext files, Github repos and Notion pages
+  - **Multiple Interfaces**: Interact from your Web Browser, Emacs, Obsidian, Desktop app or even WhatsApp
+
+### Supported Interfaces
+Khoj is available as a [Desktop app](/clients/desktop), [Emacs package](/clients/emacs), [Obsidian plugin](/clients/obsidian), [Web app](/clients/web) and a [WhatsApp AI](https://khoj.dev/whatsapp).
+
+![](/img/khoj_clients.svg ':size=400px')
+
+### Supported Data Sources
+Khoj can understand your org-mode, markdown, PDF, plaintext files, [Github projects](/online-data-sources/github_integration) and [Notion pages](/online-data-sources/notion_integration).
+
+![](/img/khoj_datasources.svg ':size=200px')
--- a/documentation/docs/features/chat.md
+++ b/documentation/docs/features/chat.md
@@ -0,0 +1,64 @@
+---
+sidebar_position: 2
+---
+
+# Chat
+
+You can configure Khoj to chat with you about anything. When relevant, it'll use any notes or documents you shared with it to respond.
+
+### Overview
+- Creates a personal assistant for you to inquire and engage with your notes
+- You can choose to use Online or Offline Chat depending on your requirements
+- Supports multi-turn conversations with the relevant notes for context
+- Shows reference notes used to generate a response
+
+### Setup (Self-Hosting)
+#### Offline Chat
+Offline chat stays completely private and can work without internet using open-source models.
+
+> **System Requirements**:
+>  - Minimum 8 GB RAM. Recommend **16 GB VRAM**
+>  - Minimum **5 GB of Disk** available
+>  - A CPU supporting [AVX or AVX2 instructions](https://en.wikipedia.org/wiki/Advanced_Vector_Extensions) is required
+>  - An Nvidia, AMD GPU or a Mac M1+ machine would significantly speed up chat response times
+
+1. Open your [Khoj offline settings](http://localhost:42110/server/admin/database/offlinechatprocessorconversationconfig/) and click *Enable* on the Offline Chat configuration.
+2. Open your [Chat model options settings](http://localhost:42110/server/admin/database/chatmodeloptions/) and add any [GGUF chat model](https://huggingface.co/models?library=gguf) to use for offline chat. Make sure to use `Offline` as its type. For a balanced chat model that runs well on standard consumer hardware we recommend using [Hermes-2-Pro-Mistral-7B by NousResearch](https://huggingface.co/NousResearch/Hermes-2-Pro-Mistral-7B-GGUF) by default.
+
+
+:::tip[Note]
+Offline chat is not supported for a multi-user scenario. The host machine will encounter segmentation faults if multiple users try to use offline chat at the same time.
+:::
+
+#### Online Chat
+Online chat requires internet to use ChatGPT but is faster, higher quality and less compute intensive.
+
+:::danger[Warning]
+This will enable Khoj to send your chat queries and query relevant notes to OpenAI for processing.
+:::
+
+1. Get your [OpenAI API Key](https://platform.openai.com/account/api-keys)
+2. Open your [Khoj Online Chat settings](http://localhost:42110/server/admin/database/openaiprocessorconversationconfig/). Add a new setting with your OpenAI API key, and click *Save*. Only one configuration will be used, so make sure that's the only one you have.
+3. Open your [Chat model options](http://localhost:42110/server/admin/database/chatmodeloptions/) and add a new option for the OpenAI chat model you want to use. Make sure to use `OpenAI` as its type.
+
+### Use
+1. Open Khoj Chat
+    - **On Web**: Open [/chat](https://app.khoj.dev/chat) in your web browser
+    - **On Obsidian**: Search for *Khoj: Chat* in the [Command Palette](https://help.obsidian.md/Plugins/Command+palette)
+    - **On Emacs**: Run `M-x khoj <user-query>`
+2. Enter your queries to chat with Khoj. Use [slash commands](#commands) and [query filters](/miscellaneous/advanced#query-filters) to change what Khoj uses to respond
+
+![](/img/khoj_chat_on_web.png ':size=400px')
+
+#### Details
+1. Your query is used to retrieve the most relevant notes, if any, using Khoj search
+2. These notes, the last few messages and associated metadata are passed to the enabled chat model along with your query to generate a response
+
+#### Commands
+Slash commands allow you to change what Khoj uses to respond to your query
+- **/notes**: Limit chat to only respond using your notes, not just Khoj's general world knowledge as reference
+- **/general**: Limit chat to only respond using Khoj's general world knowledge, not using your notes as reference
+- **/default**: Allow chat to respond using your notes or its general knowledge as reference. It's the default behavior when no slash command is used
+- **/online**: Use online information and incorporate it in the prompt to the LLM to send you a response.
+- **/image**: Generate an image in response to your query.
+- **/help**: Use /help to get all available commands and general information about Khoj
--- a/documentation/docs/features/image_generation.md
+++ b/documentation/docs/features/image_generation.md
@@ -0,0 +1,15 @@
+# Image Generation
+You can use Khoj to generate images from text prompts. You can get deeper into the details of our image generation flow in this blog post: https://blog.khoj.dev/posts/how-khoj-generates-images/.
+
+To generate images, you just need to provide a prompt to Khoj in which the image generation is in the instructions. Khoj will automatically detect the image generation intent, augment your generation prompt, and then create the image. Here are some examples:
+| Prompt | Image |
+| --- | --- |
+| Paint a picture of the plants I got last month, pixar-animation | ![plants](/img/plants_i_got.png) |
+| Create a picture of my dream house, based on my interests | ![house](/img/dream_house.png) |
+
+
+## Setup (Self-Hosting)
+
+Right now, we only support integration with OpenAI's DALL-E. You need to have an OpenAI API key to use this feature. Here's how you can set it up:
+1. Setup your OpenAI API key. See instructions [here](/get-started/setup#2-configure)
+2. Create a text to image config at http://localhost:42110/server/admin/database/texttoimagemodelconfig/. We recommend the value `dall-e-3`.
--- a/documentation/docs/features/online_search.md
+++ b/documentation/docs/features/online_search.md
@@ -0,0 +1,17 @@
+# Online Search
+
+By default, Khoj will try to infer which information-sourcing tools are required to answer your question. Sometimes, you'll have questions that need outside information that the LLM's knowledge doesn't cover. In that case, it will use the `online` search feature.
+
+For example, these queries would trigger an online search:
+- What's the latest news about the Israel-Palestine war?
+- Where can I find the best pizza in New York City?
+- Deadline for filing taxes 2024.
+- Give me a summary of this article: https://en.wikipedia.org/wiki/Haitian_Revolution
+
+Try it out yourself! https://app.khoj.dev
+
+## Self-Hosting
+
+The general online search function currently requires an API key from Serper.dev. You can grab one here: https://serper.dev/, and then add it as an environment variable with the name `SERPER_DEV_API_KEY`.
+
+Without any API keys, Khoj will use the `requests` library to directly read any webpages you give it a link to. This means that you can use Khoj to read any webpage that you have access to in your local network.
--- a/documentation/docs/features/search.md
+++ b/documentation/docs/features/search.md
@@ -0,0 +1,17 @@
+---
+sidebar_position: 3
+---
+
+# Search
+
+Take advantage of super fast search to find relevant notes and documents from your Second Brain.
+
+### Use
+1. Open Khoj Search
+  - **On Web**: Open https://app.khoj.dev/ in your web browser
+  - **On Obsidian**: Click the *Khoj search* icon 🔎 on the [Ribbon](https://help.obsidian.md/User+interface/Workspace/Ribbon) or Search for *Khoj: Search* in the [Command Palette](https://help.obsidian.md/Plugins/Command+palette)
+  - **On Emacs**: Run `M-x khoj <user-query>`
+2. Query using natural language to find relevant entries from your knowledge base. Use [query filters](/miscellaneous/advanced#query-filters) to limit entries to search
+
+### Demo
+![](/img/khoj_search_on_web.png ':size=400px')
--- a/documentation/docs/features/voice_chat.md
+++ b/documentation/docs/features/voice_chat.md
@@ -0,0 +1,14 @@
+# Voice
+
+You can talk to Khoj using your voice. Khoj will respond to your queries using the same models as the chat feature. You can use voice chat on the web, Desktop, and Obsidian apps. Click on the little mic icon to send your voice message to Khoj. It will send back what it heard via text. You'll have some time to edit it before sending it, if required. Try it at https://app.khoj.dev/.
+
+:::info[Voice Response]
+Khoj doesn't yet respond with voice, but it will send back a text response. Let us know if you're interested in voice responses at team at khoj.dev.
+:::
+
+## Setup (Self-Hosting)
+
+Voice chat will automatically be configured when you initialize the application. The default configuration will run locally. If you want to use the OpenAI whisper API for voice chat, you can set it up by following these steps:
+
+1. Setup your OpenAI API key. See instructions [here](/get-started/setup#2-configure).
+2. Create a new configuration at http://localhost:42110/server/admin/database/speechtotextmodeloptions/. We recommend the value `whisper-1` and model type `Openai`.
--- a/documentation/docs/get-started/_category_.json
+++ b/documentation/docs/get-started/_category_.json
@@ -0,0 +1,8 @@
+{
+  "label": "Get Started",
+  "position": 1,
+  "link": {
+    "type": "generated-index",
+    "description": "Learn how to get started with using Khoj"
+  }
+}
--- a/documentation/docs/get-started/demos.md
+++ b/documentation/docs/get-started/demos.md
@@ -0,0 +1,51 @@
+---
+sidebar_position: 2
+---
+
+# Demos
+
+Check out a couple of demos and screenshots of Khoj in action.
+
+### Screenshots
+
+| Web | Obsidian | Emacs |
+|:---:|:--------:|:-----:|
+| ![](/img/khoj_search_on_web.png ':size=300px') | ![](/img/khoj_search_on_obsidian.png ':size=300px') | ![](/img/khoj_search_on_emacs.png ':size=300px') |
+| ![](/img/khoj_chat_on_web.png ':size=300px') | ![](/img/khoj_chat_on_obsidian.png ':size=300px') | ![](/img/khoj_chat_on_emacs.png ':size=400px') |
+
+
+### Videos
+#### Khoj in Obsidian
+[Link to Video](https://github-production-user-asset-6210df.s3.amazonaws.com/6413477/240061700-3e33d8ea-25bb-46c8-a3bf-c92f78d0f56b.mp4)
+
+##### Installation
+
+1. Install Khoj via `pip` and start Khoj backend in a terminal (Run `khoj`)
+    ```bash
+    python -m pip install khoj-assistant
+    khoj
+    ```
+2. Install Khoj plugin via Community Plugins settings pane on Obsidian app
+    - Check the new Khoj plugin settings
+    - Let Khoj backend index the markdown, pdf, Github markdown files in the current Vault
+    - Open Khoj plugin on Obsidian via Search button on Left Pane
+    - Search \"*Announce plugin to folks*\" in the [Obsidian Plugin docs](https://marcus.se.net/obsidian-plugin-docs/)
+    - Jump to the [search result](https://marcus.se.net/obsidian-plugin-docs/publishing/submit-your-plugin)
+
+#### Khoj in Emacs, Browser
+[Link to Video](https://user-images.githubusercontent.com/6413477/184735169-92c78bf1-d827-4663-9087-a1ea194b8f4b.mp4)
+
+##### Installation
+
+- Install Khoj via pip
+- Start Khoj app
+- Add this readme and [khoj.el readme](https://github.com/khoj-ai/khoj/tree/master/src/interface/emacs) as org-mode for Khoj to index
+- Search \"*Setup editor*\" on the Web and Emacs. Re-rank the results for better accuracy
+- Top result is what we are looking for, the [section to Install Khoj.el on Emacs](https://github.com/khoj-ai/khoj/tree/master/src/interface/emacs#2-Install-Khojel)
+
+##### Analysis
+
+- The results do not have any words used in the query
+  - *Based on the top result it seems the re-ranking model understands that Emacs is an editor?*
+- The results incrementally update as the query is entered
+- The results are re-ranked, for better accuracy, once user hits enter
--- a/documentation/docs/get-started/overview.md
+++ b/documentation/docs/get-started/overview.md
@@ -0,0 +1,50 @@
+---
+sidebar_position: 0
+slug: /
+---
+
+# Overview
+
+<p align="center"><img src="/img/khoj-logo-sideways-500.png" width="200" alt="Khoj Logo"></img></p>
+
+<div align="center">
+  <b>An AI copilot for your Second Brain</b>
+</div>
+
+<br />
+<div align="center">
+
+  [📜 Explore Code](https://github.com/khoj-ai/khoj)
+  <span>&nbsp;&nbsp;•&nbsp;&nbsp;</span>
+  [🌍 Try Khoj Cloud](https://khoj.dev)
+  <span>&nbsp;&nbsp;•&nbsp;&nbsp;</span>
+  [💬 Get Involved](https://discord.gg/BDgyabRM6e)
+
+</div>
+
+## Introduction
+Welcome to the Khoj Docs! This is the best place to get set up and explore Khoj's features.
+
+- Khoj is an open source, personal AI
+- You can [chat](/features/chat) with it about anything. It'll use files you shared with it to respond, when relevant
+- Quickly [find](/features/search) relevant notes and documents using natural language
+- It understands pdf, plaintext, markdown, org-mode files, [notion pages](/online-data-sources/notion_integration) and [github repositories](/online-data-sources/github_integration)
+- Access it from your [Emacs](/clients/emacs), [Obsidian](/clients/obsidian), [Web browser](/clients/web) or the [Khoj Desktop app](/clients/desktop)
+- Use [cloud](https://app.khoj.dev/login) to access your Khoj anytime from anywhere, [self-host](/get-started/setup) on consumer hardware for privacy
+
+## Quickstart
+- [Try Khoj Cloud](https://app.khoj.dev) to get started quickly
+- [Read these instructions](/get-started/setup) to self-host a private instance of Khoj
+
+## At a Glance
+![demo_chat](/img/using_khoj_for_studying.gif)
+
+#### [Search](/features/search)
+  - **Natural**: Use natural language queries to quickly find relevant notes and documents.
+  - **Incremental**: Incremental search for a fast, search-as-you-type experience
+
+#### [Chat](/features/chat)
+  - **Faster answers**: Find answers faster, smoother than search. No need to manually scan through your notes to find answers.
+  - **Iterative discovery**: Iteratively explore and (re-)discover your notes
+  - **Assisted creativity**: Smoothly weave across answers retrieval and content generation
+  - **Online or Offline**: Choose online or offline chat depending on your requirements
--- a/documentation/docs/get-started/privacy_security.md
+++ b/documentation/docs/get-started/privacy_security.md
@@ -0,0 +1,31 @@
+---
+sidebar_position: 4
+slug: /privacy
+---
+
+# Privacy
+
+If you're using Khoj to index your personal data, it's almost certain you'll have sensitive and private information you'd like to index.
+
+Khoj is designed to be a personal AI, so one of our cornerstone principles is to make it as privacy-friendly as possible. That's why you can *always* choose to run Khoj on your own hardware, and never share your data outside of your device. You can generate your embeddings directly on your machine, and then use an offline chat client so that your data never leaves your machine. You'll find the instructions for [self-hosting](./setup.mdx) here.
+
+Here's what to consider if you're using Khoj, whether self-hosted or on our cloud:
+1. Some of your relevant indexed data may be included as context when you chat with Khoj. This means that it may be sent to OpenAI, if you use one of the OpenAI models.
+1. We collect completely anonymized usage telemetry and send it to [PostHog](https://posthog.com/). This includes data like unique chat requests, unique search requests, unique requests to index data. Usage data is collected to help us understand how people are using Khoj, and to help us prioritize features.
+    - We do not log your IP address, nor upload any of your personal data to PostHog.
+    - You can see our telemetry aggregation code [here](https://github.com/khoj-ai/khoj/blob/master/src/khoj/routers/helpers.py#L71) and see our telemetry server [here](https://github.com/khoj-ai/khoj/blob/master/src/telemetry/telemetry.py).
+    - If you're self-hosting, you can opt out of telemetry by following [these instructions](./miscellaneous/telemetry).
+
+
+Self-hosting isn't for everyone, so we've still taken steps to make Khoj privacy-friendly, even if you choose to use our [cloud offering](https://app.khoj.dev/login). Here's what to consider when using Khoj Cloud:
+1. Your embeddings are generated by an open source model within our own dedicated endpoint [hosted on AWS with Huggingface](https://huggingface.co/inference-endpoints/dedicated). There's zero persistent memory to the Huggingface Inference endpoints (it's stateless).
+1. Your embeddings and the associated raw text are stored in a secure Postgres DB in our private AWS cloud. Your data is sharded on a unique user ID. We store the raw text in your files to improve file syncing and provide context when you chat with Khoj.
+1. When you use the single-sign-on option with Google, we only receive your name, a link to your profile photo, and your email address.
+
+
+:::tip[Info]
+Your data is yours. We do not sell your data or use it for training models. Khoj is a sustainable, open-source alternative to closed-source, commercial personal AI. We have no interest in selling your data to make a quick buck.
+:::
+
+
+We have lots of ideas of how to make Khoj really robust as a personal AI and cloud offering, but also trust-less and privacy-centric. Please [reach out](mailto:team@khoj.dev) if this is important to you, and you'd like to help us build it.
--- a/documentation/docs/get-started/setup.mdx
+++ b/documentation/docs/get-started/setup.mdx
@@ -0,0 +1,329 @@
+---
+sidebar_position: 1
+---
+
+# Self-Host
+Learn about how to self-host Khoj on your own machine.
+
+Benefits to self-hosting:
+1. **Privacy**: Your data will never have to leave your private network. You can even use Khoj without an internet connection if deployed on your personal computer.
+2. **Customization**: You can customize Khoj to your liking, from models, to host URL, to feature enablement.
+
+```mdx-code-block
+import Tabs from '@theme/Tabs';
+import TabItem from '@theme/TabItem';
+```
+
+## Setup
+These are the general setup instructions for self-hosted Khoj.
+
+- Make sure [python](https://realpython.com/installing-python/) and [pip](https://pip.pypa.io/en/stable/installation/) are installed on your machine
+- Check the [Khoj Emacs docs](/clients/emacs#setup) to set up Khoj with Emacs<br />
+  It's simpler as it can skip the server *install*, *run* and *configure* steps below.
+- Check the [Khoj Obsidian docs](/clients/obsidian#setup) to set up Khoj with Obsidian<br />
+  It's simpler as it can skip the *configure* step below.
+
+For Installation, you can either use Docker or install the Khoj server locally.
+
+:::info[Offline Model + GPU]
+If you want to use the offline chat model and you have a GPU, you should use Installation Option 2  - local setup via the Python package directly. Our Docker image doesn't currently support running the offline chat model on GPU, making inference times really slow.
+:::
+
+### Installation Option 1 (Docker)
+
+#### Prerequisites
+1. Install Docker Engine. See [official instructions](https://docs.docker.com/engine/install/).
+2. Ensure you have Docker Compose. See [official instructions](https://docs.docker.com/compose/install/).
+
+#### Setup
+
+Use the sample docker-compose [in Github](https://github.com/khoj-ai/khoj/blob/master/docker-compose.yml) to run Khoj in Docker. Start by configuring all the environment variables to your choosing. Your admin account will automatically be created based on the admin credentials in that file, so pay attention to those. To start the container, run the following command in the same directory as the docker-compose.yml file. This will automatically setup the database and run the Khoj server.
+
+```shell
+docker-compose up
+```
+
+Khoj should now be running at http://localhost:42110. You can see the web UI in your browser.
+
+### Installation Option 2 (Local)
+
+#### Prerequisites
+
+##### Install Postgres (with PgVector)
+
+Khoj uses the `pgvector` package to store embeddings of your index in a Postgres database. In order to use this, you need to have Postgres installed.
+
+```mdx-code-block
+  <Tabs groupId="operating-systems">
+    <TabItem value="macos" label="MacOS">
+Install [Postgres.app](https://postgresapp.com/). This comes pre-installed with `pgvector` and relevant dependencies.
+    </TabItem>
+    <TabItem value="win" label="Windows">
+    1. Use the [recommended installer](https://www.postgresql.org/download/windows/).
+    2. Follow instructions to [Install PgVector](https://github.com/pgvector/pgvector#windows) in case you need to manually install it. Windows support is experimental for pgvector currently, so we recommend using Docker.
+    </TabItem>
+    <TabItem value="unix" label="Linux">
+    From [official instructions](https://wiki.postgresql.org/wiki/Apt)
+    </TabItem>
+    <TabItem value="source" label="From Source">
+    1. Follow instructions to [Install Postgres](https://www.postgresql.org/download/)
+    2. Follow instructions to [Install PgVector](https://github.com/pgvector/pgvector#installation) in case you need to manually install it.
+    </TabItem>
+  </Tabs>
+```
+
+##### Create the Khoj database
+
+Make sure to update your environment variables to match your Postgres configuration if you're using a different name. The default values should work for most people. When prompted for a password, you can use the default password `postgres`, or configure it to your preference. Make sure to set the environment variable `POSTGRES_PASSWORD` to the same value as the password you set here.
+
+```mdx-code-block
+  <Tabs groupId="operating-systems">
+    <TabItem value="macos" label="MacOS">
+    ```shell
+createdb khoj -U postgres --password
+    ```
+    </TabItem>
+    <TabItem value="win" label="Windows">
+    ```shell
+createdb -U postgres khoj --password
+      ```
+    </TabItem>
+    <TabItem value="unix" label="Linux">
+      ```shell
+sudo -u postgres createdb khoj --password
+      ```
+    </TabItem>
+  </Tabs>
+```
+
+
+#### Install package
+
+##### Local Server Setup
+- *Make sure [python](https://realpython.com/installing-python/) and [pip](https://pip.pypa.io/en/stable/installation/) are installed on your machine*
+- Check [llama-cpp-python setup](https://python.langchain.com/docs/integrations/llms/llamacpp#installation) if you hit any llama-cpp issues with the installation
+
+Run the following command in your terminal to install the Khoj backend.
+
+```mdx-code-block
+  <Tabs groupId="operating-systems">
+    <TabItem value="macos" label="MacOS">
+    ```shell
+# ARM/M1+ Machines
+CMAKE_ARGS="-DLLAMA_METAL=on" python -m pip install khoj-assistant
+
+# Intel Machines
+python -m pip install khoj-assistant
+    ```
+    </TabItem>
+    <TabItem value="win" label="Windows">
+      ```shell
+ # 1. (Optional) To use NVIDIA (CUDA) GPU
+ $env:CMAKE_ARGS = "-DLLAMA_CUDA=on"
+ # 1. (Optional) To use AMD (ROCm) GPU
+ $env:CMAKE_ARGS = "-DLLAMA_HIPBLAS=on"
+ # 1. (Optional) To use Vulkan GPU
+ $env:CMAKE_ARGS = "-DLLAMA_VULKAN=on"
+
+ # 2. Install Khoj
+ py -m pip install khoj-assistant
+      ```
+    </TabItem>
+    <TabItem value="unix" label="Linux">
+      ```shell
+ # CPU
+ python -m pip install khoj-assistant
+ # NVIDIA (CUDA) GPU
+ CMAKE_ARGS="-DLLAMA_CUDA=on" FORCE_CMAKE=1 python -m pip install khoj-assistant
+ # AMD (ROCm) GPU
+ CMAKE_ARGS="-DLLAMA_HIPBLAS=on" FORCE_CMAKE=1 python -m pip install khoj-assistant
+ # Vulkan GPU
+ CMAKE_ARGS="-DLLAMA_VULKAN=on" FORCE_CMAKE=1 python -m pip install khoj-assistant
+      ```
+    </TabItem>
+  </Tabs>
+```
+
+##### Local Server Start
+
+Before getting started, configure the following environment variables in your terminal for the first run
+
+```mdx-code-block
+  <Tabs groupId="operating-systems">
+    <TabItem value="macos" label="MacOS">
+      ```shell
+      export KHOJ_ADMIN_EMAIL=<your-email>
+      export KHOJ_ADMIN_PASSWORD=<your-password>
+      ```
+    </TabItem>
+    <TabItem value="win" label="Windows">
+      If you're using PowerShell:
+      ```shell
+      $env:KHOJ_ADMIN_EMAIL="<your-email>"
+      $env:KHOJ_ADMIN_PASSWORD="<your-password>"
+      ```
+    </TabItem>
+    <TabItem value="unix" label="Linux">
+      ```shell
+      export KHOJ_ADMIN_EMAIL=<your-email>
+      export KHOJ_ADMIN_PASSWORD=<your-password>
+      ```
+    </TabItem>
+  </Tabs>
+```
+
+
+Run the following command from your terminal to start the Khoj backend and open Khoj in your browser.
+
+```shell
+khoj --anonymous-mode
+```
+`--anonymous-mode` allows you to run the server without setting up Google credentials for login. This allows you to use any of the clients without a login wall. If you want to use Google login, you can skip this flag, but you will have to add your Google developer credentials.
+
+On the first run, you will be prompted to input credentials for your admin account and do some basic configuration for your chat model settings. Once created, you can go to http://localhost:42110/server/admin and login with the credentials you just created.
+
+Khoj should now be running at http://localhost:42110. You can see the web UI in your browser.
+
+Note: To start Khoj automatically in the background use [Task scheduler](https://www.windowscentral.com/how-create-automated-task-using-task-scheduler-windows-10) on Windows or [Cron](https://en.wikipedia.org/wiki/Cron) on Mac, Linux (e.g with `@reboot khoj`)
+
+
+### Setup Notes
+
+You can use Khoj with a custom domain as well. To do so, you need to set the `KHOJ_DOMAIN` environment variable to your domain (e.g., `export KHOJ_DOMAIN=my-khoj-domain.com` or add it to your `docker-compose.yml`). By default, the Khoj server you set up will not be accessible outside of `localhost` or `127.0.0.1`.
+
+:::warning[Without HTTPS certificate]
+To expose Khoj on a custom domain over the public internet, use of an SSL certificate is strongly recommended. You can use [Let's Encrypt](https://letsencrypt.org/) to get a free SSL certificate for your domain.
+
+To disable HTTPS, set the `KHOJ_NO_HTTPS` environment variable to `True`. This can be useful if Khoj is only accessible behind a secure, private network.
+:::
+
+### 2. Configure
+1. Go to http://localhost:42110/server/admin and login with your admin credentials.
+    1. Go to [OpenAI settings](http://localhost:42110/server/admin/database/openaiprocessorconversationconfig/) in the server admin settings to add an OpenAI processor conversation config. This is where you set your API key. Alternatively, you can go to the [offline chat settings](http://localhost:42110/server/admin/database/offlinechatprocessorconversationconfig/) and simply create a new setting with `Enabled` set to `True`.
+    2. Go to the ChatModelOptions if you want to add additional models for chat.
+       - Set the `chat-model` field to a supported chat model[^1] of your choice. For example, you can specify `gpt-4-turbo-preview` if you're using OpenAI or `NousResearch/Hermes-2-Pro-Mistral-7B-GGUF` if you're using offline chat.
+       - Make sure to set the `model-type` field to `OpenAI` or `Offline` respectively.
+       - The `tokenizer` and `max-prompt-size` fields are optional. Set them only when using a non-standard model (i.e not mistral, gpt or llama2 model).
+1. Select files and folders to index [using the desktop client](/get-started/setup#3-download-the-desktop-client-optional). When you click 'Save', the files will be sent to your server for indexing.
+    - Select Notion workspaces and Github repositories to index using the web interface.
+
+[^1]: Khoj, by default, can use [OpenAI GPT3.5+ chat models](https://platform.openai.com/docs/models/overview) or [GGUF chat models](https://huggingface.co/models?library=gguf). See [this section](/miscellaneous/advanced#use-openai-compatible-llm-api-server-self-hosting) to use non-standard chat models
+
+:::tip[Note]
+Using Safari on Mac? You might not be able to login to the admin panel. Try using Chrome or Firefox instead.
+:::
+
+### 3. Download the desktop client (Optional)
+
+You can use our desktop executables to select file paths and folders to index. You can simply select the folders or files, and they'll be automatically uploaded to the server. Once you specify a file or file path, you don't need to update the configuration again; it will grab any data diffs dynamically over time.
+
+**To download the latest desktop client, go to https://download.khoj.dev** and the correct executable for your OS will automatically start downloading. You can also go to https://khoj.dev/downloads to explicitly download your image of choice. Once downloaded, you can configure your folders for indexing using the settings tab. To set your chat configuration, you'll have to use the web interface for the Khoj server you setup in the previous step.
+
+To use the desktop client, you need to go to your Khoj server's settings page (http://localhost:42110/config) and copy the API key. Then, paste it into the desktop client's settings page. Once you've done that, you can select files and folders to index. Set the desktop client settings to use `http://127.0.0.1:42110` as the host URL.
+
+
+### 4. Install Client Plugins (Optional)
+Khoj exposes a web interface to search, chat and configure by default.<br />
+The optional steps below allow using Khoj from within an existing application like Obsidian or Emacs.
+
+- **Khoj Obsidian**:<br />
+[Install](/clients/obsidian#setup) the Khoj Obsidian plugin
+
+- **Khoj Emacs**:<br />
+[Install](/clients/emacs#setup) khoj.el
+
+#### Setup host URL
+To configure your host URL on your clients when self-hosting, use `http://127.0.0.1:42110`. This is the default port for the Khoj server. Note that `localhost` will not work.
+
+### 5. Use Khoj 🚀
+
+You can head to http://localhost:42110 to use the web interface. You can also use the desktop client to search and chat.
+
+## Upgrade
+### Upgrade Khoj Server
+
+```mdx-code-block
+  <Tabs groupId="environment">
+    <TabItem value="localsetup" label="Local Setup">
+      ```shell
+      pip install --upgrade khoj-assistant
+      ```
+      *Note: To upgrade to the latest pre-release version of the khoj server, run `pip install --upgrade --pre khoj-assistant` instead*
+    </TabItem>
+    <TabItem value="docker" label="Docker">
+      From the same directory where you have your `docker-compose` file, this will fetch the latest build and upgrade your server.
+      ```shell
+      docker-compose up --build
+      ```
+    </TabItem>
+    <TabItem value="emacs" label="Emacs">
+    - Use your Emacs Package Manager to Upgrade
+    - See [khoj.el package setup](/clients/emacs#setup) for details
+    </TabItem>
+    <TabItem value="obsidian" label="Obsidian">
+      - Upgrade via the Community plugins tab on the settings pane in the Obsidian app
+      - See the [khoj plugin setup](/clients/obsidian#setup) for details
+    </TabItem>
+  </Tabs>
+```
+
+## Uninstall
+### Uninstall Khoj Server
+
+```mdx-code-block
+  <Tabs groupId="environment">
+    <TabItem value="localsetup" label="Local Setup">
+    ```shell
+    # uninstall khoj server
+    pip uninstall khoj-assistant
+
+    # delete khoj postgres db
+    dropdb khoj -U postgres
+    ```
+    </TabItem>
+    <TabItem value="docker" label="Docker">
+    From the same directory where you have your `docker-compose` file, run the command below to remove the server and delete its containers, networks and volumes.
+
+    ```shell
+    docker-compose down --volumes
+    ```
+    </TabItem>
+    <TabItem value="emacs" label="Emacs">
+    Uninstall the Khoj Emacs package or the desktop client in the standard way from Emacs or your OS respectively.
+    You can also `rm -rf ~/.khoj` to remove the Khoj data directory if you did a local install.
+    </TabItem>
+    <TabItem value="obsidian" label="Obsidian">
+    Uninstall the Khoj Obsidian plugin or the desktop client in the standard way from Obsidian or your OS respectively.
+    You can also `rm -rf ~/.khoj` to remove the Khoj data directory if you did a local install.
+    </TabItem>
+  </Tabs>
+```
+
+## Troubleshoot
+
+#### Dependency conflict when trying to install Khoj python package with pip
+- **Reason**: When conflicting dependency versions are required by Khoj vs other python packages installed on your system
+- **Fix**: Install Khoj in a python virtual environment using [venv](https://docs.python.org/3/library/venv.html) or [pipx](https://pypa.github.io/pipx) to avoid these dependency conflicts
+- **Process**:
+  1. Install [pipx](https://pypa.github.io/pipx/#install-pipx)
+  2. Use `pipx` to install Khoj to avoid dependency conflicts with other python packages.
+     ```shell
+     pipx install khoj-assistant
+     ```
+  3. Now start `khoj` using the standard steps described earlier
+
+
+#### Install fails while building Tokenizer dependency
+- **Details**: `pip install khoj-assistant` fails while building the `tokenizers` dependency. Complains about Rust.
+- **Fix**: Install Rust to build the tokenizers package. For example on Mac run:
+    ```shell
+    brew install rustup
+    rustup-init
+    source ~/.cargo/env
+    ```
+- **Refer**: [Issue with Fix](https://github.com/khoj-ai/khoj/issues/82#issuecomment-1241890946) for more details
+
+
+#### Khoj in Docker errors out with \"Killed\" in error message
+- **Fix**: Increase RAM available to Docker Containers in Docker Settings
+- **Refer**: [StackOverflow Solution](https://stackoverflow.com/a/50770267), [Configure Resources on Docker for Mac](https://docs.docker.com/desktop/mac/#resources)
--- a/documentation/docs/miscellaneous/_category_.json
+++ b/documentation/docs/miscellaneous/_category_.json
@@ -0,0 +1,8 @@
+{
+  "label": "Miscellaneous",
+  "position": 6,
+  "link": {
+    "type": "generated-index",
+    "description": "Additional resources for learning about Khoj"
+  }
+}
--- a/documentation/docs/miscellaneous/advanced.md
+++ b/documentation/docs/miscellaneous/advanced.md
@@ -0,0 +1,56 @@
+---
+sidebar_position: 3
+---
+
+# Advanced Usage
+
+## Search across Different Languages (Self-Hosting)
+To search for notes in multiple, different languages, you can use a [multi-lingual model](https://www.sbert.net/docs/pretrained_models.html#multi-lingual-models).<br />
+For example, the [paraphrase-multilingual-MiniLM-L12-v2](https://huggingface.co/sentence-transformers/paraphrase-multilingual-MiniLM-L12-v2) supports [50+ languages](https://www.sbert.net/docs/pretrained_models.html#:~:text=we%20used%20the%20following%2050%2B%20languages), has good search quality and speed. To use it:
+1. Manually update the search config in server's admin settings page. Go to [the search config](http://localhost:42110/server/admin/database/searchmodelconfig/). Either create a new one, if none exists, or update the existing one. Set the bi_encoder to `sentence-transformers/paraphrase-multilingual-MiniLM-L12-v2` and the cross_encoder to `mixedbread-ai/mxbai-rerank-xsmall-v1`.
+2. Regenerate your content index from all the relevant clients. This step is very important, as you'll need to re-encode all your content with the new model.
+
+Note: If you use a search model that expects a prefix (e.g [mixedbread-ai/mxbai-embed-large-v1](https://huggingface.co/mixedbread-ai/mxbai-embed-large-v1)) to be added to the query (or docs) string before encoding, update the `bi_encoder_query_encode_config` field with `{"prompt": "<prefix-prompt>"}`. E.g. `{"prompt": "Represent this query for searching documents"}`. You can pass any valid JSON object that the SentenceTransformer `encode` function accepts.
+
+## Query Filters
+
+Use structured query syntax to filter entries from your knowledge base used by search results or chat responses.
+
+- **Word Filter**: Get entries that include/exclude a specified term
+  - Entries that contain term_to_include: `+"term_to_include"`
+  - Entries that contain term_to_exclude: `-"term_to_exclude"`
+- **Date Filter**: Get entries containing dates in YYYY-MM-DD format from specified date (range)
+  - Entries from April 1st 1984: `dt:"1984-04-01"`
+  - Entries after March 31st 1984: `dt>="1984-04-01"`
+  - Entries before April 2nd 1984: `dt<="1984-04-01"`
+- **File Filter**: Get entries from a specified file
+  - Entries from incoming.org file: `file:"incoming.org"`
+- Combined Example
+  - `what is the meaning of life? file:"1984.org" dt>="1984-01-01" dt<="1985-01-01" -"big" -"brother"`
+  - Adds all filters to the natural language query. It should return entries
+    - from the file *1984.org*
+    - containing dates from the year *1984*
+    - excluding words *"big"* and *"brother"*
+    - that best match the natural language query *"what is the meaning of life?"*
+
+## Use OpenAI compatible LLM API Server (Self Hosting)
+Use this if you want to use non-standard, open or commercial, local or hosted LLM models for Khoj chat
+1. Setup your desired chat LLM by installing an OpenAI compatible LLM API Server like [LiteLLM](https://docs.litellm.ai/docs/proxy/quick_start), [llama-cpp-python](https://github.com/abetlen/llama-cpp-python?tab=readme-ov-file#openai-compatible-web-server)
+2. Set environment variable `OPENAI_API_BASE="<url-of-your-llm-server>"` before starting Khoj
+3. Add ChatModelOptions with `model-type` `OpenAI`, and `chat-model` to anything (e.g `gpt-3.5-turbo`) during [Config](/get-started/setup#2-configure)
+   - *(Optional)* Set the `tokenizer` and `max-prompt-size` relevant to the actual chat model you're using
+
+#### Sample Setup using LiteLLM and Mistral API
+
+```shell
+# Install LiteLLM
+pip install litellm[proxy]
+
+# Start LiteLLM and use Mistral tiny via Mistral API
+export MISTRAL_API_KEY=<MISTRAL_API_KEY>
+litellm --model mistral/mistral-tiny --drop_params
+
+# Set OpenAI API Base to LiteLLM server URL and start Khoj
+export OPENAI_API_BASE='http://localhost:8000'
+khoj --anonymous-mode
+```
--- a/documentation/docs/miscellaneous/credits.md
+++ b/documentation/docs/miscellaneous/credits.md
@@ -0,0 +1,13 @@
+---
+sidebar_position: 4
+---
+
+# Credits
+Many Open Source projects are used to power Khoj. Here are a few of them:
+
+- [Multi-QA MiniLM Model](https://huggingface.co/sentence-transformers/multi-qa-MiniLM-L6-cos-v1), [All MiniLM Model](https://huggingface.co/sentence-transformers/all-MiniLM-L6-v2) for Text Search. See [SBert Documentation](https://www.sbert.net/examples/applications/retrieve_rerank/README.html)
+- [OpenAI CLIP Model](https://github.com/openai/CLIP) for Image Search. See [SBert Documentation](https://www.sbert.net/examples/applications/image-search/README.html)
+- Charles Cave for [OrgNode Parser](http://members.optusnet.com.au/~charles57/GTD/orgnode.html)
+- [Org.js](https://mooz.github.io/org-js/) to render Org-mode results on the Web interface
+- [Markdown-it](https://github.com/markdown-it/markdown-it) to render Markdown results on the Web interface
+- [Llama.cpp](https://github.com/ggerganov/llama.cpp) to chat with local LLM
--- a/documentation/docs/miscellaneous/performance.md
+++ b/documentation/docs/miscellaneous/performance.md
@@ -0,0 +1,25 @@
+---
+sidebar_position: 2
+---
+
+# Performance
+
+Here are some top-level performance metrics for Khoj. These are rough estimates and will vary based on your hardware and data.
+
+### Search performance
+
+- Semantic search using the bi-encoder is fairly fast at \<100 ms across all content types
+- Reranking using the cross-encoder is slower at \<2s on 15 results. Tweak `top_k` to tradeoff speed for accuracy of results
+- Filters in query (e.g by file, word or date) usually add \<20ms to query latency
+
+### Indexing performance
+
+- Indexing is more strongly impacted by the size of the source data
+- Indexing 100K+ line corpus of notes takes about 10 minutes
+- Indexing 4000+ images takes about 15 minutes and more than 8GB of RAM
+- Note: *It should only take this long on the first run* as the index is incrementally updated
+
+### Miscellaneous
+
+- Testing done on a Mac M1 and a \>100K line corpus of notes
+- Search, indexing on a GPU has not been tested yet
--- a/documentation/docs/miscellaneous/telemetry.md
+++ b/documentation/docs/miscellaneous/telemetry.md
@@ -0,0 +1,22 @@
+---
+sidebar_position: 1
+---
+
+# Telemetry
+
+We collect some high level, anonymized metadata about usage of self-hosted Khoj. This includes:
+- Client (Web, Emacs, Obsidian)
+- API usage (Search, Chat)
+- Configured content types (Github, Org, etc)
+- Request metadata (e.g., host, referrer)
+
+We don't send any personal information or any information from/about your content. We only send the above metadata. This helps us prioritize feature development and understand how people are using Khoj. Don't just take our word for it -- you can see [the code here](https://github.com/khoj-ai/khoj/tree/master/src/telemetry).
+
+## Disable Telemetry
+
+If you're self-hosting Khoj, you can opt out of telemetry at any time. To do so,
+1. Open `~/.khoj/khoj.yml`
+2. Set `should-log-telemetry` to `false`
+3. Save the file and restart Khoj
+
+If you have any questions or concerns, please reach out to us on [Discord](https://discord.gg/BDgyabRM6e).
--- a/documentation/docs/online-data-sources/_category_.json
+++ b/documentation/docs/online-data-sources/_category_.json
@@ -0,0 +1,8 @@
+{
+  "label": "Data Sources",
+  "position": 5,
+  "link": {
+    "type": "generated-index",
+    "description": "Online data sources for indexing via Khoj"
+  }
+}
--- a/documentation/docs/online-data-sources/github_integration.md
+++ b/documentation/docs/online-data-sources/github_integration.md
@@ -0,0 +1,14 @@
+# Github integration
+
+The Github integration allows you to index as many repositories as you want. It's currently default configured to index Issues, Commits, and all Markdown/Org files in each repository. For large repositories, this takes a fairly long time, but it works well for smaller projects.
+
+## Configure your settings
+
+1. Go to [https://app.khoj.dev/config](https://app.khoj.dev/config) and enter in settings for the data sources you want to index. You'll have to specify the file paths.
+
+## Use the Github plugin
+
+1. Generate a [classic PAT (personal access token)](https://docs.github.com/en/authentication/keeping-your-account-and-data-secure/managing-your-personal-access-tokens) from [Github](https://github.com/settings/tokens) with `repo` and `admin:org` scopes at least.
+2. Navigate to [https://app.khoj.dev/config/content-source/github](https://app.khoj.dev/config/content-source/github) to configure your Github settings. Enter in your PAT, along with details for each repository you want to index.
+3. Click `Save`. Go back to the settings page and click `Configure`.
+4. Go to [https://app.khoj.dev/](https://app.khoj.dev/) and start searching!
--- a/documentation/docs/online-data-sources/notion_integration.md
+++ b/documentation/docs/online-data-sources/notion_integration.md
@@ -0,0 +1,19 @@
+# Notion Integration
+
+The Notion integration allows you to search/chat with your Notion workspaces. [Notion](https://notion.so/) is a platform people use for taking notes, especially for collaboration.
+
+Go to https://app.khoj.dev/config to connect your Notion workspace(s) to Khoj.
+
+![notion_integration](/img/notion_integration.gif)
+
+
+## Self-Hosted Setup
+
+1. Go to https://www.notion.so/my-integrations and create a new integration called Khoj to get an API key.
+![setup_new_integration](https://github.com/khoj-ai/khoj/assets/65192171/b056e057-d4dc-47dc-aad3-57b59a22c68b)
+2. Share all the workspaces that you want to integrate with the Khoj integration you just made in the previous step
+![enable_workspace](https://github.com/khoj-ai/khoj/assets/65192171/98290303-b5b8-4cb0-b32c-f68c6923a3d0)
+3. In the first step, you generated an API key. Use the newly generated API Key in your Khoj settings, by default at http://localhost:42110/config/content-source/notion. Click `Save`.
+4. Click `Configure` in http://localhost:42110/config to index your Notion workspace(s).
+
+That's it! You should be ready to start searching and chatting. Make sure you've configured your [chat settings](/get-started/setup#2-configure).
--- a/documentation/docusaurus.config.js
+++ b/documentation/docusaurus.config.js
@@ -0,0 +1,210 @@
+// @ts-check
+// `@type` JSDoc annotations allow editor autocompletion and type checking
+// (when paired with `@ts-check`).
+// There are various equivalent ways to declare your Docusaurus config.
+// See: https://docusaurus.io/docs/api/docusaurus-config
+
+import {themes as prismThemes} from 'prism-react-renderer';
+
+/** @type {import('@docusaurus/types').Config} */
+const config = {
+  title: 'Khoj AI',
+  tagline: 'An AI copilot for your Second Brain',
+
+  staticDirectories: ['assets'],
+
+  favicon: 'img/favicon-128x128.ico',
+
+  // Set the production url of your site here
+  url: 'https://docs.khoj.dev',
+  // Set the /<baseUrl>/ pathname under which your site is served
+  // For GitHub pages deployment, it is often '/<projectName>/'
+  baseUrl: '/',
+
+  // GitHub pages deployment config.
+  // If you aren't using GitHub pages, you don't need these.
+  organizationName: 'khoj-ai', // Usually your GitHub org/user name.
+  projectName: 'khoj', // Usually your repo name.
+
+  onBrokenLinks: 'throw',
+  onBrokenMarkdownLinks: 'warn',
+
+  // Even if you don't use internationalization, you can use this field to set
+  // useful metadata like html lang. For example, if your site is Chinese, you
+  // may want to replace "en" with "zh-Hans".
+  i18n: {
+    defaultLocale: 'en',
+    locales: ['en'],
+  },
+
+  presets: [
+    [
+      'classic',
+      /** @type {import('@docusaurus/preset-classic').Options} */
+      ({
+        docs: {
+          sidebarPath: './sidebars.js',
+          routeBasePath: '/',
+          // Please change this to your repo.
+          // Remove this to remove the "edit this page" links.
+          editUrl:
+            'https://github.com/khoj-ai/khoj/tree/master/documentation/',
+        },
+        blog: {
+          showReadingTime: true,
+          // Please change this to your repo.
+          // Remove this to remove the "edit this page" links.
+          editUrl:
+            'https://github.com/khoj-ai/khoj/tree/master/documentation/blog/',
+        },
+        theme: {
+          customCss: './src/css/custom.css',
+        },
+        sitemap: {
+          lastmod: 'date',
+          changefreq: 'weekly',
+          priority: 0.5,
+          filename: 'sitemap.xml',
+        },
+      }),
+    ],
+  ],
+
+  themeConfig:
+    /** @type {import('@docusaurus/preset-classic').ThemeConfig} */
+    ({
+      image: 'img/khoj-logo-sideways-500.png',
+      metadata: [
+        {name: 'keywords', content: 'khoj, khoj ai, chatgpt, open ai, open source, productivity'},
+        {name: 'og:title', content: 'Khoj Documentation'},
+        {name: 'og:type', content: 'website'},
+        {name: 'og:site_name', content: 'Khoj Documentation'},
+        {name: 'og:description', content: 'Quickly get started with using or self-hosting Khoj'},
+        {name: 'og:image', content: 'https://khoj-web-bucket.s3.amazonaws.com/link_preview_docs.png'},
+        {name: 'og:url', content: 'https://docs.khoj.dev'},
+        {name: 'keywords', content: 'khoj, khoj ai, chatgpt, open ai, open source, productivity'}
+      ],
+      navbar: {
+        title: 'Khoj',
+        logo: {
+          alt: 'Khoj AI',
+          src: 'img/favicon-128x128.ico',
+        },
+        items: [
+          {
+            href: 'https://github.com/khoj-ai/khoj',
+            label: 'GitHub',
+            position: 'right',
+          },
+          {
+            href: 'https://app.khoj.dev/login',
+            label: 'Cloud',
+            position: 'right',
+          },
+          {
+            href: 'https://discord.gg/BDgyabRM6e',
+            label: 'Discord',
+            position: 'right',
+          },
+          {
+            href: 'https://blog.khoj.dev',
+            label: 'Blog',
+            position: 'right',
+          },
+        ],
+      },
+      footer: {
+        style: 'dark',
+        links: [
+          {
+            title: 'Docs',
+            items: [
+              {
+                label: 'Get Started',
+                to: '/',
+              },
+              {
+                label: 'Privacy',
+                to: '/privacy',
+              },
+              {
+                label: 'Features',
+                to: '/features/all_features',
+              },
+              {
+                label: 'Client Apps',
+                to: '/category/clients',
+              },
+              {
+                label: 'Self-Hosting',
+                to: '/get-started/setup',
+              },
+              {
+                label: 'Contributing',
+                to: '/contributing/development',
+              },
+            ],
+          },
+          {
+            title: 'Community',
+            items: [
+              {
+                label: 'Discord',
+                href: 'https://discord.gg/BDgyabRM6e',
+              },
+              {
+                label: 'LinkedIn',
+                href: 'https://www.linkedin.com/company/khoj-ai/'
+              },
+              {
+                label: 'Twitter',
+                href: 'https://twitter.com/khoj_ai',
+              },
+              {
+                label: 'GitHub',
+                href: 'https://github.com/khoj-ai/khoj/issues',
+              },
+              {
+                label: 'Email',
+                href: 'mailto:team@khoj.dev',
+              }
+            ],
+          },
+          {
+            title: 'More',
+            items: [
+              {
+                href: 'https://blog.khoj.dev',
+                label: 'Blog',
+              },
+              {
+                label: 'Khoj Cloud',
+                href: 'https://app.khoj.dev/login',
+              },
+              {
+                label: 'GitHub',
+                href: 'https://github.com/khoj-ai/khoj',
+              },
+              {
+                label: 'Website',
+                href: 'https://khoj.dev',
+              },
+            ],
+          },
+        ],
+        copyright: `Copyright © ${new Date().getFullYear()} Khoj, Inc.`,
+      },
+      prism: {
+        theme: prismThemes.github,
+        darkTheme: prismThemes.dracula,
+      },
+      algolia: {
+        appId: "NBR0FXJNGW",
+        apiKey: "8841b34192a28b2d06f04dd28d768017",
+        indexName: "khoj",
+        contextualSearch: false,
+      }
+    }),
+};
+
+export default config;
--- a/documentation/package.json
+++ b/documentation/package.json
@@ -0,0 +1,45 @@
+{
+  "name": "documentation",
+  "version": "0.0.0",
+  "private": true,
+  "scripts": {
+    "docusaurus": "docusaurus",
+    "start": "docusaurus start",
+    "build": "docusaurus build",
+    "swizzle": "docusaurus swizzle",
+    "deploy": "docusaurus deploy",
+    "clear": "docusaurus clear",
+    "serve": "docusaurus serve",
+    "write-translations": "docusaurus write-translations",
+    "write-heading-ids": "docusaurus write-heading-ids"
+  },
+  "dependencies": {
+    "@docusaurus/core": "^3.2.1",
+    "@docusaurus/plugin-sitemap": "^3.2.1",
+    "@docusaurus/preset-classic": "^3.2.1",
+    "@mdx-js/react": "^3.0.0",
+    "clsx": "^2.0.0",
+    "prism-react-renderer": "^2.3.0",
+    "react": "^18.0.0",
+    "react-dom": "^18.0.0"
+  },
+  "devDependencies": {
+    "@docusaurus/module-type-aliases": "^3.2.1",
+    "@docusaurus/types": "^3.2.1"
+  },
+  "browserslist": {
+    "production": [
+      ">0.5%",
+      "not dead",
+      "not op_mini all"
+    ],
+    "development": [
+      "last 3 chrome version",
+      "last 3 firefox version",
+      "last 5 safari version"
+    ]
+  },
+  "engines": {
+    "node": ">=18.0"
+  }
+}
--- a/documentation/sidebars.js
+++ b/documentation/sidebars.js
@@ -0,0 +1,33 @@
+/**
+ * Creating a sidebar enables you to:
+ - create an ordered group of docs
+ - render a sidebar for each doc of that group
+ - provide next/previous navigation
+
+ The sidebars can be generated from the filesystem, or explicitly defined here.
+
+ Create as many sidebars as you want.
+ */
+
+// @ts-check
+
+/** @type {import('@docusaurus/plugin-content-docs').SidebarsConfig} */
+const sidebars = {
+  // By default, Docusaurus generates a sidebar from the docs folder structure.
+  // This is the only active sidebar: a single autogenerated entry whose
+  // `dirName` is '.'.
+  tutorialSidebar: [{type: 'autogenerated', dirName: '.'}],
+
+  // But you can create a sidebar manually.
+  // The example below is commented out and therefore inactive; it shows the
+  // hand-written form (doc ids plus a nested 'category' item). Enabling it
+  // as-is would redefine the `tutorialSidebar` key above.
+  /*
+  tutorialSidebar: [
+    'intro',
+    'hello',
+    {
+      type: 'category',
+      label: 'Tutorial',
+      items: ['tutorial-basics/create-a-document'],
+    },
+  ],
+   */
+};
+
+export default sidebars;
--- a/documentation/src/components/HomepageFeatures/styles.module.css
+++ b/documentation/src/components/HomepageFeatures/styles.module.css
@@ -0,0 +1,11 @@
+/* Full-width flex container: children are centered on the cross axis and
+ * the block gets 2rem of padding above and below (none left/right). */
+.features {
+  display: flex;
+  align-items: center;
+  padding: 2rem 0;
+  width: 100%;
+}
+
+/* Fixed 200px x 200px box; presumably applied to the feature illustrations
+ * (SVGs) of the HomepageFeatures component - confirm against the component. */
+.featureSvg {
+  height: 200px;
+  width: 200px;
+}
--- a/documentation/src/css/custom.css
+++ b/documentation/src/css/custom.css
@@ -0,0 +1,37 @@
+/**
+ * Any CSS included here will be global. The classic template
+ * bundles Infima by default. Infima is a CSS framework designed to
+ * work well for content-centric websites.
+ */
+
+/* Load the 'Source Sans 3' web font from Google Fonts; it is referenced by
+ * --ifm-heading-font-family and the body rule further down this file. */
+ @import url('https://fonts.googleapis.com/css2?family=Source+Sans+3&display=swap');
+
+/* You can override the default Infima variables here.
+ * Note: all seven --ifm-color-primary* shades are set to the same value
+ * (#fcc50b), so the "dark"/"light" variants do not differ from the base
+ * primary color. */
+:root {
+  --ifm-color-primary: #fcc50b;
+  --ifm-color-primary-dark: #fcc50b;
+  --ifm-color-primary-darker: #fcc50b;
+  --ifm-color-primary-darkest: #fcc50b;
+  --ifm-color-primary-light: #fcc50b;
+  --ifm-color-primary-lighter: #fcc50b;
+  --ifm-color-primary-lightest: #fcc50b;
+  --ifm-code-font-size: 95%;
+  --ifm-heading-font-family: 'Source Sans 3', sans-serif;
+  /* Background of highlighted code lines: black at 10% opacity. */
+  --docusaurus-highlighted-code-line-bg: rgba(0, 0, 0, 0.1);
+}
+
+/* Dark-mode overrides. For readability a lighter palette is usually chosen
+ * in dark mode, but here every --ifm-color-primary* shade keeps the same
+ * #fcc50b used in :root; the only value that differs from :root is the
+ * highlighted code line background (black at 30% instead of 10% opacity). */
+[data-theme='dark'] {
+  --ifm-color-primary: #fcc50b;
+  --ifm-color-primary-dark: #fcc50b;
+  --ifm-color-primary-darker: #fcc50b;
+  --ifm-color-primary-darkest: #fcc50b;
+  --ifm-color-primary-light: #fcc50b;
+  --ifm-color-primary-lighter: #fcc50b;
+  --ifm-color-primary-lightest: #fcc50b;
+  --docusaurus-highlighted-code-line-bg: rgba(0, 0, 0, 0.3);
+}
+
+/* Site-wide body font: 'Source Sans 3', falling back to the generic
+ * sans-serif family if the web font is unavailable. */
+body {
+  font-family: 'Source Sans 3', sans-serif;
+}
--- a/documentation/yarn.lock
+++ b/documentation/yarn.lock
--- a/Show More
+++ b/Show More