├── docs
├── docs
│ ├── index.md
│ ├── api_reference
│ │ └── llama_deploy
│ │ │ ├── types.md
│ │ │ ├── python_sdk.md
│ │ │ └── apiserver.md
│ ├── _static
│ │ ├── assets
│ │ │ └── LlamaLogoBrowserTab.png
│ │ ├── css
│ │ │ └── custom.css
│ │ └── js
│ │ │ ├── leadfeeder.js
│ │ │ └── mendablesearch.js
│ ├── css
│ │ ├── custom.css
│ │ └── style.css
│ ├── module_guides
│ │ └── llama_deploy
│ │ │ ├── 40_llamactl.md
│ │ │ ├── 20_core_components.md
│ │ │ ├── 30_python_sdk.md
│ │ │ ├── index.md
│ │ │ └── 10_getting_started.md
│ └── javascript
│ │ ├── llms_example.js
│ │ └── mendablesearch.js
├── overrides
│ ├── main.html
│ └── partials
│ │ ├── copyright.html
│ │ └── search.html
├── pyproject.toml
├── README.md
└── mkdocs.yml
├── tests
├── __init__.py
├── cli
│ ├── __init__.py
│ ├── internal
│ │ ├── __init__.py
│ │ └── test_config.py
│ ├── data
│ │ ├── deployment.yaml
│ │ └── config.yaml
│ ├── test_cli.py
│ ├── test_sessions.py
│ ├── test_deploy.py
│ ├── conftest.py
│ ├── test_init.py
│ ├── test_status.py
│ └── test_run.py
├── client
│ ├── models
│ │ ├── __init__.py
│ │ ├── conftest.py
│ │ └── test_model.py
│ └── test_client.py
└── apiserver
│ ├── routers
│ ├── __init__.py
│ └── test_status.py
│ ├── data
│ ├── .env
│ ├── workflow
│ │ ├── __init__.py
│ │ └── workflow_test.py
│ ├── local.yaml
│ ├── git_service.yaml
│ ├── env_variables.yaml
│ ├── python_dependencies.yaml
│ ├── service_ports.yaml
│ ├── python_dependencies_kitchen_sink.yaml
│ ├── with_ui.yaml
│ └── example.yaml
│ ├── source_managers
│ ├── __init__.py
│ ├── test_git.py
│ └── test_local.py
│ ├── test_app.py
│ ├── test_settings.py
│ ├── conftest.py
│ ├── test_config_parser.py
│ └── test_server.py
├── e2e_tests
├── __init__.py
├── apiserver
│ ├── __init__.py
│ ├── rc
│ │ ├── src
│ │ │ ├── __init__.py
│ │ │ └── workflow.py
│ │ └── deployment.yml
│ ├── deployments
│ │ ├── src
│ │ │ ├── .env
│ │ │ ├── __init__.py
│ │ │ ├── workflow_reload.py
│ │ │ ├── workflow_hitl.py
│ │ │ ├── workflow.py
│ │ │ └── workflow_env.py
│ │ ├── deployment_hitl.yml
│ │ ├── deployment2.yml
│ │ ├── deployment_streaming.yml
│ │ ├── deployment1.yml
│ │ ├── deployment_reload1.yml
│ │ ├── deployment_reload2.yml
│ │ ├── deployment_env_local.yml
│ │ └── deployment_env_git.yml
│ ├── test_autodeploy.py
│ ├── test_status.py
│ ├── test_env_vars_local.py
│ ├── test_env_vars_git.py
│ ├── test_service_entrypoint.py
│ ├── test_streaming.py
│ ├── test_hitl.py
│ ├── test_reload.py
│ ├── test_deploy.py
│ └── conftest.py
└── README.md
├── templates
└── basic
│ ├── src
│ ├── __init__.py
│ └── workflow.py
│ └── ui
│ ├── app
│ ├── favicon.ico
│ ├── globals.css
│ └── layout.tsx
│ ├── postcss.config.mjs
│ ├── public
│ ├── file.svg
│ └── logo-dark-light.svg
│ ├── next.config.ts
│ ├── eslint.config.mjs
│ ├── .gitignore
│ ├── tsconfig.json
│ └── package.json
├── llama_deploy
├── apiserver
│ ├── __init__.py
│ ├── routers
│ │ ├── __init__.py
│ │ └── status.py
│ ├── source_managers
│ │ ├── __init__.py
│ │ ├── base.py
│ │ ├── git.py
│ │ └── local.py
│ ├── __main__.py
│ ├── stats.py
│ ├── app.py
│ ├── server.py
│ └── settings.py
├── client
│ ├── __init__.py
│ ├── models
│ │ ├── __init__.py
│ │ └── model.py
│ ├── base.py
│ └── client.py
├── cli
│ ├── __main__.py
│ ├── internal
│ │ ├── utils.py
│ │ └── config.py
│ ├── sessions.py
│ ├── status.py
│ ├── deploy.py
│ ├── run.py
│ ├── serve.py
│ └── __init__.py
├── __init__.py
└── types
│ ├── apiserver.py
│ ├── __init__.py
│ └── core.py
├── examples
├── python_dependencies
│ ├── .python-version
│ ├── requirements.txt
│ ├── pyproject.toml
│ ├── deployment.yaml
│ ├── workflow.py
│ ├── uv.lock
│ └── README.md
├── python_fullstack
│ ├── frontend
│ │ ├── frontend
│ │ │ ├── __init__.py
│ │ │ ├── session_list
│ │ │ │ ├── __init__.py
│ │ │ │ ├── component.py
│ │ │ │ └── state.py
│ │ │ ├── style.py
│ │ │ ├── frontend.py
│ │ │ └── state.py
│ │ ├── requirements.txt
│ │ ├── .gitignore
│ │ ├── assets
│ │ │ └── favicon.ico
│ │ ├── rxconfig.py
│ │ └── dockerfile
│ ├── llama_deploy_frontend.png
│ ├── workflows
│ │ ├── data
│ │ │ └── attention.pdf
│ │ ├── __init__.py
│ │ ├── requirements.txt
│ │ ├── dockerfile
│ │ └── agent_workflow.py
│ ├── python_fullstack.yaml
│ ├── docker-compose.yml
│ └── README.md
├── quick_start
│ ├── ui
│ │ ├── app
│ │ │ ├── favicon.ico
│ │ │ ├── globals.css
│ │ │ ├── layout.tsx
│ │ │ └── confetti
│ │ │ │ └── page.tsx
│ │ ├── postcss.config.mjs
│ │ ├── public
│ │ │ ├── file.svg
│ │ │ └── logo-dark-light.svg
│ │ ├── next.config.ts
│ │ ├── eslint.config.mjs
│ │ ├── .gitignore
│ │ ├── tsconfig.json
│ │ └── package.json
│ ├── quick_start.yml
│ └── src
│ │ └── workflow.py
├── llamacloud
│ └── google_drive
│ │ ├── src
│ │ ├── config.yml
│ │ └── workflow.py
│ │ └── deployment.yml
└── google_cloud_run
│ ├── deployment.yml
│ ├── src
│ └── workflow.py
│ └── Dockerfile
├── system_diagram.png
├── .taplo.toml
├── .gitignore
├── .github
├── release.yml
└── workflows
│ ├── gh_project.yml
│ ├── lint.yml
│ ├── e2e_test.yml
│ ├── publish_release.yml
│ ├── unit_test.yml
│ ├── docker_release.yml
│ └── codeql.yml
├── docker
├── run_apiserver.py
├── README.md
├── Dockerfile.base
└── docker-bake.hcl
├── LICENSE
├── CONTRIBUTING.md
├── .pre-commit-config.yaml
└── pyproject.toml
/docs/docs/index.md:
--------------------------------------------------------------------------------
1 |
--------------------------------------------------------------------------------
/tests/__init__.py:
--------------------------------------------------------------------------------
1 |
--------------------------------------------------------------------------------
/e2e_tests/__init__.py:
--------------------------------------------------------------------------------
1 |
--------------------------------------------------------------------------------
/tests/cli/__init__.py:
--------------------------------------------------------------------------------
1 |
--------------------------------------------------------------------------------
/e2e_tests/apiserver/__init__.py:
--------------------------------------------------------------------------------
1 |
--------------------------------------------------------------------------------
/templates/basic/src/__init__.py:
--------------------------------------------------------------------------------
1 |
--------------------------------------------------------------------------------
/tests/cli/internal/__init__.py:
--------------------------------------------------------------------------------
1 |
--------------------------------------------------------------------------------
/tests/client/models/__init__.py:
--------------------------------------------------------------------------------
1 |
--------------------------------------------------------------------------------
/e2e_tests/apiserver/rc/src/__init__.py:
--------------------------------------------------------------------------------
1 |
--------------------------------------------------------------------------------
/llama_deploy/apiserver/__init__.py:
--------------------------------------------------------------------------------
1 |
--------------------------------------------------------------------------------
/tests/apiserver/routers/__init__.py:
--------------------------------------------------------------------------------
1 |
--------------------------------------------------------------------------------
/tests/apiserver/data/.env:
--------------------------------------------------------------------------------
1 | API_KEY=123
2 |
--------------------------------------------------------------------------------
/tests/apiserver/source_managers/__init__.py:
--------------------------------------------------------------------------------
1 |
--------------------------------------------------------------------------------
/examples/python_dependencies/.python-version:
--------------------------------------------------------------------------------
1 | 3.13
2 |
--------------------------------------------------------------------------------
/examples/python_fullstack/frontend/frontend/__init__.py:
--------------------------------------------------------------------------------
1 |
--------------------------------------------------------------------------------
/e2e_tests/apiserver/deployments/src/.env:
--------------------------------------------------------------------------------
1 | VAR_1=z
2 | API_KEY=123
3 |
--------------------------------------------------------------------------------
/examples/python_fullstack/frontend/frontend/session_list/__init__.py:
--------------------------------------------------------------------------------
1 |
--------------------------------------------------------------------------------
/examples/python_fullstack/frontend/requirements.txt:
--------------------------------------------------------------------------------
1 | llama-deploy
2 | reflex
3 |
--------------------------------------------------------------------------------
/docs/docs/api_reference/llama_deploy/types.md:
--------------------------------------------------------------------------------
1 | # `types`
2 |
3 | ::: llama_deploy.types
4 |
--------------------------------------------------------------------------------
/llama_deploy/client/__init__.py:
--------------------------------------------------------------------------------
1 | from .client import Client
2 |
3 | __all__ = ["Client"]
4 |
--------------------------------------------------------------------------------
/system_diagram.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/run-llama/llama_deploy/HEAD/system_diagram.png
--------------------------------------------------------------------------------
/docs/overrides/main.html:
--------------------------------------------------------------------------------
1 | {% extends "base.html" %} {% block header %} {{ super() }} {% endblock %}
2 |
--------------------------------------------------------------------------------
/docs/overrides/partials/copyright.html:
--------------------------------------------------------------------------------
1 |
2 |
--------------------------------------------------------------------------------
/examples/python_dependencies/requirements.txt:
--------------------------------------------------------------------------------
1 | # This is a test of a version range
2 | fortune-python>1,<1.1
3 |
--------------------------------------------------------------------------------
/examples/python_fullstack/frontend/.gitignore:
--------------------------------------------------------------------------------
1 | *.db
2 | *.py[cod]
3 | .web
4 | __pycache__/
5 | assets/external/
6 |
--------------------------------------------------------------------------------
/templates/basic/ui/app/favicon.ico:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/run-llama/llama_deploy/HEAD/templates/basic/ui/app/favicon.ico
--------------------------------------------------------------------------------
/examples/quick_start/ui/app/favicon.ico:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/run-llama/llama_deploy/HEAD/examples/quick_start/ui/app/favicon.ico
--------------------------------------------------------------------------------
/templates/basic/ui/postcss.config.mjs:
--------------------------------------------------------------------------------
1 | const config = {
2 | plugins: ["@tailwindcss/postcss"],
3 | };
4 |
5 | export default config;
6 |
--------------------------------------------------------------------------------
/examples/quick_start/ui/postcss.config.mjs:
--------------------------------------------------------------------------------
1 | const config = {
2 | plugins: ["@tailwindcss/postcss"],
3 | };
4 |
5 | export default config;
6 |
--------------------------------------------------------------------------------
/tests/cli/data/deployment.yaml:
--------------------------------------------------------------------------------
1 | name: TestDeployment
2 |
3 | control-plane: {}
4 |
5 | services:
6 | test-workflow:
7 | name: Test Workflow
8 |
--------------------------------------------------------------------------------
/docs/docs/_static/assets/LlamaLogoBrowserTab.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/run-llama/llama_deploy/HEAD/docs/docs/_static/assets/LlamaLogoBrowserTab.png
--------------------------------------------------------------------------------
/examples/python_fullstack/llama_deploy_frontend.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/run-llama/llama_deploy/HEAD/examples/python_fullstack/llama_deploy_frontend.png
--------------------------------------------------------------------------------
/docs/overrides/partials/search.html:
--------------------------------------------------------------------------------
1 | {% import "partials/language.html" as lang with context %}
2 |
3 |
4 |
5 |
--------------------------------------------------------------------------------
/examples/python_fullstack/frontend/assets/favicon.ico:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/run-llama/llama_deploy/HEAD/examples/python_fullstack/frontend/assets/favicon.ico
--------------------------------------------------------------------------------
/examples/python_fullstack/workflows/data/attention.pdf:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/run-llama/llama_deploy/HEAD/examples/python_fullstack/workflows/data/attention.pdf
--------------------------------------------------------------------------------
/tests/apiserver/data/workflow/__init__.py:
--------------------------------------------------------------------------------
1 | from .workflow_test import MyWorkflow, _TestEnvWorkflow
2 |
3 | my_workflow = MyWorkflow()
4 | env_reader_workflow = _TestEnvWorkflow()
5 |
--------------------------------------------------------------------------------
/llama_deploy/apiserver/routers/__init__.py:
--------------------------------------------------------------------------------
1 | from .deployments import deployments_router
2 | from .status import status_router
3 |
4 | __all__ = ["deployments_router", "status_router"]
5 |
--------------------------------------------------------------------------------
/examples/llamacloud/google_drive/src/config.yml:
--------------------------------------------------------------------------------
1 | llamacloud:
2 | index_name: ""
3 | project_name: ""
4 | organization_id: ""
5 |
--------------------------------------------------------------------------------
/llama_deploy/client/models/__init__.py:
--------------------------------------------------------------------------------
1 | from .apiserver import ApiServer
2 | from .model import Collection, Model, make_sync
3 |
4 | __all__ = ["ApiServer", "Collection", "Model", "make_sync"]
5 |
--------------------------------------------------------------------------------
/examples/python_fullstack/frontend/rxconfig.py:
--------------------------------------------------------------------------------
1 | import reflex as rx
2 |
3 | config = rx.Config(
4 | app_name="frontend",
5 | api_url="http://localhost:9000",
6 | backend_port=9000,
7 | deployment_name="deployment",
8 | )
9 |
--------------------------------------------------------------------------------
/examples/python_fullstack/workflows/__init__.py:
--------------------------------------------------------------------------------
1 | from .agent_workflow import build_agentic_workflow
2 | from .rag_workflow import build_rag_workflow
3 |
4 |
5 | rag_w = build_rag_workflow()
6 | agentic_w = build_agentic_workflow(rag_w)
7 |
--------------------------------------------------------------------------------
/llama_deploy/apiserver/source_managers/__init__.py:
--------------------------------------------------------------------------------
1 | from .base import SourceManager
2 | from .git import GitSourceManager
3 | from .local import LocalSourceManager
4 |
5 | __all__ = ["GitSourceManager", "LocalSourceManager", "SourceManager"]
6 |
--------------------------------------------------------------------------------
/.taplo.toml:
--------------------------------------------------------------------------------
1 | [formatting]
2 | align_comments = false
3 | reorder_keys = false
4 | # Following are to be consistent with toml-sort
5 | indent_string = " "
6 | array_trailing_comma = false
7 | compact_arrays = true
8 | compact_inline_tables = true
9 |
--------------------------------------------------------------------------------
/e2e_tests/apiserver/test_autodeploy.py:
--------------------------------------------------------------------------------
1 | import pytest
2 |
3 |
4 | @pytest.mark.asyncio
5 | async def test_autodeploy(client, apiserver_with_rc):
6 | status = await client.apiserver.status()
7 | assert "AutoDeployed" in status.deployments
8 |
--------------------------------------------------------------------------------
/llama_deploy/cli/__main__.py:
--------------------------------------------------------------------------------
1 | import sys
2 | from llama_deploy.cli import llamactl
3 |
4 |
5 | def main() -> None:
6 | """CLI entrypoint."""
7 | sys.exit(llamactl())
8 |
9 |
10 | if __name__ == "__main__": # pragma: no cover
11 | main()
12 |
--------------------------------------------------------------------------------
/docs/docs/api_reference/llama_deploy/python_sdk.md:
--------------------------------------------------------------------------------
1 | # Python SDK
2 |
3 | ## Client
4 |
5 | ::: llama_deploy.client.Client
6 | options:
7 | show_bases: false
8 |
9 |
10 | ## API Server functionalities
11 |
12 | ::: llama_deploy.client.models.apiserver
13 |
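As a quick orientation, here is a minimal usage sketch (an illustrative snippet assuming an API Server is running at the default address, `http://localhost:4501`):

```python
import asyncio

from llama_deploy.client import Client


async def main() -> None:
    # Client() picks up the default API Server address and timeout
    client = Client()
    status = await client.apiserver.status()
    print(status.status.value)  # e.g. "Healthy"


if __name__ == "__main__":
    asyncio.run(main())
```

A synchronous facade is also available through `client.sync`, e.g. `client.sync.apiserver.status()`.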
--------------------------------------------------------------------------------
/examples/python_dependencies/pyproject.toml:
--------------------------------------------------------------------------------
1 | [project]
2 | name = "uv-requirements"
3 | version = "0.1.0"
4 | description = "Add your description here"
5 | readme = "README.md"
6 | requires-python = ">=3.10, <4.0"
7 | dependencies = [
8 | "pyfiglet>=1.0.3"
9 | ]
10 |
--------------------------------------------------------------------------------
/docs/docs/css/custom.css:
--------------------------------------------------------------------------------
1 | #my-component-root *,
2 | #headlessui-portal-root * {
3 | z-index: 1000000000000;
4 | font-size: 100%;
5 | }
6 |
7 | textarea {
8 | border: 0;
9 | padding: 0;
10 | }
11 |
12 | article p {
13 | margin-bottom: 10px !important;
14 | }
15 |
--------------------------------------------------------------------------------
/tests/cli/data/config.yaml:
--------------------------------------------------------------------------------
1 | current_profile: default
2 | profiles:
3 | default:
4 | insecure: false
5 | server: http://localhost:4501
6 | timeout: 120.0
7 |
8 | test:
9 | insecure: false
10 | server: http://localhost:4501
11 | timeout: 120.0
12 |
--------------------------------------------------------------------------------
/docs/docs/_static/css/custom.css:
--------------------------------------------------------------------------------
1 | #my-component-root *,
2 | #headlessui-portal-root * {
3 | z-index: 1000000000000;
4 | font-size: 100%;
5 | }
6 |
7 | textarea {
8 | border: 0;
9 | padding: 0;
10 | }
11 |
12 | article p {
13 | margin-bottom: 10px !important;
14 | }
15 |
--------------------------------------------------------------------------------
/tests/apiserver/test_app.py:
--------------------------------------------------------------------------------
1 | from fastapi.testclient import TestClient
2 |
3 |
4 | def test_read_main(http_client: TestClient) -> None:
5 | response = http_client.get("/")
6 | assert response.status_code == 200
7 | assert set(response.json().keys()) == {"swagger_docs", "status"}
8 |
--------------------------------------------------------------------------------
/docs/docs/api_reference/llama_deploy/apiserver.md:
--------------------------------------------------------------------------------
1 | # `apiserver`
2 |
3 | ::: llama_deploy.apiserver.deployment
4 |
5 | ::: llama_deploy.apiserver.deployment_config_parser
6 | options:
7 | members:
8 | - DeploymentConfig
9 |
10 | ::: llama_deploy.apiserver.source_managers
11 |
--------------------------------------------------------------------------------
/e2e_tests/apiserver/deployments/src/__init__.py:
--------------------------------------------------------------------------------
1 | from .workflow import EchoWorkflow
2 | from .workflow_reload import EchoWithPrompt
3 |
4 | my_workflow = EchoWorkflow()
5 | echo_workflow_en = EchoWithPrompt(prompt_msg="I have received:")
6 | echo_workflow_it = EchoWithPrompt(prompt_msg="Ho ricevuto:")
7 |
--------------------------------------------------------------------------------
/examples/python_fullstack/workflows/requirements.txt:
--------------------------------------------------------------------------------
1 | llama-deploy[rabbitmq, kafka, redis]==0.1.1
2 | llama-index-postprocessor-rankgpt-rerank>=0.2.0
3 | llama-index-vector-stores-qdrant>=0.3.0
4 | llama-index-llms-openai>=0.2.2
5 | llama-index-embeddings-openai>=0.2.4
6 | llama-index-readers-file>=0.2.0
7 |
--------------------------------------------------------------------------------
/examples/google_cloud_run/deployment.yml:
--------------------------------------------------------------------------------
1 | name: CloudRunExample
2 |
3 | control-plane:
4 | port: 8000
5 |
6 | default-service: dummy_workflow
7 |
8 | services:
9 | dummy_workflow:
10 | name: Dummy Workflow
11 | source:
12 | type: local
13 | name: .
14 | path: workflow:echo_workflow
15 |
--------------------------------------------------------------------------------
/tests/apiserver/data/local.yaml:
--------------------------------------------------------------------------------
1 | name: LocalDeploymentRelativePath
2 |
3 | control-plane: {}
4 |
5 | services:
6 | test-workflow:
7 | name: Test Workflow
8 | port: 8002
9 | host: localhost
10 | source:
11 | type: local
12 | location: workflow
13 | import-path: workflow:my_workflow
14 |
--------------------------------------------------------------------------------
/docs/docs/module_guides/llama_deploy/40_llamactl.md:
--------------------------------------------------------------------------------
1 | # CLI
2 |
3 | `llamactl` is a command line interface that ships with LlamaDeploy. Its main goal is to make it easy to interact
4 | with a running [API Server](./20_core_components.md#api-server).
5 |
6 | ::: mkdocs-click
7 | :module: llama_deploy.cli
8 | :command: llamactl
9 |
--------------------------------------------------------------------------------
/e2e_tests/apiserver/deployments/deployment_hitl.yml:
--------------------------------------------------------------------------------
1 | name: HumanInTheLoop
2 |
3 | control-plane:
4 | port: 8000
5 |
6 | default-service: hitl_workflow
7 |
8 | services:
9 | hitl_workflow:
10 | name: HITL Workflow
11 | source:
12 | type: local
13 | name: src
14 | path: src/workflow_hitl:workflow
15 |
--------------------------------------------------------------------------------
/e2e_tests/apiserver/rc/deployment.yml:
--------------------------------------------------------------------------------
1 | name: AutoDeployed
2 |
3 | control-plane: {}
4 |
5 | default-service: test-workflow
6 |
7 | services:
8 | test-workflow:
9 | name: Test Workflow
10 | port: 8002
11 | host: localhost
12 | source:
13 | type: local
14 | name: src
15 | path: src/workflow:echo_workflow
16 |
--------------------------------------------------------------------------------
/.gitignore:
--------------------------------------------------------------------------------
1 | # Byte-compiled / optimized
2 | __pycache__/
3 | *.py[cod]
4 |
5 | # Unit test / coverage reports
6 | .coverage
7 | .coverage.*
8 | coverage.*
9 | .pytest_cache/
10 |
11 | # Build artifacts
12 | dist/
13 |
14 | # Project related
15 | .tool-versions
16 |
17 | # IDEs
18 | .idea
19 | .DS_Store
20 | .vscode
21 | .zed
22 | .claude
23 |
--------------------------------------------------------------------------------
/e2e_tests/apiserver/deployments/deployment2.yml:
--------------------------------------------------------------------------------
1 | name: TestDeployment2
2 |
3 | control-plane: {}
4 |
5 | default-service: dummy_workflow
6 |
7 | services:
8 | test-workflow:
9 | name: Test Workflow
10 | port: 8002
11 | host: localhost
12 | source:
13 | type: local
14 | name: src
15 | path: src:my_workflow
16 |
--------------------------------------------------------------------------------
/tests/client/models/conftest.py:
--------------------------------------------------------------------------------
1 | from typing import Any, Iterator
2 | from unittest import mock
3 |
4 | import pytest
5 |
6 | from llama_deploy.client import Client
7 |
8 |
9 | @pytest.fixture
10 | def client(monkeypatch: Any) -> Iterator[Client]:
11 | monkeypatch.setattr(Client, "request", mock.AsyncMock())
12 | yield Client()
13 |
--------------------------------------------------------------------------------
/e2e_tests/apiserver/deployments/deployment_streaming.yml:
--------------------------------------------------------------------------------
1 | name: Streaming
2 |
3 | control-plane:
4 | port: 8000
5 |
6 | default-service: streaming_workflow
7 |
8 | services:
9 | streaming_workflow:
10 | name: Streaming Workflow
11 | source:
12 | type: local
13 | name: src
14 | path: src/workflow:streaming_workflow
15 |
--------------------------------------------------------------------------------
/tests/apiserver/data/git_service.yaml:
--------------------------------------------------------------------------------
1 | name: TestDeployment
2 |
3 | control-plane: {}
4 |
5 | services:
6 | test-workflow:
7 | name: Test Workflow
8 | port: 8002
9 | host: localhost
10 | source:
11 | type: git
12 | location: https://github.com/run-llama/llama_deploy.git
13 | import-path: tests/apiserver/data/workflow:my_workflow
14 |
--------------------------------------------------------------------------------
/.github/release.yml:
--------------------------------------------------------------------------------
1 | changelog:
2 | categories:
3 | - title: Breaking Changes ⚠️
4 | labels:
5 | - breaking-change
6 | - title: New Features 🎉
7 | labels:
8 | - '*'
9 | - title: Bug Fixes 🐛
10 | labels:
11 | - bug
12 | - title: Documentation 📚
13 | labels:
14 | - documentation
15 | - example
16 |
--------------------------------------------------------------------------------
/llama_deploy/__init__.py:
--------------------------------------------------------------------------------
1 | import logging
2 |
3 | root_logger = logging.getLogger("llama_deploy")
4 |
5 | formatter = logging.Formatter("%(levelname)s:%(name)s - %(message)s")
6 | console_handler = logging.StreamHandler()
7 | console_handler.setFormatter(formatter)
8 | root_logger.addHandler(console_handler)
9 |
10 | root_logger.setLevel(logging.INFO)
11 | root_logger.propagate = True
12 |
--------------------------------------------------------------------------------
/e2e_tests/apiserver/deployments/deployment1.yml:
--------------------------------------------------------------------------------
1 | name: TestDeployment1
2 |
3 | control-plane: {}
4 |
5 | default-service: dummy_workflow
6 |
7 | services:
8 | test-workflow:
9 | name: Test Workflow
10 | port: 8002
11 | host: localhost
12 | source:
13 | type: git
14 | name: https://github.com/run-llama/llama_deploy.git
15 | path: e2e_tests/apiserver/deployments/src:my_workflow
16 |
--------------------------------------------------------------------------------
/e2e_tests/apiserver/deployments/deployment_reload1.yml:
--------------------------------------------------------------------------------
1 | name: ReloadMe
2 |
3 | control-plane: {}
4 |
5 | default-service: test-workflow
6 |
7 | services:
8 | test-workflow:
9 | name: Test Workflow
10 | port: 8002
11 | host: localhost
12 | source:
13 | type: git
14 | name: https://github.com/run-llama/llama_deploy.git
15 | path: e2e_tests/apiserver/deployments/src:echo_workflow_en
16 |
--------------------------------------------------------------------------------
/e2e_tests/apiserver/deployments/deployment_reload2.yml:
--------------------------------------------------------------------------------
1 | name: ReloadMe
2 |
3 | control-plane: {}
4 |
5 | default-service: test-workflow
6 |
7 | services:
8 | test-workflow:
9 | name: Test Workflow
10 | port: 8002
11 | host: localhost
12 | source:
13 | type: git
14 | name: https://github.com/run-llama/llama_deploy.git
15 | path: e2e_tests/apiserver/deployments/src:echo_workflow_it
16 |
--------------------------------------------------------------------------------
/examples/python_dependencies/deployment.yaml:
--------------------------------------------------------------------------------
1 | name: dependencies
2 |
3 | control-plane:
4 | port: 8000
5 |
6 | default-service: echo_workflow
7 |
8 | services:
9 | echo_workflow:
10 | name: Pretty Echo Workflow
11 | source:
12 | type: local
13 | name: src
14 | path: workflow:echo_workflow
15 | python-dependencies:
16 | - cowpy
17 | - "."
18 | - "requirements.txt"
19 |
--------------------------------------------------------------------------------
/templates/basic/ui/public/file.svg:
--------------------------------------------------------------------------------
1 |
2 |
--------------------------------------------------------------------------------
/examples/quick_start/quick_start.yml:
--------------------------------------------------------------------------------
1 | name: QuickStart
2 |
3 | control-plane:
4 | port: 8000
5 |
6 | default-service: echo_workflow
7 |
8 | services:
9 | echo_workflow:
10 | name: Echo Workflow
11 | source:
12 | type: local
13 | name: src
14 | path: src/workflow:echo_workflow
15 |
16 | ui:
17 | name: My Nextjs App
18 | port: 3001
19 | source:
20 | type: local
21 | name: ui
22 |
--------------------------------------------------------------------------------
/examples/quick_start/ui/public/file.svg:
--------------------------------------------------------------------------------
1 |
2 |
--------------------------------------------------------------------------------
/llama_deploy/apiserver/__main__.py:
--------------------------------------------------------------------------------
1 | import uvicorn
2 | from prometheus_client import start_http_server
3 |
4 | from .settings import settings
5 |
6 | if __name__ == "__main__":
7 | if settings.prometheus_enabled:
8 | start_http_server(settings.prometheus_port)
9 |
10 | uvicorn.run(
11 | "llama_deploy.apiserver.app:app",
12 | host=settings.host,
13 | port=settings.port,
14 | )
15 |
--------------------------------------------------------------------------------
/llama_deploy/cli/internal/utils.py:
--------------------------------------------------------------------------------
1 | from pathlib import Path
2 |
3 | from platformdirs import user_config_dir
4 |
5 | DEFAULT_PROFILE_NAME = "default"
6 | DEFAULT_CONFIG_FILE_NAME = "config.yaml"
7 | DEFAULT_CONFIG_FOLDER_NAME = "llamactl"
8 |
9 |
10 | def _default_config_path() -> Path:
11 | base = user_config_dir(DEFAULT_CONFIG_FOLDER_NAME, appauthor=False)
12 | return Path(base) / DEFAULT_CONFIG_FILE_NAME
13 |
--------------------------------------------------------------------------------
/templates/basic/ui/next.config.ts:
--------------------------------------------------------------------------------
1 | import type { NextConfig } from "next";
2 |
3 | const nextConfig: NextConfig = {
4 | basePath: process.env.LLAMA_DEPLOY_NEXTJS_BASE_PATH,
5 | env: {
6 | NEXT_PUBLIC_LLAMA_DEPLOY_NEXTJS_DEPLOYMENT_NAME: process.env.LLAMA_DEPLOY_NEXTJS_DEPLOYMENT_NAME || "default",
7 | NEXT_PUBLIC_BASE_PATH: process.env.LLAMA_DEPLOY_NEXTJS_BASE_PATH,
8 | },
9 | };
10 |
11 | export default nextConfig;
12 |
--------------------------------------------------------------------------------
/docker/run_apiserver.py:
--------------------------------------------------------------------------------
1 | import uvicorn
2 | from prometheus_client import start_http_server
3 |
4 | from llama_deploy.apiserver.settings import settings
5 |
6 | if __name__ == "__main__":
7 | if settings.prometheus_enabled:
8 | start_http_server(settings.prometheus_port)
9 |
10 | uvicorn.run(
11 | "llama_deploy.apiserver.app:app",
12 | host=settings.host,
13 | port=settings.port,
14 | )
15 |
--------------------------------------------------------------------------------
/tests/apiserver/data/env_variables.yaml:
--------------------------------------------------------------------------------
1 | name: MyDeployment
2 |
3 | control-plane:
4 | port: 8000
5 |
6 | message-queue:
7 | type: simple
8 | host: "127.0.0.1"
9 | port: 8001
10 |
11 | default-service: myworkflow
12 |
13 | services:
14 | myworkflow:
15 | name: My Python Workflow
16 | env:
17 | VAR_1: x
18 | VAR_2: y
19 | env-files:
20 | - .env
21 | source:
22 | type: local
23 | location: workflow
24 |
--------------------------------------------------------------------------------
/examples/quick_start/ui/next.config.ts:
--------------------------------------------------------------------------------
1 | import type { NextConfig } from "next";
2 | const nextConfig: NextConfig = {
3 | basePath: process.env.LLAMA_DEPLOY_NEXTJS_BASE_PATH,
4 | env: {
5 | NEXT_PUBLIC_LLAMA_DEPLOY_NEXTJS_DEPLOYMENT_NAME:
6 | process.env.LLAMA_DEPLOY_NEXTJS_DEPLOYMENT_NAME || "default",
7 | NEXT_PUBLIC_BASE_PATH:
8 | process.env.LLAMA_DEPLOY_NEXTJS_BASE_PATH || "",
9 | },
10 | };
11 |
12 | export default nextConfig;
13 |
--------------------------------------------------------------------------------
/.github/workflows/gh_project.yml:
--------------------------------------------------------------------------------
1 | name: Add issues to GitHub project
2 |
3 | on:
4 | issues:
5 | types:
6 | - opened
7 |
8 | jobs:
9 | add-to-project:
10 | name: Add new issues to project for triage
11 | runs-on: ubuntu-latest
12 | steps:
13 | - uses: actions/add-to-project@v1.0.2
14 | with:
15 | project-url: https://github.com/orgs/run-llama/projects/8
16 | github-token: ${{ secrets.ADD_TO_PROJECT_PAT }}
17 |
--------------------------------------------------------------------------------
/tests/apiserver/data/python_dependencies.yaml:
--------------------------------------------------------------------------------
1 | name: MyDeployment
2 |
3 | control-plane:
4 | port: 8000
5 |
6 | message-queue:
7 | type: simple
8 | host: "127.0.0.1"
9 | port: 8001
10 |
11 | default-service: myworkflow
12 |
13 | services:
14 | myworkflow:
15 | name: My Python Workflow
16 | python-dependencies:
17 | - "llama-index-core<1"
18 | - "llama-index-llms-openai"
19 | source:
20 | type: local
21 | location: test
22 |
--------------------------------------------------------------------------------
/e2e_tests/apiserver/deployments/src/workflow_reload.py:
--------------------------------------------------------------------------------
1 | from workflows import Context, Workflow, step
2 | from workflows.events import StartEvent, StopEvent
3 |
4 |
5 | class EchoWithPrompt(Workflow):
6 | def __init__(self, prompt_msg):
7 | super().__init__()
8 | self._prompt_msg = prompt_msg
9 |
10 | @step
11 | def do_something(self, ctx: Context, ev: StartEvent) -> StopEvent:
12 | return StopEvent(result=f"{self._prompt_msg}{ev.data}")
13 |
--------------------------------------------------------------------------------
/llama_deploy/types/apiserver.py:
--------------------------------------------------------------------------------
1 | from enum import Enum
2 |
3 | from pydantic import BaseModel
4 |
5 |
6 | class StatusEnum(Enum):
7 | HEALTHY = "Healthy"
8 | UNHEALTHY = "Unhealthy"
9 | DOWN = "Down"
10 |
11 |
12 | class Status(BaseModel):
13 | status: StatusEnum
14 | status_message: str
15 | max_deployments: int | None = None
16 | deployments: list[str] | None = None
17 |
18 |
19 | class DeploymentDefinition(BaseModel):
20 | name: str
21 |
--------------------------------------------------------------------------------
/tests/apiserver/data/service_ports.yaml:
--------------------------------------------------------------------------------
1 | name: TestDeployment
2 |
3 | control-plane: {}
4 |
5 | services:
6 | no-port:
7 | name: No Port
8 | source:
9 | type: local
10 | location: workflow
11 |
12 | has-port:
13 | name: Has Port
14 | port: 9999
15 | source:
16 | type: local
17 | location: workflow
18 |
19 | no-port-again:
20 | name: Again no Port
21 | source:
22 | type: local
23 | location: workflow
24 |
--------------------------------------------------------------------------------
/.github/workflows/lint.yml:
--------------------------------------------------------------------------------
1 | name: Linting
2 |
3 | on:
4 | push:
5 | branches:
6 | - main
7 | pull_request:
8 |
9 | jobs:
10 | lint:
11 | runs-on: ubuntu-latest
12 | steps:
13 | - uses: actions/checkout@v3
14 |
15 | - name: Install uv
16 | uses: astral-sh/setup-uv@v5
17 |
18 | - name: Set up Python
19 | run: uv python install
20 |
21 | - name: Run linter
22 | shell: bash
23 | run: uv run -- pre-commit run -a
24 |
--------------------------------------------------------------------------------
/templates/basic/ui/eslint.config.mjs:
--------------------------------------------------------------------------------
1 | import { dirname } from "path";
2 | import { fileURLToPath } from "url";
3 | import { FlatCompat } from "@eslint/eslintrc";
4 |
5 | const __filename = fileURLToPath(import.meta.url);
6 | const __dirname = dirname(__filename);
7 |
8 | const compat = new FlatCompat({
9 | baseDirectory: __dirname,
10 | });
11 |
12 | const eslintConfig = [
13 | ...compat.extends("next/core-web-vitals", "next/typescript"),
14 | ];
15 |
16 | export default eslintConfig;
17 |
--------------------------------------------------------------------------------
/examples/quick_start/ui/eslint.config.mjs:
--------------------------------------------------------------------------------
1 | import { dirname } from "path";
2 | import { fileURLToPath } from "url";
3 | import { FlatCompat } from "@eslint/eslintrc";
4 |
5 | const __filename = fileURLToPath(import.meta.url);
6 | const __dirname = dirname(__filename);
7 |
8 | const compat = new FlatCompat({
9 | baseDirectory: __dirname,
10 | });
11 |
12 | const eslintConfig = [
13 | ...compat.extends("next/core-web-vitals", "next/typescript"),
14 | ];
15 |
16 | export default eslintConfig;
17 |
--------------------------------------------------------------------------------
/tests/apiserver/data/python_dependencies_kitchen_sink.yaml:
--------------------------------------------------------------------------------
1 | name: MyDeployment
2 |
3 | control-plane:
4 | port: 8000
5 |
6 | message-queue:
7 | type: simple
8 | host: "127.0.0.1"
9 | port: 8001
10 |
11 | default-service: myworkflow
12 |
13 | services:
14 | myworkflow:
15 | name: My Python Workflow
16 | python-dependencies:
17 | - "test<1"
18 | - "./bar/requirements.txt"
19 | - "./foo/bar/" # pyproject.toml
20 | source:
21 | type: local
22 | location: test
23 |
--------------------------------------------------------------------------------
/llama_deploy/types/__init__.py:
--------------------------------------------------------------------------------
1 | from .apiserver import DeploymentDefinition, Status, StatusEnum
2 | from .core import (
3 | ChatMessage,
4 | EventDefinition,
5 | SessionDefinition,
6 | TaskDefinition,
7 | TaskResult,
8 | generate_id,
9 | )
10 |
11 | __all__ = [
12 | "ChatMessage",
13 | "EventDefinition",
14 | "SessionDefinition",
15 | "TaskDefinition",
16 | "TaskResult",
17 | "generate_id",
18 | "DeploymentDefinition",
19 | "Status",
20 | "StatusEnum",
21 | ]
22 |
--------------------------------------------------------------------------------
/tests/apiserver/data/with_ui.yaml:
--------------------------------------------------------------------------------
1 | name: test-deployment
2 |
3 | control-plane:
4 | port: 8000
5 |
6 | default-service: echo_workflow
7 |
8 | services:
9 | test-workflow:
10 | name: Test Workflow
11 | port: 8002
12 | host: localhost
13 | source:
14 | type: local
15 | location: workflow
16 | import-path: workflow:my_workflow
17 |
18 | ui:
19 | name: My Nextjs App
20 | source:
21 | type: git
22 | location: https://github.com/run-llama/llama_deploy.git
23 | import-path: src/ui
24 |
--------------------------------------------------------------------------------
/e2e_tests/apiserver/deployments/deployment_env_local.yml:
--------------------------------------------------------------------------------
1 | name: EnvironmentVariablesLocal
2 |
3 | control-plane:
4 | port: 8000
5 |
6 | default-service: test_env_workflow
7 |
8 | services:
9 | test_env_workflow:
10 | name: Workflow
11 | source:
12 | type: local
13 | name: src
14 | env:
15 | VAR_1: x # this gets overwritten because VAR_1 also exists in the provided .env
16 | VAR_2: y
17 | env-files:
18 | - src/.env # relative to source path
19 | path: src/workflow_env:workflow
20 |
--------------------------------------------------------------------------------
/tests/apiserver/test_settings.py:
--------------------------------------------------------------------------------
1 | from llama_deploy.apiserver.settings import ApiserverSettings
2 |
3 |
4 | def test_settings_url() -> None:
5 | s = ApiserverSettings()
6 | assert s.url == "http://127.0.0.1:4501"
7 |
8 | s = ApiserverSettings(use_tls=True)
9 | assert s.url == "https://127.0.0.1:4501"
10 |
11 | s = ApiserverSettings(host="example.com", port=8080)
12 | assert s.url == "http://example.com:8080"
13 |
14 | s = ApiserverSettings(host="example.com", port=80)
15 | assert s.url == "http://example.com"
16 |
--------------------------------------------------------------------------------
/e2e_tests/apiserver/deployments/deployment_env_git.yml:
--------------------------------------------------------------------------------
1 | name: EnvironmentVariablesGit
2 |
3 | control-plane:
4 | port: 8000
5 |
6 | services:
7 | workflow_git:
8 | name: Git Workflow
9 | source:
10 | type: git
11 | name: https://github.com/run-llama/llama_deploy.git
12 | env:
13 | VAR_1: x # this gets overwritten because VAR_1 also exists in the provided .env
14 | VAR_2: y
15 | env-files:
16 | - tests/apiserver/data/.env # relative to source path
17 | path: tests/apiserver/data/workflow:env_reader_workflow
18 |
--------------------------------------------------------------------------------
/e2e_tests/apiserver/deployments/src/workflow_hitl.py:
--------------------------------------------------------------------------------
1 | from workflows import Workflow, step
2 | from workflows.events import (
3 | HumanResponseEvent,
4 | InputRequiredEvent,
5 | StartEvent,
6 | StopEvent,
7 | )
8 |
9 |
10 | class HumanInTheLoopWorkflow(Workflow):
11 | @step
12 | async def step1(self, ev: StartEvent) -> InputRequiredEvent:
13 | return InputRequiredEvent(prefix="Enter a number: ")
14 |
15 | @step
16 | async def step2(self, ev: HumanResponseEvent) -> StopEvent:
17 | return StopEvent(result=ev.response)
18 |
19 |
20 | workflow = HumanInTheLoopWorkflow(timeout=3)
21 |
--------------------------------------------------------------------------------
/templates/basic/ui/app/globals.css:
--------------------------------------------------------------------------------
1 | @import "tailwindcss";
2 |
3 | :root {
4 | --background: #ffffff;
5 | --foreground: #171717;
6 | }
7 |
8 | @theme inline {
9 | --color-background: var(--background);
10 | --color-foreground: var(--foreground);
11 | --font-sans: var(--font-geist-sans);
12 | --font-mono: var(--font-geist-mono);
13 | }
14 |
15 | @media (prefers-color-scheme: dark) {
16 | :root {
17 | --background: #0a0a0a;
18 | --foreground: #ededed;
19 | }
20 | }
21 |
22 | body {
23 | background: var(--background);
24 | color: var(--foreground);
25 | font-family: Arial, Helvetica, sans-serif;
26 | }
27 |
--------------------------------------------------------------------------------
/examples/quick_start/ui/app/globals.css:
--------------------------------------------------------------------------------
1 | @import "tailwindcss";
2 |
3 | :root {
4 | --background: #ffffff;
5 | --foreground: #171717;
6 | }
7 |
8 | @theme inline {
9 | --color-background: var(--background);
10 | --color-foreground: var(--foreground);
11 | --font-sans: var(--font-geist-sans);
12 | --font-mono: var(--font-geist-mono);
13 | }
14 |
15 | @media (prefers-color-scheme: dark) {
16 | :root {
17 | --background: #0a0a0a;
18 | --foreground: #ededed;
19 | }
20 | }
21 |
22 | body {
23 | background: var(--background);
24 | color: var(--foreground);
25 | font-family: Arial, Helvetica, sans-serif;
26 | }
27 |
--------------------------------------------------------------------------------
/examples/python_fullstack/workflows/dockerfile:
--------------------------------------------------------------------------------
1 | FROM python:3.10-slim
2 |
3 | EXPOSE 8002
4 | EXPOSE 8003
5 |
6 | WORKDIR /app
7 |
8 | # Copy source code
9 | COPY . .
10 |
11 | # Install libraries for necessary python package builds
12 | RUN apt-get clean && apt-get update \
13 | && apt-get --no-install-recommends install build-essential python3-dev libpq-dev curl -y \
14 | && pip install --no-cache-dir --upgrade pip \
15 | && apt-get -yq update && apt-get -yqq install ssh \
16 | && apt-get clean \
17 | && pip install -r requirements.txt
18 |
19 | # Run the deploy.py script
20 | ENTRYPOINT ["python", "./deploy.py"]
21 |
--------------------------------------------------------------------------------
/docs/docs/_static/js/leadfeeder.js:
--------------------------------------------------------------------------------
1 | (function (ss, ex) {
2 | window.ldfdr =
3 | window.ldfdr ||
4 | function () {
5 | (ldfdr._q = ldfdr._q || []).push([].slice.call(arguments));
6 | };
7 | (function (d, s) {
8 | fs = d.getElementsByTagName(s)[0];
9 | function ce(src) {
10 | var cs = d.createElement(s);
11 | cs.src = src;
12 | cs.async = 1;
13 | fs.parentNode.insertBefore(cs, fs);
14 | }
15 | ce(
16 | "https://sc.lfeeder.com/lftracker_v1_" +
17 | ss +
18 | (ex ? "_" + ex : "") +
19 | ".js",
20 | );
21 | })(document, "script");
22 | })("Xbp1oaEnqwn8EdVj");
23 |
--------------------------------------------------------------------------------
/tests/apiserver/data/workflow/workflow_test.py:
--------------------------------------------------------------------------------
1 | import os
2 |
3 | from workflows import Context, Workflow, step
4 | from workflows.events import StartEvent, StopEvent
5 |
6 |
7 | class MyWorkflow(Workflow):
8 | @step
9 | def do_something(self, ctx: Context, ev: StartEvent) -> StopEvent:
10 | return StopEvent(result=f"Received: {ev.data}")
11 |
12 |
13 | class _TestEnvWorkflow(Workflow):
14 | @step()
15 | async def read_env_vars(self, ctx: Context, ev: StartEvent) -> StopEvent:
16 | env_vars = [f"{v}: {os.environ.get(v)}" for v in ev.get("env_vars_to_read")]
17 | return StopEvent(result=", ".join(env_vars))
18 |
--------------------------------------------------------------------------------
/e2e_tests/apiserver/test_status.py:
--------------------------------------------------------------------------------
1 | import pytest
2 |
3 |
4 | @pytest.mark.asyncio
5 | async def test_status_down(client):
6 | res = await client.apiserver.status()
7 | assert res.status.value == "Down"
8 |
9 |
10 | def test_status_down_sync(client):
11 | res = client.sync.apiserver.status()
12 | assert res.status.value == "Down"
13 |
14 |
15 | @pytest.mark.asyncio
16 | async def test_status_up(apiserver, client):
17 | res = await client.apiserver.status()
18 | assert res.status.value == "Healthy"
19 |
20 |
21 | def test_status_up_sync(apiserver, client):
22 | res = client.sync.apiserver.status()
23 | assert res.status.value == "Healthy"
24 |
--------------------------------------------------------------------------------
/templates/basic/ui/.gitignore:
--------------------------------------------------------------------------------
1 | # See https://help.github.com/articles/ignoring-files/ for more about ignoring files.
2 |
3 | # dependencies
4 | /node_modules
5 | /.pnp
6 | .pnp.*
7 | .yarn/*
8 | !.yarn/patches
9 | !.yarn/plugins
10 | !.yarn/releases
11 | !.yarn/versions
12 |
13 | # testing
14 | /coverage
15 |
16 | # next.js
17 | /.next/
18 | /out/
19 |
20 | # production
21 | /build
22 |
23 | # misc
24 | .DS_Store
25 | *.pem
26 |
27 | # debug
28 | npm-debug.log*
29 | yarn-debug.log*
30 | yarn-error.log*
31 | .pnpm-debug.log*
32 |
33 | # env files (can opt-in for committing if needed)
34 | .env*
35 |
36 | # vercel
37 | .vercel
38 |
39 | # typescript
40 | *.tsbuildinfo
41 | next-env.d.ts
42 |
--------------------------------------------------------------------------------
/examples/quick_start/ui/.gitignore:
--------------------------------------------------------------------------------
1 | # See https://help.github.com/articles/ignoring-files/ for more about ignoring files.
2 |
3 | # dependencies
4 | /node_modules
5 | /.pnp
6 | .pnp.*
7 | .yarn/*
8 | !.yarn/patches
9 | !.yarn/plugins
10 | !.yarn/releases
11 | !.yarn/versions
12 |
13 | # testing
14 | /coverage
15 |
16 | # next.js
17 | /.next/
18 | /out/
19 |
20 | # production
21 | /build
22 |
23 | # misc
24 | .DS_Store
25 | *.pem
26 |
27 | # debug
28 | npm-debug.log*
29 | yarn-debug.log*
30 | yarn-error.log*
31 | .pnpm-debug.log*
32 |
33 | # env files (can opt-in for committing if needed)
34 | .env*
35 |
36 | # vercel
37 | .vercel
38 |
39 | # typescript
40 | *.tsbuildinfo
41 | next-env.d.ts
42 |
--------------------------------------------------------------------------------
/examples/quick_start/src/workflow.py:
--------------------------------------------------------------------------------
1 | import asyncio
2 |
3 | from workflows import Workflow, step
4 | from workflows.events import StartEvent, StopEvent
5 |
6 |
7 | # create a dummy workflow
8 | class EchoWorkflow(Workflow):
9 | """A dummy workflow with only one step sending back the input given."""
10 |
11 | @step()
12 | async def run_step(self, ev: StartEvent) -> StopEvent:
13 | message = str(ev.get("message", ""))
14 | return StopEvent(result=f"Message received: {message}")
15 |
16 |
17 | echo_workflow = EchoWorkflow()
18 |
19 |
20 | async def main():
21 | print(await echo_workflow.run(message="Hello!"))
22 |
23 |
24 | if __name__ == "__main__":
25 | asyncio.run(main())
26 |
--------------------------------------------------------------------------------
/e2e_tests/apiserver/test_env_vars_local.py:
--------------------------------------------------------------------------------
1 | from pathlib import Path
2 |
3 | import pytest
4 |
5 | from llama_deploy.types.core import TaskDefinition
6 |
7 |
8 | @pytest.mark.asyncio
9 | async def test_read_env_vars_local(apiserver, client):
10 | here = Path(__file__).parent
11 | deployment_fp = here / "deployments" / "deployment_env_local.yml"
12 | with open(deployment_fp) as f:
13 | deployment = await client.apiserver.deployments.create(
14 | f, base_path=deployment_fp.parent
15 | )
16 |
17 | result = await deployment.tasks.run(
18 | TaskDefinition(service_id="test_env_workflow", input="")
19 | )
20 |
21 | assert result == "var_1: z, var_2: y, api_key: 123"
22 |
--------------------------------------------------------------------------------
/examples/google_cloud_run/src/workflow.py:
--------------------------------------------------------------------------------
1 | import asyncio
2 |
3 | from workflows import Workflow, step
4 | from workflows.events import StartEvent, StopEvent
5 |
6 |
7 | # create a dummy workflow
8 | class EchoWorkflow(Workflow):
9 | """A dummy workflow with only one step sending back the input given."""
10 |
11 | @step()
12 | async def run_step(self, ev: StartEvent) -> StopEvent:
13 | message = str(ev.get("message", ""))
14 | return StopEvent(result=f"Message received: {message}")
15 |
16 |
17 | echo_workflow = EchoWorkflow()
18 |
19 |
20 | async def main():
21 | print(await echo_workflow.run(message="Hello!"))
22 |
23 |
24 | if __name__ == "__main__":
25 | asyncio.run(main())
26 |
--------------------------------------------------------------------------------
/templates/basic/ui/tsconfig.json:
--------------------------------------------------------------------------------
1 | {
2 | "compilerOptions": {
3 | "target": "ES2017",
4 | "lib": ["dom", "dom.iterable", "esnext"],
5 | "allowJs": true,
6 | "skipLibCheck": true,
7 | "strict": true,
8 | "noEmit": true,
9 | "esModuleInterop": true,
10 | "module": "esnext",
11 | "moduleResolution": "bundler",
12 | "resolveJsonModule": true,
13 | "isolatedModules": true,
14 | "jsx": "preserve",
15 | "incremental": true,
16 | "plugins": [
17 | {
18 | "name": "next"
19 | }
20 | ],
21 | "paths": {
22 | "@/*": ["./*"]
23 | }
24 | },
25 | "include": ["next-env.d.ts", "**/*.ts", "**/*.tsx", ".next/types/**/*.ts"],
26 | "exclude": ["node_modules"]
27 | }
28 |
--------------------------------------------------------------------------------
/examples/quick_start/ui/tsconfig.json:
--------------------------------------------------------------------------------
1 | {
2 | "compilerOptions": {
3 | "target": "ES2017",
4 | "lib": ["dom", "dom.iterable", "esnext"],
5 | "allowJs": true,
6 | "skipLibCheck": true,
7 | "strict": true,
8 | "noEmit": true,
9 | "esModuleInterop": true,
10 | "module": "esnext",
11 | "moduleResolution": "bundler",
12 | "resolveJsonModule": true,
13 | "isolatedModules": true,
14 | "jsx": "preserve",
15 | "incremental": true,
16 | "plugins": [
17 | {
18 | "name": "next"
19 | }
20 | ],
21 | "paths": {
22 | "@/*": ["./*"]
23 | }
24 | },
25 | "include": ["next-env.d.ts", "**/*.ts", "**/*.tsx", ".next/types/**/*.ts"],
26 | "exclude": ["node_modules"]
27 | }
28 |
--------------------------------------------------------------------------------
/templates/basic/ui/package.json:
--------------------------------------------------------------------------------
1 | {
2 | "name": "ui",
3 | "version": "0.1.0",
4 | "private": true,
5 | "scripts": {
6 | "dev": "next dev --turbopack",
7 | "build": "next build",
8 | "start": "next start",
9 | "lint": "next lint"
10 | },
11 | "dependencies": {
12 | "@heroicons/react": "^2.2.0",
13 | "next": "15.4.7",
14 | "react": "^19.0.0",
15 | "react-dom": "^19.0.0"
16 | },
17 | "devDependencies": {
18 | "@eslint/eslintrc": "^3",
19 | "@tailwindcss/postcss": "^4",
20 | "@types/node": "^20",
21 | "@types/react": "^19",
22 | "@types/react-dom": "^19",
23 | "eslint": "^9",
24 | "eslint-config-next": "15.3.2",
25 | "tailwindcss": "^4",
26 | "typescript": "^5"
27 | }
28 | }
29 |
--------------------------------------------------------------------------------
/e2e_tests/README.md:
--------------------------------------------------------------------------------
1 | # E2E Tests
2 |
3 | E2E tests are run by the workflow defined in `.github/workflows/e2e_test.yml`.
4 |
5 | Each folder in this directory contains a Python package representing a set of tests for a simple scenario.
6 |
7 | When new folders are added, they will be executed automatically in the CI/CD pipeline by `pytest`.
8 |
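A new scenario module typically mirrors the existing ones and relies on the `apiserver` and `client` fixtures provided by the scenario's `conftest.py`. A minimal sketch (the test name is just an example), modeled on `test_status.py`:

```python
import pytest


@pytest.mark.asyncio
async def test_my_scenario(apiserver, client):
    # `apiserver` and `client` are pytest fixtures from the scenario's conftest.py
    res = await client.apiserver.status()
    assert res.status.value == "Healthy"
```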
9 | To run all the tests:
10 |
11 | ```sh
12 | $ uv run -- pytest -m"e2e"
13 | ```
14 | or
15 | ```sh
16 | $ uv run -- pytest ./e2e_tests
17 | ```
18 |
19 | To run a specific scenario:
20 |
21 | ```sh
22 | $ uv run -- pytest e2e_tests/apiserver
23 | ```
24 |
25 | If you want to see the output of the different services running, pass the `-s` flag to pytest:
26 |
27 | ```sh
28 | $ uv run -- pytest e2e_tests/apiserver/test_deploy.py -s
29 | ```
30 |
--------------------------------------------------------------------------------
/examples/google_cloud_run/Dockerfile:
--------------------------------------------------------------------------------
1 | FROM llamaindex/llama-deploy:main
2 |
3 | # This will be passed at build time
4 | ARG SOURCE_DIR=""
5 |
6 | # Copy the application code (for example, your workflow)
7 | COPY ${SOURCE_DIR} /app/code
8 | WORKDIR /app/code
9 |
10 | # Deploy automatically what's in /app/code when the container starts
11 | ENV LLAMA_DEPLOY_APISERVER_RC_PATH=/app/code
12 | COPY deployment.yml /app/code
13 |
14 | # Cloud Run requires the container to listen to port 8080
15 | ENV LLAMA_DEPLOY_APISERVER_HOST=0.0.0.0
16 | ENV LLAMA_DEPLOY_APISERVER_PORT=8080
17 | EXPOSE 8080
18 |
19 | # In Cloud Run localhost resolves to the public URI on port 80,
20 | # let's override the default and point explicitly to the internal
21 | # host and port
22 | ENV LLAMA_DEPLOY_API_SERVER_URL="http://127.0.0.1:8080"
23 |
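24 | # Example build command (illustrative; adjust SOURCE_DIR to where your workflow code
25 | # lives relative to the build context, which must also contain deployment.yml):
26 | #   docker build --build-arg SOURCE_DIR=./src -t my-llama-deploy-app .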
--------------------------------------------------------------------------------
/templates/basic/ui/app/layout.tsx:
--------------------------------------------------------------------------------
1 | import type { Metadata } from "next";
2 | import { Geist, Geist_Mono } from "next/font/google";
3 | import "./globals.css";
4 |
5 | const geistSans = Geist({
6 | variable: "--font-geist-sans",
7 | });
8 |
9 | const geistMono = Geist_Mono({
10 | variable: "--font-geist-mono",
11 | });
12 |
13 | export const metadata: Metadata = {
14 | title: "Create Next App",
15 | description: "Generated by create next app",
16 | };
17 |
18 | export default function RootLayout({
19 | children,
20 | }: Readonly<{
21 | children: React.ReactNode;
22 | }>) {
23 | return (
24 |     <html lang="en">
25 |       <body
26 |         className={`${geistSans.variable} ${geistMono.variable} antialiased`}
27 |       >
28 |         {children}
29 |       </body>
30 |     </html>
31 | );
32 | }
33 |
--------------------------------------------------------------------------------
/e2e_tests/apiserver/test_env_vars_git.py:
--------------------------------------------------------------------------------
1 | import json
2 | from pathlib import Path
3 |
4 | import pytest
5 |
6 | from llama_deploy.types.core import TaskDefinition
7 |
8 |
9 | @pytest.mark.asyncio
10 | async def test_read_env_vars_git(apiserver, client):
11 | here = Path(__file__).parent
12 | deployment_fp = here / "deployments" / "deployment_env_git.yml"
13 | with open(deployment_fp) as f:
14 | deployment = await client.apiserver.deployments.create(
15 | f, base_path=deployment_fp.parent
16 | )
17 |
18 | input_str = json.dumps({"env_vars_to_read": ["VAR_1", "VAR_2", "API_KEY"]})
19 | result = await deployment.tasks.run(
20 | TaskDefinition(service_id="workflow_git", input=input_str)
21 | )
22 |
23 | assert result == "VAR_1: x, VAR_2: y, API_KEY: 123"
24 |
--------------------------------------------------------------------------------
/examples/quick_start/ui/app/layout.tsx:
--------------------------------------------------------------------------------
1 | import type { Metadata } from "next";
2 | import { Geist, Geist_Mono } from "next/font/google";
3 | import "./globals.css";
4 |
5 | const geistSans = Geist({
6 | variable: "--font-geist-sans",
7 | });
8 |
9 | const geistMono = Geist_Mono({
10 | variable: "--font-geist-mono",
11 | });
12 |
13 | export const metadata: Metadata = {
14 | title: "Create Next App",
15 | description: "Generated by create next app",
16 | };
17 |
18 | export default function RootLayout({
19 | children,
20 | }: Readonly<{
21 | children: React.ReactNode;
22 | }>) {
23 | return (
24 |     <html lang="en">
25 |       <body
26 |         className={`${geistSans.variable} ${geistMono.variable} antialiased`}
27 |       >
28 |         {children}
29 |       </body>
30 |     </html>
31 | );
32 | }
33 |
--------------------------------------------------------------------------------
/templates/basic/src/workflow.py:
--------------------------------------------------------------------------------
1 | import asyncio
2 |
3 | from llama_index.llms.openai import OpenAI
4 | from workflows import Workflow, step
5 | from workflows.events import StartEvent, StopEvent
6 |
7 |
8 | # create a completion workflow
9 | class CompletionWorkflow(Workflow):
10 | """A completion workflow with a single step."""
11 |
12 | llm: OpenAI = OpenAI(model="gpt-4.1-nano")
13 |
14 | @step()
15 | async def run_step(self, ev: StartEvent) -> StopEvent:
16 | message = str(ev.get("message", ""))
17 | response = await self.llm.acomplete(message)
18 | return StopEvent(result=response.text)
19 |
20 |
21 | workflow = CompletionWorkflow()
22 |
23 |
24 | async def main() -> None:
25 | print(await workflow.run(message="Hello!"))
26 |
27 |
28 | if __name__ == "__main__":
29 | asyncio.run(main())
30 |
--------------------------------------------------------------------------------
/examples/python_fullstack/frontend/dockerfile:
--------------------------------------------------------------------------------
1 | # This Dockerfile is used to deploy a simple single-container Reflex app instance.
2 | FROM python:3.10-slim
3 |
4 | # Copy local context to `/app` inside container (see .dockerignore)
5 | WORKDIR /app
6 | COPY . .
7 |
8 | # Install app requirements and reflex in the container
9 | # Deploy templates and prepare app
10 | # Download all npm dependencies and compile frontend
11 | RUN apt-get clean && apt-get update \
12 | && apt-get --no-install-recommends install zip unzip curl -y \
13 | && pip install -r requirements.txt \
14 | && reflex export --frontend-only --no-zip
15 |
16 | # Needed until Reflex properly passes SIGTERM on backend.
17 | STOPSIGNAL SIGKILL
18 |
19 | # Always apply migrations before starting the backend.
20 | CMD [ -d alembic ] && reflex db migrate; reflex run --env prod
21 |
--------------------------------------------------------------------------------
/examples/llamacloud/google_drive/deployment.yml:
--------------------------------------------------------------------------------
1 | name: LlamaCloud_LlamaDeploy_GoogleDrive
2 |
3 | control-plane:
4 | port: 8000
5 |
6 | default-service: llamacloud_workflow
7 |
8 | services:
9 | llamacloud_workflow:
10 | name: LlamaCloud GoogleDrive Data Source Workflow
11 | # We tell LlamaDeploy where to look for our workflow
12 | source:
13 | # In this case, we instruct LlamaDeploy to look in the local filesystem
14 | type: local
15 |       # The path, relative to this deployment config file, where to look for the code. This assumes
16 |       # there's an src folder next to the config file containing the workflow.py file we created previously
17 | name: ./src
18 |       # This assumes the file workflow.py contains a variable called `llamacloud_workflow` holding our workflow instance
19 | path: workflow:llamacloud_workflow
20 |
--------------------------------------------------------------------------------
/docs/pyproject.toml:
--------------------------------------------------------------------------------
1 | [build-system]
2 | requires = ["hatchling"]
3 | build-backend = "hatchling.build"
4 |
5 | [project]
6 | name = "docs"
7 | version = "0.1.0"
8 | description = ""
9 | authors = [{name = "Your Name", email = "you@example.com"}]
10 | requires-python = "~=3.11"
11 | readme = "README.md"
12 | dependencies = [
13 | "llama_deploy[awssqs, rabbitmq, kafka, redis]",
14 | "mkdocs>=1.6.1,<2",
15 | "mkdocstrings[python]>=0.26.1,<0.27",
16 | "mkdocs-include-dir-to-nav>=1.2.0,<2",
17 | "mkdocs-material>=9.5.39,<10",
18 | "mkdocs-redirects>=1.2.1,<2",
19 | "mkdocs-click>=0.8.1,<0.9",
20 | "mkdocs-render-swagger-plugin>=0.1.2,<0.2",
21 | "griffe-fieldz>=0.2.0,<0.3",
22 | "mkdocs-github-admonitions-plugin>=0.0.3,<0.0.4"
23 | ]
24 |
25 | [tool.uv]
26 | package = false
27 |
28 | [tool.uv.sources]
29 | llama_deploy = {path = "../", editable = true}
30 |
--------------------------------------------------------------------------------
/.github/workflows/e2e_test.yml:
--------------------------------------------------------------------------------
1 | name: E2E Testing
2 |
3 | on:
4 | push:
5 | branches:
6 | - main
7 | pull_request:
8 |
9 | jobs:
10 | e2e-tests:
11 | runs-on: ubuntu-latest
12 | # E2E tests might get stuck, timeout aggressively for faster feedback
13 | timeout-minutes: 10
14 | strategy:
15 | # Let the matrix finish to see if the failure was transient
16 | fail-fast: false
17 | matrix:
18 | python-version: ["3.10", "3.11", "3.12"]
19 | test-package: ["apiserver"]
20 | steps:
21 | - uses: actions/checkout@v3
22 |
23 | - name: Install uv and set the python version
24 | uses: astral-sh/setup-uv@v5
25 | with:
26 | python-version: ${{ matrix.python-version }}
27 |
28 | - name: Run All E2E Tests
29 | run: uv run -- pytest e2e_tests/${{ matrix.test-package }} -s
30 |
--------------------------------------------------------------------------------
/llama_deploy/apiserver/stats.py:
--------------------------------------------------------------------------------
1 | from prometheus_client import Enum
2 |
3 | apiserver_state = Enum(
4 | "apiserver_state",
5 | "Current state of the API server",
6 | states=[
7 | "starting",
8 | "running",
9 | "stopped",
10 | ],
11 | )
12 |
13 | deployment_state = Enum(
14 | "deployment_state",
15 | "Current state of a deployment",
16 | ["deployment_name"],
17 | states=[
18 | "loading_services",
19 | "ready",
20 | "starting_services",
21 | "running",
22 | "stopped",
23 | ],
24 | )
25 |
26 | service_state = Enum(
27 | "service_state",
28 | "Current state of a service attached to a deployment",
29 | ["deployment_name", "service_name"],
30 | states=[
31 | "loading",
32 | "syncing",
33 | "installing",
34 | "ready",
35 | ],
36 | )
37 |
--------------------------------------------------------------------------------
/tests/cli/test_cli.py:
--------------------------------------------------------------------------------
1 | from unittest import mock
2 |
3 | from click.testing import CliRunner
4 |
5 | from llama_deploy.cli import llamactl
6 | from llama_deploy.cli.__main__ import main
7 |
8 |
9 | @mock.patch("llama_deploy.cli.__main__.sys")
10 | @mock.patch("llama_deploy.cli.__main__.llamactl")
11 | def test_main(mocked_cli, mocked_sys) -> None: # type: ignore
12 | mocked_cli.return_value = 0
13 | main()
14 | mocked_sys.exit.assert_called_with(0)
15 |
16 |
17 | def test_root_command(runner: CliRunner) -> None:
18 | result = runner.invoke(llamactl)
19 | assert result.exit_code == 0
20 | # Ensure invoking the root command outputs the help
21 | assert "Usage: llamactl" in result.output
22 |
23 |
24 | def test_wrong_profile(runner: CliRunner) -> None:
25 | result = runner.invoke(llamactl, ["-p", "foo"])
26 | assert result.exit_code == 1
27 |
--------------------------------------------------------------------------------
/examples/python_fullstack/python_fullstack.yaml:
--------------------------------------------------------------------------------
1 | name: MyDeployment
2 |
3 | control-plane:
4 | port: 8000
5 |
6 | message-queue:
7 | type: redis
8 | # what follows depends on what's in the docker compose file
9 | host: redis
10 | port: 6379
11 |
12 | default-service: agentic_workflow
13 |
14 | services:
15 | agentic_workflow:
16 | name: Agentic Workflow
17 | source:
18 | type: local
19 | name: .
20 | path: workflows:agentic_w
21 | python-dependencies:
22 | - llama-index-postprocessor-rankgpt-rerank>=0.2.0
23 | - llama-index-vector-stores-qdrant>=0.3.0
24 | - llama-index-llms-openai>=0.2.2
25 | - llama-index-embeddings-openai>=0.2.4
26 | - llama-index-readers-file>=0.2.0
27 |
28 | rag_workflow:
29 | name: RAG Workflow
30 | source:
31 | type: local
32 | name: .
33 | path: workflows:rag_w
34 |
--------------------------------------------------------------------------------
/.github/workflows/publish_release.yml:
--------------------------------------------------------------------------------
1 | name: Publish llama-deploy to PyPI / GitHub
2 |
3 | on:
4 | workflow_dispatch:
5 | push:
6 | tags:
7 | - "v*"
8 |
9 | jobs:
10 | build-n-publish:
11 | name: Build and publish to PyPI
12 | if: github.repository == 'run-llama/llama_deploy'
13 | runs-on: ubuntu-latest
14 | permissions:
15 | contents: write
16 |
17 | steps:
18 | - uses: actions/checkout@v4
19 |
20 | - name: Install uv
21 | uses: astral-sh/setup-uv@v5
22 |
23 | - name: Build and publish
24 | env:
25 | UV_PUBLISH_TOKEN: ${{ secrets.LLAMA_AGENTS_PYPI_TOKEN }}
26 | run: |
27 | uv build
28 | uv publish
29 |
30 | - name: Create GitHub Release
31 | uses: ncipollo/release-action@v1
32 | with:
33 | artifacts: "dist/*"
34 | generateReleaseNotes: true
35 |
--------------------------------------------------------------------------------
/e2e_tests/apiserver/test_service_entrypoint.py:
--------------------------------------------------------------------------------
1 | import os
2 | import subprocess
3 | import time
4 |
5 | import requests
6 |
7 |
8 | def test_apiserver_entrypoint():
9 | # Customize host and port
10 | env = os.environ.copy()
11 | env["LLAMA_DEPLOY_APISERVER_HOST"] = "localhost"
12 | env["LLAMA_DEPLOY_APISERVER_PORT"] = "4502"
13 | # Start the API server as a subprocess
14 | process = subprocess.Popen(
15 | ["python", "-m", "llama_deploy.apiserver"],
16 | stdout=subprocess.PIPE,
17 | stderr=subprocess.PIPE,
18 | env=env,
19 | )
20 |
21 | try:
22 | # Wait a bit for the server to start
23 | time.sleep(2)
24 |
25 | response = requests.get("http://localhost:4502/status")
26 | assert response.status_code == 200
27 | finally:
28 | # Clean up: terminate the server process
29 | process.terminate()
30 | process.wait()
31 |
--------------------------------------------------------------------------------
/e2e_tests/apiserver/rc/src/workflow.py:
--------------------------------------------------------------------------------
1 | import asyncio
2 |
3 | from workflows import Context, Workflow, step
4 | from workflows.events import Event, StartEvent, StopEvent
5 |
6 |
7 | class Message(Event):
8 | text: str
9 |
10 |
11 | class EchoWorkflow(Workflow):
12 | """A dummy workflow streaming three events."""
13 |
14 | @step()
15 | async def run_step(self, ctx: Context, ev: StartEvent) -> StopEvent:
16 | for i in range(3):
17 | ctx.write_event_to_stream(Message(text=f"message number {i + 1}"))
18 | await asyncio.sleep(0.5)
19 |
20 | return StopEvent(result="Done.")
21 |
22 |
23 | echo_workflow = EchoWorkflow()
24 |
25 |
26 | async def main():
27 | h = echo_workflow.run(message="Hello!")
28 | async for ev in h.stream_events():
29 | if type(ev) is Message:
30 | print(ev.text)
31 | print(await h)
32 |
33 |
34 | if __name__ == "__main__":
35 | asyncio.run(main())
36 |
--------------------------------------------------------------------------------
/.github/workflows/unit_test.yml:
--------------------------------------------------------------------------------
1 | name: Unit Testing
2 |
3 | on:
4 | push:
5 | branches:
6 | - main
7 | pull_request:
8 |
9 | jobs:
10 | unit-tests:
11 | runs-on: ubuntu-latest
12 | strategy:
13 | # You can use PyPy versions in python-version.
14 | # For example, pypy-2.7 and pypy-3.8
15 | matrix:
16 | python-version: ["3.10", "3.11", "3.12"]
17 | steps:
18 | - uses: actions/checkout@v3
19 |
20 | - name: Install uv and set the python version
21 | uses: astral-sh/setup-uv@v5
22 | with:
23 | python-version: ${{ matrix.python-version }}
24 |
25 | - name: Run testing
26 | shell: bash
27 | run: uv run -- pytest --cov --cov-report=xml tests
28 |
29 | - if: matrix.python-version == '3.12'
30 | name: Report Coveralls
31 | uses: coverallsapp/github-action@v2
32 | env:
33 | COVERALLS_REPO_TOKEN: ${{ secrets.COVERALLS_REPO_TOKEN }}
34 |
--------------------------------------------------------------------------------
/examples/quick_start/ui/package.json:
--------------------------------------------------------------------------------
1 | {
2 | "name": "ui",
3 | "version": "0.1.0",
4 | "private": true,
5 | "scripts": {
6 | "dev": "next dev --turbopack",
7 | "build": "next build",
8 | "start": "next start",
9 | "lint": "next lint"
10 | },
11 | "dependencies": {
12 | "@types/canvas-confetti": "^1.9.0",
13 | "canvas-confetti": "^1.9.3",
14 | "next": "15.4.7",
15 | "react": "^19.0.0",
16 | "react-dom": "^19.0.0"
17 | },
18 | "devDependencies": {
19 | "@eslint/eslintrc": "^3",
20 | "@tailwindcss/postcss": "^4",
21 | "@types/node": "^20",
22 | "@types/react": "^19",
23 | "@types/react-dom": "^19",
24 | "eslint": "^9",
25 | "eslint-config-next": "15.3.2",
26 | "tailwindcss": "^4",
27 | "typescript": "^5"
28 | },
29 | "packageManager": "pnpm@10.11.0+sha512.6540583f41cc5f628eb3d9773ecee802f4f9ef9923cc45b69890fb47991d4b092964694ec3a4f738a420c918a333062c8b925d312f42e4f0c263eb603551f977"
30 | }
31 |
--------------------------------------------------------------------------------
/e2e_tests/apiserver/test_streaming.py:
--------------------------------------------------------------------------------
1 | from pathlib import Path
2 |
3 | import pytest
4 |
5 | from llama_deploy.types import TaskDefinition
6 |
7 |
8 | @pytest.mark.asyncio
9 | async def test_stream(apiserver, client):
10 | here = Path(__file__).parent
11 | deployment_fp = here / "deployments" / "deployment_streaming.yml"
12 | with open(deployment_fp) as f:
13 | deployment = await client.apiserver.deployments.create(
14 | f, base_path=deployment_fp.parent
15 | )
16 |
17 | task = await deployment.tasks.create(TaskDefinition(input='{"a": "b"}'))
18 |
19 | read_events = []
20 | async for ev in task.events():
21 | if ev and "text" in ev:
22 | read_events.append(ev)
23 | assert len(read_events) == 3
24 | # the workflow produces events sequentially, so here we can assume events arrived in order
25 | for i, ev in enumerate(read_events):
26 | assert ev["text"] == f"message number {i + 1}"
27 |
--------------------------------------------------------------------------------
/e2e_tests/apiserver/deployments/src/workflow.py:
--------------------------------------------------------------------------------
1 | import asyncio
2 |
3 | from workflows import Context, Workflow, step
4 | from workflows.events import Event, StartEvent, StopEvent
5 |
6 |
7 | class Message(Event):
8 | text: str
9 |
10 |
11 | class EchoWorkflow(Workflow):
12 | """A dummy workflow streaming three events."""
13 |
14 | @step()
15 | async def run_step(self, ctx: Context, ev: StartEvent) -> StopEvent:
16 | for i in range(3):
17 | ctx.write_event_to_stream(Message(text=f"message number {i + 1}"))
18 | await asyncio.sleep(0.5)
19 |
20 | return StopEvent(result="Done.")
21 |
22 |
23 | streaming_workflow = EchoWorkflow()
24 |
25 |
26 | async def main():
27 | h = streaming_workflow.run(message="Hello!")
28 | async for ev in h.stream_events():
29 | if type(ev) is Message:
30 | print(ev.text)
31 | print(await h)
32 |
33 |
34 | if __name__ == "__main__":
35 | asyncio.run(main())
36 |
--------------------------------------------------------------------------------
/examples/python_fullstack/frontend/frontend/style.py:
--------------------------------------------------------------------------------
1 | # style.py
2 | import reflex as rx
3 |
4 | # Common styles for questions and answers.
5 | shadow = "rgba(0, 0, 0, 0.15) 0px 2px 8px"
6 | chat_margin = "20%"
7 | message_style = dict(
8 | padding="1em",
9 | border_radius="5px",
10 | margin_y="0.5em",
11 | box_shadow=shadow,
12 | max_width="30em",
13 | display="inline-block",
14 | )
15 |
16 | # Set specific styles for questions and answers.
17 | question_style = message_style | dict(
18 | background_color=rx.color("gray", 4),
19 | margin_left=chat_margin,
20 | )
21 | answer_style = message_style | dict(
22 | background_color=rx.color("accent", 8),
23 | margin_right=chat_margin,
24 | )
25 |
26 | # Styles for the action bar.
27 | input_style = dict(
28 | border_width="1px",
29 | padding="0.25em",
30 | box_shadow=shadow,
31 | width="350px",
32 | )
33 | button_style = dict(
34 | background_color=rx.color("accent", 10),
35 | box_shadow=shadow,
36 | )
37 |
--------------------------------------------------------------------------------
/examples/python_dependencies/workflow.py:
--------------------------------------------------------------------------------
1 | import asyncio
2 |
3 | from cowpy import cow
4 | from fortune import fortune
5 | from pyfiglet import Figlet
6 | from workflows import Workflow, step
7 | from workflows.events import StartEvent, StopEvent
8 |
9 |
10 | # create a dummy workflow
11 | class EchoWorkflow(Workflow):
12 |     """A workflow with a single step that renders the input as ASCII art plus a cow quoting a fortune."""
13 |
14 | @step()
15 | async def run_step(self, ev: StartEvent) -> StopEvent:
16 | msg = str(ev.get("message", ""))
17 | font = str(ev.get("font", "blocky"))
18 | fortune_msg = fortune()
19 | f = Figlet(font=font)
20 | ascii_art_message = f.renderText(msg)
21 | ascii_art_message += cow.Stegosaurus().milk(fortune_msg)
22 | return StopEvent(result=ascii_art_message)
23 |
24 |
25 | echo_workflow = EchoWorkflow()
26 |
27 |
28 | async def main():
29 | print(await echo_workflow.run(message="Hello!"))
30 |
31 |
32 | if __name__ == "__main__":
33 | asyncio.run(main())
34 |
--------------------------------------------------------------------------------
/e2e_tests/apiserver/test_hitl.py:
--------------------------------------------------------------------------------
1 | import asyncio
2 | from pathlib import Path
3 |
4 | import pytest
5 | from workflows.events import HumanResponseEvent
6 |
7 | from llama_deploy.types import TaskDefinition
8 |
9 |
10 | @pytest.mark.asyncio
11 | async def test_hitl(apiserver, client):
12 | here = Path(__file__).parent
13 | deployment_fp = here / "deployments" / "deployment_hitl.yml"
14 | with open(deployment_fp) as f:
15 | deployment = await client.apiserver.deployments.create(
16 | f, base_path=deployment_fp.parent
17 | )
18 |
19 | task_handler = await deployment.tasks.create(TaskDefinition(input="{}"))
20 | ev_def = await task_handler.send_event(
21 | ev=HumanResponseEvent(response="42"), service_name="hitl_workflow"
22 | )
23 |
24 | # wait for workflow to finish
25 | await asyncio.sleep(0.1)
26 |
27 | result = await task_handler.results()
28 | assert ev_def.service_id == "hitl_workflow"
29 | assert result.result == "42", "The human's response is not consistent."
30 |
--------------------------------------------------------------------------------
/e2e_tests/apiserver/deployments/src/workflow_env.py:
--------------------------------------------------------------------------------
1 | import asyncio
2 | import os
3 |
4 | from workflows import Context, Workflow, step
5 | from workflows.events import StartEvent, StopEvent
6 |
7 |
8 | class MyWorkflow(Workflow):
9 | @step()
10 | async def run_step(self, ctx: Context, ev: StartEvent) -> StopEvent:
11 | var_1 = os.environ.get("VAR_1")
12 | var_2 = os.environ.get("VAR_2")
13 | api_key = os.environ.get("API_KEY")
14 | return StopEvent(
15 | # result depends on variables read from environment
16 | result=(f"var_1: {var_1}, var_2: {var_2}, api_key: {api_key}")
17 | )
18 |
19 |
20 | workflow = MyWorkflow()
21 |
22 |
23 | async def main(w: Workflow):
24 | h = w.run()
25 | print(await h)
26 |
27 |
28 | if __name__ == "__main__":
29 | import os
30 |
31 | # set env variables
32 | os.environ["VAR_1"] = "x"
33 |     os.environ["VAR_2"] = "y"
34 | os.environ["API_KEY"] = "123"
35 |
36 | w = MyWorkflow()
37 |
38 | asyncio.run(main(w))
39 |
--------------------------------------------------------------------------------
/e2e_tests/apiserver/test_reload.py:
--------------------------------------------------------------------------------
1 | from pathlib import Path
2 |
3 | import pytest
4 |
5 | from llama_deploy.types import TaskDefinition
6 |
7 |
8 | @pytest.mark.asyncio
9 | async def test_reload(apiserver, client):
10 | here = Path(__file__).parent
11 | deployment_fp = here / "deployments" / "deployment_reload1.yml"
12 | with open(deployment_fp) as f:
13 | deployment = await client.apiserver.deployments.create(
14 | f, base_path=deployment_fp.parent
15 | )
16 |
17 | tasks = deployment.tasks
18 | res = await tasks.run(TaskDefinition(input='{"data": "bar"}'))
19 | assert res == "I have received:bar"
20 |
21 | deployment_fp = here / "deployments" / "deployment_reload2.yml"
22 | with open(deployment_fp) as f:
23 | deployment = await client.apiserver.deployments.create(
24 | f, base_path=deployment_fp.parent, reload=True
25 | )
26 |
27 | tasks = deployment.tasks
28 | res = await tasks.run(TaskDefinition(input='{"data": "bar"}'))
29 | assert res == "Ho ricevuto:bar"
30 |
--------------------------------------------------------------------------------
/llama_deploy/cli/sessions.py:
--------------------------------------------------------------------------------
1 | import click
2 |
3 | from llama_deploy.client import Client
4 |
5 | from .internal.config import ConfigProfile
6 |
7 |
8 | @click.group()
9 | def sessions() -> None:
10 | """Manage sessions for a given deployment."""
11 | pass
12 |
13 |
14 | @click.command()
15 | @click.pass_obj # config_profile
16 | @click.option(
17 | "-d", "--deployment", required=True, is_flag=False, help="Deployment name"
18 | )
19 | @click.pass_context
20 | def create(
21 | ctx: click.Context,
22 | config_profile: ConfigProfile,
23 | deployment: str,
24 | ) -> None:
25 | client = Client(
26 | api_server_url=config_profile.server,
27 | disable_ssl=config_profile.insecure,
28 | timeout=config_profile.timeout,
29 | )
30 |
31 | try:
32 | d = client.sync.apiserver.deployments.get(deployment)
33 | session_def = d.sessions.create()
34 | except Exception as e:
35 | raise click.ClickException(str(e))
36 |
37 | click.echo(session_def)
38 |
39 |
40 | sessions.add_command(create)
41 |
--------------------------------------------------------------------------------
/examples/python_dependencies/uv.lock:
--------------------------------------------------------------------------------
1 | version = 1
2 | revision = 2
3 | requires-python = ">=3.10, <4.0"
4 |
5 | [[package]]
6 | name = "pyfiglet"
7 | version = "1.0.3"
8 | source = { registry = "https://pypi.org/simple" }
9 | sdist = { url = "https://files.pythonhosted.org/packages/94/49/2554c0b7fef12c0b9633352bbd8751cc616f8e8880e0ebab7732c1535564/pyfiglet-1.0.3.tar.gz", hash = "sha256:bad3b55d2eccb30d4693ccfd94573c2a3477dd75f86a0e5465cea51bdbfe2875", size = 833445, upload-time = "2025-06-02T12:13:29.357Z" }
10 | wheels = [
11 | { url = "https://files.pythonhosted.org/packages/51/1d/f2cb03dd71a4dba891f808333fa505a6ed2762a8514d8ead7e423fa77e1b/pyfiglet-1.0.3-py3-none-any.whl", hash = "sha256:671bd101ca6a08dc2d94c6a2cda75a862c5e162b980af47d0ba4023837e36489", size = 1087203, upload-time = "2025-06-02T12:13:27.393Z" },
12 | ]
13 |
14 | [[package]]
15 | name = "uv-requirements"
16 | version = "0.1.0"
17 | source = { virtual = "." }
18 | dependencies = [
19 | { name = "pyfiglet" },
20 | ]
21 |
22 | [package.metadata]
23 | requires-dist = [{ name = "pyfiglet", specifier = ">=1.0.3" }]
24 |
--------------------------------------------------------------------------------
/LICENSE:
--------------------------------------------------------------------------------
1 | MIT License
2 |
3 | Copyright (c) 2024 LlamaIndex
4 |
5 | Permission is hereby granted, free of charge, to any person obtaining a copy
6 | of this software and associated documentation files (the "Software"), to deal
7 | in the Software without restriction, including without limitation the rights
8 | to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
9 | copies of the Software, and to permit persons to whom the Software is
10 | furnished to do so, subject to the following conditions:
11 |
12 | The above copyright notice and this permission notice shall be included in all
13 | copies or substantial portions of the Software.
14 |
15 | THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 | IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 | FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
18 | AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 | LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20 | OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
21 | SOFTWARE.
22 |
--------------------------------------------------------------------------------
/llama_deploy/cli/status.py:
--------------------------------------------------------------------------------
1 | import click
2 |
3 | from llama_deploy.client import Client
4 | from llama_deploy.types.apiserver import StatusEnum
5 |
6 | from .internal.config import ConfigProfile
7 |
8 |
9 | @click.command()
10 | @click.pass_obj # config_profile
11 | def status(config_profile: ConfigProfile) -> None:
12 | """Print the API Server status."""
13 | client = Client(
14 | api_server_url=config_profile.server,
15 | disable_ssl=config_profile.insecure,
16 | timeout=config_profile.timeout,
17 | )
18 |
19 | try:
20 | status = client.sync.apiserver.status()
21 | except Exception as e:
22 | raise click.ClickException(str(e))
23 |
24 | if status.status == StatusEnum.HEALTHY:
25 | click.echo("LlamaDeploy is up and running.")
26 | if status.deployments:
27 | click.echo("\nActive deployments:")
28 | for d in status.deployments:
29 | click.echo(f"- {d}")
30 | else:
31 | click.echo("\nCurrently there are no active deployments")
32 | else:
33 | click.echo(f"LlamaDeploy is unhealthy: {status.status_message}")
34 |
--------------------------------------------------------------------------------
/docs/README.md:
--------------------------------------------------------------------------------
1 | # LlamaDeploy Documentation
2 |
3 | This directory contains the documentation for LlamaDeploy, built with MkDocs and the Material theme.
4 |
5 | ## Setup
6 |
7 | ### Prerequisites
8 | - Python 3.11 or higher
9 | - uv (for dependency management)
10 |
11 | ### Installation
12 |
13 | 1. Clone the repository
14 | 2. Install dependencies using uv:
15 | ```bash
16 | uv sync
17 | ```
18 |
19 | ## Development
20 |
21 | To start the documentation server locally:
22 | ```bash
23 | uv run mkdocs serve
24 | ```
25 |
26 | This will start a development server at `http://127.0.0.1:8000`.
27 |
28 | ## Building
29 |
30 | LlamaDeploy is part of LlamaIndex [documentation portal](https://docs.llamaindex.ai/)
31 | so the build is performed from the [main repository](https://github.com/run-llama/llama_index).
32 |
33 | > [!WARNING]
34 | > When a documentation change is merged here, the change won't be visible until a new
35 | > build is triggered from the LlamaIndex repository.
36 |
37 |
38 | ## Contributing
39 |
40 | Contributions are very welcome!
41 |
42 | 1. Create a new branch for your changes
43 | 2. Make your changes to the documentation
44 | 3. Test locally using `uv run mkdocs serve`
45 | 4. Submit a pull request
46 |
--------------------------------------------------------------------------------
/docs/docs/css/style.css:
--------------------------------------------------------------------------------
1 | .md-container .jp-Cell-outputWrapper .jp-OutputPrompt.jp-OutputArea-prompt,
2 | .md-container .jp-Cell-inputWrapper .jp-InputPrompt.jp-InputArea-prompt {
3 | display: none !important;
4 | }
5 |
6 | /* CSS styles for side-by-side layout */
7 | .container {
8 |   display: flex;
9 | justify-content: space-between;
10 | margin-bottom: 20px; /* Adjust spacing between sections */
11 | position: sticky;
12 | top: 2.4rem;
13 | z-index: 1000; /* Ensure it's above other content */
14 | background-color: white; /* Match your page background */
15 | padding: 0.2rem;
16 | }
17 |
18 | .example-heading {
19 | margin: 0.2rem !important;
20 | }
21 |
22 | .usage-examples {
23 | width: 100%; /* Adjust the width as needed */
24 | border: 1px solid var(--md-default-fg-color--light);
25 | border-radius: 2px;
26 | padding: 0.2rem;
27 | }
28 |
29 | /* Additional styling for the toggle */
30 | .toggle-example {
31 | cursor: pointer;
32 | color: white;
33 | text-decoration: underline;
34 | background-color: var(--md-primary-fg-color);
35 | padding: 0.2rem;
36 | border-radius: 2px;
37 | }
38 |
39 | .hidden {
40 | display: none;
41 | }
42 |
43 | /* mendable search styling */
44 | #my-component-root > div {
45 | bottom: 100px;
46 | }
47 |
--------------------------------------------------------------------------------
/llama_deploy/client/base.py:
--------------------------------------------------------------------------------
1 | from typing import Any
2 |
3 | import httpx
4 | from pydantic_settings import BaseSettings, SettingsConfigDict
5 |
6 |
7 | class _BaseClient(BaseSettings):
8 | """Base type for clients, to be used in Pydantic models to avoid circular imports.
9 |
10 | Settings can be passed to the Client constructor when creating an instance, or defined with environment variables
11 | having names prefixed with the string `LLAMA_DEPLOY_`, e.g. `LLAMA_DEPLOY_DISABLE_SSL`.
12 | """
13 |
14 | model_config = SettingsConfigDict(env_prefix="LLAMA_DEPLOY_")
15 |
16 | api_server_url: str = "http://localhost:4501"
17 | disable_ssl: bool = False
18 | timeout: float | None = 120.0
19 | poll_interval: float = 0.5
20 |
21 | async def request(
22 | self, method: str, url: str | httpx.URL, **kwargs: Any
23 | ) -> httpx.Response:
24 | """Performs an async HTTP request using httpx."""
25 | verify = kwargs.pop("verify", True)
26 | timeout = kwargs.pop("timeout", self.timeout)
27 | async with httpx.AsyncClient(verify=verify) as client:
28 | response = await client.request(method, url, timeout=timeout, **kwargs)
29 | response.raise_for_status()
30 | return response
31 |
--------------------------------------------------------------------------------
/llama_deploy/apiserver/app.py:
--------------------------------------------------------------------------------
1 | import logging
2 | import os
3 |
4 | from fastapi import FastAPI
5 | from fastapi.middleware.cors import CORSMiddleware
6 | from fastapi.requests import Request
7 | from fastapi.responses import JSONResponse
8 |
9 | from .routers import deployments_router, status_router
10 | from .server import lifespan
11 | from .settings import settings
12 | from .tracing import configure_tracing
13 |
14 | logger = logging.getLogger("uvicorn.info")
15 |
16 |
17 | app = FastAPI(lifespan=lifespan)
18 |
19 | # Setup tracing
20 | configure_tracing(settings)
21 |
22 | # Configure CORS middleware unless it's explicitly disabled via the DISABLE_CORS environment variable
23 | if not os.environ.get("DISABLE_CORS", False):
24 | app.add_middleware(
25 | CORSMiddleware,
26 | allow_origins=["*"], # Allows all origins
27 | allow_credentials=True,
28 | allow_methods=["GET", "POST"],
29 | allow_headers=["Content-Type", "Authorization"],
30 | )
31 |
32 | app.include_router(deployments_router)
33 | app.include_router(status_router)
34 |
35 |
36 | @app.get("/")
37 | async def root(request: Request) -> JSONResponse:
38 | return JSONResponse(
39 | {
40 | "swagger_docs": f"{request.base_url}docs",
41 | "status": f"{request.base_url}status",
42 | }
43 | )
44 |
--------------------------------------------------------------------------------
/e2e_tests/apiserver/test_deploy.py:
--------------------------------------------------------------------------------
1 | from pathlib import Path
2 |
3 | import pytest
4 |
5 |
6 | @pytest.mark.asyncio
7 | async def test_deploy(apiserver, client):
8 | here = Path(__file__).parent
9 | deployment_fp = here / "deployments" / "deployment1.yml"
10 | with open(deployment_fp) as f:
11 | await client.apiserver.deployments.create(f, base_path=deployment_fp.parent)
12 |
13 | status = await client.apiserver.status()
14 | assert "TestDeployment1" in status.deployments
15 |
16 |
17 | def test_deploy_sync(apiserver, client):
18 | here = Path(__file__).parent
19 | deployment_fp = here / "deployments" / "deployment1.yml"
20 | with open(deployment_fp) as f:
21 | client.sync.apiserver.deployments.create(f, base_path=deployment_fp.parent)
22 |
23 | assert "TestDeployment1" in client.sync.apiserver.status().deployments
24 |
25 |
26 | @pytest.mark.asyncio
27 | async def test_deploy_local(apiserver, client):
28 | here = Path(__file__).parent
29 | deployment_fp = here / "deployments" / "deployment2.yml"
30 | with open(deployment_fp) as f:
31 | await client.apiserver.deployments.create(
32 | f, base_path=str(deployment_fp.parent.resolve())
33 | )
34 |
35 | status = await client.apiserver.status()
36 | assert "TestDeployment2" in status.deployments
37 |
--------------------------------------------------------------------------------
/tests/apiserver/data/example.yaml:
--------------------------------------------------------------------------------
1 | name: MyDeployment
2 |
3 | control-plane:
4 | port: 8000
5 |
6 | message-queue:
7 | type: simple
8 | host: "127.0.0.1"
9 | port: 8001
10 |
11 | default-service: myworkflow
12 |
13 | services:
14 | myworkflow:
15 | # A python workflow available in a git repo
16 | name: My Python Workflow
17 | source:
18 | type: git
19 | location: git@github.com/myorg/myrepo
20 | import-path: src/python/app # relative to root of the repo
21 | port: 1313
22 | python-dependencies:
23 | # this is a list to match the requirements.txt format
24 | - "llama-index-core<1"
25 | - "llama-index-llms-openai"
26 | # we can also support installing a req file relative to `path`
27 | # if source is a git repository
28 | - "requirements.txt"
29 | env:
30 | VAR_1: x
31 | VAR_2: y
32 | env-files:
33 | - ./.env
34 |
35 | another-workflow:
36 | # A LITS workflow available in a git repo (might be the same)
37 | name: My LITS Workflow
38 | source:
39 | type: git
40 | location: git@github.com/myorg/myrepo
41 | import-path: src/ts/app
42 | port: 1313
43 | ts-dependencies:
44 | # this is a mapping to match the package.json format
45 | "@llamaindex/core": "^0.2.0"
46 | "@notionhq/client": "^2.2.15"
47 |
--------------------------------------------------------------------------------
/.github/workflows/docker_release.yml:
--------------------------------------------------------------------------------
1 | name: Docker image release
2 |
3 | on:
4 | workflow_dispatch:
5 | push:
6 | branches:
7 | - main
8 | tags:
9 | - "v[0-9]+.[0-9]+.[0-9]+*"
10 |
11 | env:
12 | DOCKER_REPO_NAME: llamaindex/llama-deploy
13 |
14 | jobs:
15 | build-and-push:
16 | name: Build base image
17 | runs-on: ubuntu-latest
18 | # don't run from forks
19 | if: github.repository_owner == 'run-llama'
20 |
21 | steps:
22 | - name: Checkout
23 | uses: actions/checkout@v4
24 |
25 | - name: Set up QEMU
26 | uses: docker/setup-qemu-action@v3
27 |
28 | - name: Set up Docker Buildx
29 | uses: docker/setup-buildx-action@v3
30 |
31 | - name: Login to DockerHub
32 | uses: docker/login-action@v3
33 | with:
34 | username: ${{ secrets.DOCKER_HUB_USER }}
35 | password: ${{ secrets.DOCKER_HUB_TOKEN }}
36 |
37 | - name: Docker meta
38 | id: meta
39 | uses: docker/metadata-action@v5
40 | with:
41 |           images: ${{ env.DOCKER_REPO_NAME }}
42 |
43 | - name: Build images
44 | uses: docker/bake-action@v5
45 | env:
46 | IMAGE_TAG_SUFFIX: ${{ steps.meta.outputs.version }}
47 | LLAMA_DEPLOY_VERSION: ${{ steps.meta.outputs.version }}
48 | with:
49 | workdir: docker
50 | targets: all
51 | push: true
52 |
--------------------------------------------------------------------------------
/e2e_tests/apiserver/conftest.py:
--------------------------------------------------------------------------------
1 | import multiprocessing
2 | from pathlib import Path
3 |
4 | import httpx
5 | import pytest
6 | import uvicorn
7 | from tenacity import retry, wait_exponential
8 |
9 | from llama_deploy.client import Client
10 |
11 |
12 | def run_apiserver():
13 | uvicorn.run("llama_deploy.apiserver.app:app", host="127.0.0.1", port=4501)
14 |
15 |
16 | @retry(wait=wait_exponential(min=1, max=10))
17 | def wait_for_healthcheck():
18 | response = httpx.get("http://127.0.0.1:4501/status/")
19 | response.raise_for_status()
20 |
21 |
22 | @pytest.fixture(scope="function")
23 | def apiserver():
24 | ctx = multiprocessing.get_context("spawn")
25 | p = ctx.Process(target=run_apiserver)
26 | p.start()
27 | wait_for_healthcheck()
28 |
29 | yield
30 |
31 | p.terminate()
32 | p.join(timeout=3)
33 | if p.is_alive():
34 | p.kill()
35 |
36 |
37 | @pytest.fixture(scope="function")
38 | def apiserver_with_rc(monkeypatch):
39 | here = Path(__file__).parent
40 | rc_path = here / "rc"
41 | monkeypatch.setenv("LLAMA_DEPLOY_APISERVER_RC_PATH", str(rc_path))
42 |
43 | p = multiprocessing.Process(target=run_apiserver)
44 | p.start()
45 | wait_for_healthcheck()
46 |
47 | yield
48 |
49 | p.terminate()
50 | p.join(timeout=3)
51 | if p.is_alive():
52 | p.kill()
53 | p.close()
54 |
55 |
56 | @pytest.fixture
57 | def client():
58 | return Client(api_server_url="http://127.0.0.1:4501")
59 |
--------------------------------------------------------------------------------
/llama_deploy/cli/deploy.py:
--------------------------------------------------------------------------------
1 | from pathlib import Path
2 |
3 | import click
4 |
5 | from llama_deploy.client import Client
6 |
7 | from .internal.config import ConfigProfile
8 |
9 |
10 | @click.command()
11 | @click.pass_obj # config_profile
12 | @click.option("--reload", is_flag=True)
13 | @click.option(
14 | "--base-path",
15 | required=False,
16 | type=click.Path(file_okay=False, resolve_path=True, path_type=Path), # type: ignore
17 | )
18 | @click.argument(
19 | "deployment_config_file",
20 | type=click.Path(dir_okay=False, resolve_path=True, path_type=Path), # type: ignore
21 | )
22 | def deploy(
23 | config_profile: ConfigProfile,
24 | reload: bool,
25 | deployment_config_file: Path,
26 | base_path: Path | None,
27 | ) -> None:
28 | """Create or reload a deployment."""
29 | client = Client(
30 | api_server_url=config_profile.server,
31 | disable_ssl=config_profile.insecure,
32 | timeout=config_profile.timeout,
33 | )
34 |
35 | final_base_path = base_path or deployment_config_file.parent
36 |
37 | try:
38 | with open(deployment_config_file, "rb") as f:
39 | deployment = client.sync.apiserver.deployments.create(
40 | f,
41 | base_path=final_base_path,
42 | reload=reload,
43 | )
44 | except Exception as e:
45 | raise click.ClickException(str(e))
46 |
47 | click.echo(f"Deployment successful: {deployment.id}")
48 |
--------------------------------------------------------------------------------
/llama_deploy/client/client.py:
--------------------------------------------------------------------------------
1 | import asyncio
2 | from typing import Any
3 |
4 | from .base import _BaseClient
5 | from .models import ApiServer, make_sync
6 |
7 |
8 | class Client(_BaseClient):
9 | """The LlamaDeploy Python client.
10 |
11 |     The client gives access to both the asyncio and non-asyncio APIs. To access the sync
12 | API just use methods of `client.sync`.
13 |
14 | Example usage:
15 | ```py
16 | from llama_deploy.client import Client
17 |
18 | # Use the same client instance
19 |     client = Client()
20 |
21 | async def an_async_function():
22 | status = await client.apiserver.status()
23 |
24 | def normal_function():
25 | status = client.sync.apiserver.status()
26 | ```
27 | """
28 |
29 | @property
30 | def sync(self) -> "_SyncClient":
31 | """Returns the sync version of the client API."""
32 | try:
33 | asyncio.get_running_loop()
34 | except RuntimeError:
35 | return _SyncClient(**self.model_dump())
36 |
37 | msg = "You cannot use the sync client within an async event loop - just await the async methods directly."
38 | raise RuntimeError(msg)
39 |
40 | @property
41 | def apiserver(self) -> ApiServer:
42 | """Access the API Server functionalities."""
43 | return ApiServer(client=self, id="apiserver")
44 |
45 |
46 | class _SyncClient(_BaseClient):
47 | @property
48 | def apiserver(self) -> Any:
49 | return make_sync(ApiServer)(client=self, id="apiserver")
50 |
--------------------------------------------------------------------------------
/llama_deploy/apiserver/source_managers/base.py:
--------------------------------------------------------------------------------
1 | from abc import ABC, abstractmethod
2 | from pathlib import Path
3 |
4 | from llama_deploy.apiserver.deployment_config_parser import DeploymentConfig, SyncPolicy
5 |
6 |
7 | class SourceManager(ABC):
8 | """Protocol to be implemented by classes responsible for managing Deployment sources."""
9 |
10 | def __init__(self, config: DeploymentConfig, base_path: Path | None = None) -> None:
11 | self._config = config
12 | self._base_path = base_path
13 |
14 | @abstractmethod
15 | def sync(
16 | self,
17 | source: str,
18 | destination: str | None = None,
19 | sync_policy: SyncPolicy = SyncPolicy.REPLACE,
20 | ) -> None: # pragma: no cover
21 | """Fetches resources from `source` so they can be used in a deployment.
22 |
23 | Optionally uses `destination` to store data when this makes sense for the
24 | specific source type.
25 | """
26 |
27 | def relative_path(self, source: str) -> str:
28 | """Unfortunately, there's a difference in behavior of how the source managers sync.
29 |         The local source manager syncs the source into `<destination>/<source>`, whereas
30 |         the git source manager just syncs the source into `<destination>`. This is a temporary shim, since
31 |         changing this behavior is a breaking change to deployment.yaml configurations. The local source manager
32 |         overrides it. In a future major version, this behavior will be made consistent."""
33 | return ""
34 |
--------------------------------------------------------------------------------
/llama_deploy/apiserver/routers/status.py:
--------------------------------------------------------------------------------
1 | import httpx
2 | from fastapi import APIRouter
3 | from fastapi.exceptions import HTTPException
4 | from fastapi.responses import PlainTextResponse
5 |
6 | from llama_deploy.apiserver.server import manager
7 | from llama_deploy.apiserver.settings import settings
8 | from llama_deploy.types.apiserver import Status, StatusEnum
9 |
10 | status_router = APIRouter(
11 | prefix="/status",
12 | )
13 |
14 |
15 | @status_router.get("/")
16 | async def status() -> Status:
17 | return Status(
18 | status=StatusEnum.HEALTHY,
19 | max_deployments=manager._max_deployments,
20 | deployments=list(manager._deployments.keys()),
21 | status_message="",
22 | )
23 |
24 |
25 | @status_router.get("/metrics")
26 | async def metrics() -> PlainTextResponse:
27 | """Proxies the Prometheus metrics endpoint through the API Server.
28 |
29 | This endpoint is mostly used in serverless environments where the LlamaDeploy
30 | container cannot expose more than one port (e.g. Knative, Google Cloud Run).
31 | If Prometheus is not enabled, this endpoint returns an empty HTTP-204 response.
32 | """
33 | if not settings.prometheus_enabled:
34 | return PlainTextResponse(status_code=204)
35 |
36 | try:
37 | async with httpx.AsyncClient() as client:
38 | response = await client.get(f"http://127.0.0.1:{settings.prometheus_port}/")
39 | return PlainTextResponse(content=response.text)
40 | except httpx.RequestError as exc:
41 | raise HTTPException(status_code=500, detail=str(exc))
42 |
--------------------------------------------------------------------------------
/tests/apiserver/conftest.py:
--------------------------------------------------------------------------------
1 | from pathlib import Path
2 | from typing import Any, Iterator
3 | from unittest import mock
4 |
5 | import pytest
6 | from fastapi.testclient import TestClient
7 | from workflows import Workflow, step
8 | from workflows.events import StartEvent, StopEvent
9 |
10 | from llama_deploy.apiserver.app import app
11 | from llama_deploy.apiserver.deployment import Deployment
12 | from llama_deploy.apiserver.deployment_config_parser import DeploymentConfig
13 |
14 |
15 | class SmallWorkflow(Workflow):
16 | @step()
17 | async def run_step(self, ev: StartEvent) -> StopEvent:
18 | return StopEvent(result="Hello, world!")
19 |
20 |
21 | @pytest.fixture
22 | def mock_importlib() -> Iterator[None]:
23 | with mock.patch("llama_deploy.apiserver.deployment.importlib") as importlib:
24 | importlib.import_module.return_value = mock.MagicMock(
25 | my_workflow=SmallWorkflow()
26 | )
27 | yield
28 |
29 |
30 | @pytest.fixture
31 | def data_path() -> Path:
32 | data_p = Path(__file__).parent / "data"
33 | return data_p.resolve()
34 |
35 |
36 | @pytest.fixture
37 | def mocked_deployment(data_path: Path, mock_importlib: Any) -> Iterator[Deployment]:
38 | config = DeploymentConfig.from_yaml(data_path / "git_service.yaml")
39 | with mock.patch("llama_deploy.apiserver.deployment.SOURCE_MANAGERS") as sm_dict:
40 | sm_dict["git"] = mock.MagicMock()
41 | yield Deployment(config=config, base_path=data_path, deployment_path=Path("."))
42 |
43 |
44 | @pytest.fixture
45 | def http_client() -> TestClient:
46 | return TestClient(app)
47 |
--------------------------------------------------------------------------------
/tests/cli/test_sessions.py:
--------------------------------------------------------------------------------
1 | from unittest import mock
2 |
3 | import httpx
4 | from click.testing import CliRunner
5 |
6 | from llama_deploy.cli import llamactl
7 |
8 |
9 | def test_session_create(runner: CliRunner) -> None:
10 | with mock.patch("llama_deploy.cli.sessions.Client") as mocked_client:
11 | mocked_deployment = mock.MagicMock()
12 | mocked_deployment.sessions.create.return_value = mock.MagicMock(
13 | id="test_session"
14 | )
15 | mocked_client.return_value.sync.apiserver.deployments.get.return_value = (
16 | mocked_deployment
17 | )
18 |
19 | result = runner.invoke(
20 | llamactl,
21 | ["sessions", "create", "-d", "deployment_name"],
22 | )
23 |
24 | mocked_client.assert_called_with(
25 | api_server_url="http://localhost:4501", disable_ssl=False, timeout=120.0
26 | )
27 |
28 | mocked_deployment.sessions.create.assert_called_once()
29 | assert result.exit_code == 0
30 |
31 |
32 | def test_sessions_create_error(runner: CliRunner) -> None:
33 | with mock.patch("llama_deploy.cli.sessions.Client") as mocked_client:
34 | mocked_client.return_value.sync.apiserver.deployments.get.side_effect = (
35 | httpx.HTTPStatusError(
36 | "test error", response=mock.MagicMock(), request=mock.MagicMock()
37 | )
38 | )
39 |
40 | result = runner.invoke(
41 | llamactl, ["sessions", "create", "-d", "deployment_name"]
42 | )
43 |
44 | assert result.exit_code == 1
45 | assert result.output == "Error: test error\n"
46 |
--------------------------------------------------------------------------------
/tests/cli/internal/test_config.py:
--------------------------------------------------------------------------------
1 | from pathlib import Path
2 | from unittest import mock
3 |
4 | from llama_deploy.cli.internal.config import (
5 | Config,
6 | ConfigProfile,
7 | _default_config_path,
8 | load_config,
9 | )
10 | from llama_deploy.cli.internal.utils import DEFAULT_CONFIG_FILE_NAME
11 |
12 |
13 | def test_load_config(data_path: Path) -> None:
14 | test_config_file = data_path / DEFAULT_CONFIG_FILE_NAME
15 | config = load_config(path=test_config_file)
16 | assert "test" in config.profiles
17 |
18 |
19 | def test_load_config_no_path(tmp_path: Path) -> None:
20 | with mock.patch("llama_deploy.cli.internal.utils.user_config_dir") as mock_dir:
21 | mock_dir.return_value = tmp_path
22 | config = load_config(path=None)
23 | assert len(config.profiles) == 1
24 | assert "default" in config.profiles
25 |
26 |
27 | def test__default_config_path() -> None:
28 | assert str(_default_config_path()).endswith(DEFAULT_CONFIG_FILE_NAME)
29 |
30 |
31 | def test_config_write(tmp_path: Path) -> None:
32 | config_path = tmp_path / "test.yaml"
33 | assert not config_path.exists()
34 | config = Config(
35 | current_profile="test", profiles={"test": ConfigProfile()}, path=config_path
36 | )
37 | config.write()
38 | assert config_path.exists()
39 |
40 |
41 | def test_config_dir_doesnt_exist(tmp_path: Path) -> None:
42 | with mock.patch("llama_deploy.cli.internal.utils.user_config_dir") as mock_dir:
43 | mock_dir.return_value = tmp_path / "config" / "folder"
44 | config = load_config(path=None)
45 | assert len(config.profiles) == 1
46 | assert "default" in config.profiles
47 |
--------------------------------------------------------------------------------
/examples/python_fullstack/frontend/frontend/frontend.py:
--------------------------------------------------------------------------------
1 | import reflex as rx
2 |
3 | from frontend import style
4 | from frontend.state import State
5 | from frontend.session_list.component import session_list
6 | from frontend.session_list.state import SessionState
7 |
8 |
9 | def qa(content: str, idx: int) -> rx.Component:
10 | return rx.box(
11 | rx.text(content, style=style.answer_style),
12 | text_align=rx.cond(idx % 2 == 0, "right", "left"),
13 | margin_left="1em",
14 | )
15 |
16 |
17 | def chat() -> rx.Component:
18 | return rx.box(
19 | rx.foreach(State.chat_history, lambda messages, idx: qa(messages, idx))
20 | )
21 |
22 |
23 | def action_bar() -> rx.Component:
24 | return rx.hstack(
25 | rx.input(
26 | value=State.question,
27 | placeholder="Ask a question",
28 | on_change=State.set_question,
29 | on_key_down=lambda key: State.handle_key_down(
30 | key, SessionState.selected_session_id
31 | ),
32 | style=style.input_style,
33 | ),
34 | rx.button(
35 | "Ask",
36 | on_click=lambda: State.answer(SessionState.selected_session_id),
37 | style=style.button_style,
38 | ),
39 | )
40 |
41 |
42 | def index() -> rx.Component:
43 | return rx.center(
44 | rx.hstack(
45 | session_list(),
46 | rx.vstack(
47 | chat(),
48 | action_bar(),
49 | align="center",
50 | ),
51 | margin_left="4",
52 | ),
53 | )
54 |
55 |
56 | app = rx.App()
57 | app.add_page(index, on_load=SessionState.create_default_session)
58 |
--------------------------------------------------------------------------------
/docker/README.md:
--------------------------------------------------------------------------------
1 | # Docker build system
2 |
3 | This folder contains the files needed to build the base `llama_deploy` images that
4 | can be used to simplify deployments by reducing boilerplate code.
5 |
6 | ## Image Development
7 |
8 | Images are built with [BuildKit](https://docs.docker.com/build/buildkit/) and we use
9 | `bake` to orchestrate the process. To build all the available images run:
10 |
11 | ```sh
12 | docker buildx bake all
13 | ```
14 |
15 | You can override any `variable` defined in the `docker-bake.hcl` file and build custom
16 | images, for example if you want to use a branch from the llama_deploy repo instead of
17 | an official release, run:
18 |
19 | ```sh
20 | LLAMA_DEPLOY_VERSION=mybranch_or_tag docker buildx bake
21 | ```
22 |
23 | ### Multi-Platform Builds
24 |
25 | `llama_deploy` images support multiple architectures. Depending on your operating
26 | system and Docker environment, you might not be able to build all of them locally.
27 |
28 | This is the error you might encounter:
29 |
30 | ```
31 | multiple platforms feature is currently not supported for docker driver. Please switch to a different driver
32 | (eg. “docker buildx create --use”)
33 | ```
34 |
35 | Make sure `containerd` image store is enabled, following the instruction in the [Docker documentation](https://docs.docker.com/build/building/multi-platform/#enable-the-containerd-image-store).
36 |
37 | If the problem persists, one solution is to override the `platform` option and
38 | limit local builds to the same architecture as your computer's. For example, on an Apple M1 you can limit the builds
39 | to ARM only by invoking `bake` like this:
40 |
41 | ```sh
42 | docker buildx bake control_plane --set "*.platform=linux/arm64"
43 | ```
44 |
--------------------------------------------------------------------------------
/examples/python_fullstack/docker-compose.yml:
--------------------------------------------------------------------------------
1 | services:
2 | qdrant:
3 | # Used by the RAG workflow
4 | image: qdrant/qdrant:latest
5 | ports:
6 | - "6333:6333"
7 | - "6334:6334"
8 | volumes:
9 | - qdrant_data:/qdrant/storage
10 |
11 | apiserver:
12 | # LlamaDeploy API server, will run the workflows
13 | image: llamaindex/llama-deploy:main
14 | environment:
15 | QDRANT_HOST: qdrant
16 | OPENAI_API_KEY: $OPENAI_API_KEY
17 | ports:
18 | - "4501:4501"
19 | depends_on:
20 | redis:
21 | condition: service_healthy
22 | healthcheck:
23 | test: llamactl status
24 | interval: 5s
25 | timeout: 3s
26 | retries: 5
27 | volumes:
28 | - ./:/opt/app
29 | working_dir: /opt/app
30 |
31 | deploy_workflows:
32 | # Init container, it deploys python_fullstack.yaml and exits
33 | image: llamaindex/llama-deploy:main
34 | volumes:
35 | - ./python_fullstack.yaml:/opt/python_fullstack.yaml
36 | working_dir: /opt/
37 | depends_on:
38 | apiserver:
39 | condition: service_healthy
40 | entrypoint: llamactl -s http://apiserver:4501 -t 60 deploy python_fullstack.yaml
41 |
42 | frontend:
43 | # UI for this deployment, running at http://localhost:3000
44 | environment:
45 | APISERVER_URL: http://apiserver:4501
46 | DEPLOYMENT_NAME: MyDeployment
47 | build:
48 | context: ./frontend
49 | dockerfile: dockerfile
50 | ports:
51 | - "3000:3000"
52 | - "9000:9000"
53 | volumes:
54 | - ./frontend:/app
55 | depends_on:
56 | deploy_workflows:
57 | condition: service_completed_successfully
58 |
59 | volumes:
60 | qdrant_data:
61 |
--------------------------------------------------------------------------------
/tests/apiserver/routers/test_status.py:
--------------------------------------------------------------------------------
1 | from typing import Any
2 | from unittest import mock
3 |
4 | import httpx
5 | from fastapi.testclient import TestClient
6 |
7 | from llama_deploy.apiserver.settings import settings
8 |
9 |
10 | def test_read_main(http_client: TestClient) -> None:
11 | response = http_client.get("/status")
12 | assert response.status_code == 200
13 | assert response.json() == {
14 | "max_deployments": 10,
15 | "deployments": [],
16 | "status": "Healthy",
17 | "status_message": "",
18 | }
19 |
20 |
21 | def test_prom_proxy_off(http_client: TestClient, monkeypatch: Any) -> None:
22 | monkeypatch.setattr(settings, "prometheus_enabled", False)
23 | response = http_client.get("/status/metrics/")
24 | assert response.status_code == 204
25 | assert response.text == ""
26 |
27 |
28 | def test_prom_proxy(http_client: TestClient) -> None:
29 | mock_metrics_response = 'metric1{label="value"} 1.0\nmetric2{label="value"} 2.0'
30 | mock_response = httpx.Response(200, text=mock_metrics_response)
31 |
32 | with mock.patch("httpx.AsyncClient.get", return_value=mock_response):
33 | response = http_client.get("/status/metrics")
34 | assert response.status_code == 200
35 | assert response.text == mock_metrics_response
36 |
37 |
38 | def test_prom_proxy_failure(http_client: TestClient) -> None:
39 | # Mock the HTTP client to raise an exception
40 | with mock.patch(
41 | "httpx.AsyncClient.get", side_effect=httpx.RequestError("Connection failed")
42 | ):
43 | response = http_client.get("/status/metrics")
44 | assert response.status_code == 500
45 | assert response.json()["detail"] == "Connection failed"
46 |
--------------------------------------------------------------------------------
/tests/apiserver/test_config_parser.py:
--------------------------------------------------------------------------------
1 | from pathlib import Path
2 |
3 | from llama_deploy.apiserver.deployment_config_parser import DeploymentConfig
4 |
5 |
6 | def do_assert(config: DeploymentConfig) -> None:
7 | assert config.name == "MyDeployment"
8 | assert config.default_service == "myworkflow"
9 |
10 | wf_config = config.services["myworkflow"]
11 | assert wf_config.name == "My Python Workflow"
12 | assert wf_config.source
13 | assert wf_config.source.type == "git"
14 | assert wf_config.source.location == "git@github.com/myorg/myrepo"
15 | assert wf_config.import_path == "src/python/app"
16 | assert wf_config.port == 1313
17 | assert wf_config.python_dependencies
18 | assert len(wf_config.python_dependencies) == 3
19 | assert wf_config.env == {"VAR_1": "x", "VAR_2": "y"}
20 | assert wf_config.env_files == ["./.env"]
21 |
22 | wf_config = config.services["another-workflow"]
23 | assert wf_config.name == "My LITS Workflow"
24 | assert wf_config.source
25 | assert wf_config.source.type == "git"
26 | assert wf_config.source.location == "git@github.com/myorg/myrepo"
27 | assert wf_config.import_path == "src/ts/app"
28 | assert wf_config.port == 1313
29 | assert wf_config.ts_dependencies
30 | assert len(wf_config.ts_dependencies) == 2
31 | assert wf_config.ts_dependencies["@llamaindex/core"] == "^0.2.0"
32 |
33 |
34 | def test_load_config_file(data_path: Path) -> None:
35 | config = DeploymentConfig.from_yaml(data_path / "example.yaml")
36 | do_assert(config)
37 |
38 |
39 | def test_from_yaml_bytes(data_path: Path) -> None:
40 | with open(data_path / "example.yaml", "rb") as config_f:
41 | config = DeploymentConfig.from_yaml_bytes(config_f.read())
42 | do_assert(config)
43 |
--------------------------------------------------------------------------------
/llama_deploy/apiserver/source_managers/git.py:
--------------------------------------------------------------------------------
1 | import shutil
2 | from pathlib import Path
3 | from typing import Any
4 |
5 | from git import Repo
6 |
7 | from .base import SourceManager, SyncPolicy
8 |
9 |
10 | class GitSourceManager(SourceManager):
11 | """A SourceManager specialized for sources of type `git`."""
12 |
13 | def sync(
14 | self,
15 | source: str,
16 | destination: str | None = None,
17 | sync_policy: SyncPolicy = SyncPolicy.REPLACE,
18 | ) -> None:
19 | """Clones the repository at URL `source` into a local path `destination`.
20 |
21 | Args:
22 | source: The URL of the git repository. It can optionally contain a branch target using the name convention
23 | `git_repo_url@branch_name`. For example, "https://example.com/llama_deploy.git@branch_name".
24 |             destination: The local filesystem path where the repository will be cloned.
25 | """
26 | if not destination:
27 | raise ValueError("Destination cannot be empty")
28 |
29 | if Path(destination).exists():
30 | # FIXME: pull when SyncPolicy is MERGE
31 | shutil.rmtree(destination)
32 |
33 | url, branch_name = self._parse_source(source)
34 | kwargs: dict[str, Any] = {"url": url, "to_path": destination}
35 | if branch_name:
36 | kwargs["multi_options"] = [f"-b {branch_name}", "--single-branch"]
37 |
38 | Repo.clone_from(**kwargs)
39 |
40 | @staticmethod
41 | def _parse_source(source: str) -> tuple[str, str | None]:
42 | branch_name = None
43 | toks = source.split("@")
44 | url = toks[0]
45 | if len(toks) > 1:
46 | branch_name = toks[1]
47 |
48 | return url, branch_name
49 |
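A small illustration of the `url@branch` naming convention documented in the `sync` docstring above, using the static `_parse_source` helper (the URL is a placeholder):

```python
from llama_deploy.apiserver.source_managers.git import GitSourceManager

# A trailing `@branch` selects a branch; the part before it is the clone URL
url, branch = GitSourceManager._parse_source("https://example.com/llama_deploy.git@mybranch")
assert url == "https://example.com/llama_deploy.git"
assert branch == "mybranch"

# Without the suffix, the branch component is None and the default branch is cloned
url, branch = GitSourceManager._parse_source("https://example.com/llama_deploy.git")
assert branch is None
```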
--------------------------------------------------------------------------------
/tests/cli/test_deploy.py:
--------------------------------------------------------------------------------
1 | from pathlib import Path
2 | from unittest import mock
3 |
4 | import httpx
5 | from click.testing import CliRunner
6 |
7 | from llama_deploy.cli import llamactl
8 |
9 |
10 | def test_deploy(runner: CliRunner, data_path: Path) -> None:
11 | test_config_file = data_path / "deployment.yaml"
12 | mocked_result = mock.MagicMock(id="test_deployment")
13 | with mock.patch("llama_deploy.cli.deploy.Client") as mocked_client:
14 | mocked_client.return_value.sync.apiserver.deployments.create.return_value = (
15 | mocked_result
16 | )
17 |
18 | result = runner.invoke(llamactl, ["-t", "5.0", "deploy", str(test_config_file)])
19 |
20 | assert result.exit_code == 0
21 | assert result.output == "Deployment successful: test_deployment\n"
22 | mocked_client.assert_called_with(
23 | api_server_url="http://localhost:4501", disable_ssl=False, timeout=5.0
24 | )
25 | file_arg = (
26 | mocked_client.return_value.sync.apiserver.deployments.create.call_args
27 | )
28 | assert str(test_config_file) == file_arg.args[0].name
29 |
30 |
31 | def test_deploy_failed(runner: CliRunner, data_path: Path) -> None:
32 | test_config_file = data_path / "deployment.yaml"
33 | with mock.patch("llama_deploy.cli.deploy.Client") as mocked_client:
34 | mocked_client.return_value.sync.apiserver.deployments.create.side_effect = (
35 | httpx.HTTPStatusError(
36 | "Unauthorized!", response=mock.MagicMock(), request=mock.MagicMock()
37 | )
38 | )
39 |
40 | result = runner.invoke(llamactl, ["deploy", str(test_config_file)])
41 | assert result.exit_code == 1
42 | assert result.output == "Error: Unauthorized!\n"
43 |
--------------------------------------------------------------------------------
/llama_deploy/cli/run.py:
--------------------------------------------------------------------------------
1 | import json
2 |
3 | import click
4 | import httpx
5 |
6 | from llama_deploy.client import Client
7 | from llama_deploy.types import TaskDefinition
8 |
9 | from .internal.config import ConfigProfile
10 |
11 |
12 | @click.command()
13 | @click.pass_obj # config_profile
14 | @click.option(
15 | "-d", "--deployment", required=True, is_flag=False, help="Deployment name"
16 | )
17 | @click.option(
18 | "-a",
19 | "--arg",
20 | multiple=True,
21 | is_flag=False,
22 | type=(str, str),
23 | help="'key value' argument to pass to the task, e.g. '-a age 30'",
24 | )
25 | @click.option("-s", "--service", is_flag=False, help="Service name")
26 | @click.option("-i", "--session-id", is_flag=False, help="Session ID")
27 | @click.pass_context
28 | def run(
29 | ctx: click.Context,
30 | config_profile: ConfigProfile,
31 | deployment: str,
32 |     arg: tuple[tuple[str, str], ...],
33 | service: str,
34 | session_id: str,
35 | ) -> None:
36 | """Run tasks from a given service."""
37 | client = Client(
38 | api_server_url=config_profile.server,
39 | disable_ssl=config_profile.insecure,
40 | timeout=config_profile.timeout,
41 | )
42 |
43 | payload = {"input": json.dumps(dict(arg))}
44 | if service:
45 | payload["service_id"] = service
46 | if session_id:
47 | payload["session_id"] = session_id
48 |
49 | try:
50 | d = client.sync.apiserver.deployments.get(deployment)
51 | result = d.tasks.run(TaskDefinition(**payload))
52 | except Exception as e:
53 | extra_info = ""
54 | if isinstance(e, httpx.HTTPStatusError):
55 | extra_info = f" {e.response.text}"
56 |
57 | raise click.ClickException(f"{str(e)}{extra_info}")
58 |
59 | click.echo(result)
60 |
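To make the argument handling above concrete, here is a quick sketch of how repeated `-a key value` options end up in the task payload (the deployment and argument names are made up):

```python
import json

# `llamactl run -d MyDeployment -a age 30 -a name Alice` reaches the command
# above as a tuple of (key, value) pairs collected by click:
arg = (("age", "30"), ("name", "Alice"))

# The command serializes them into the task input exactly as in the code above
payload = {"input": json.dumps(dict(arg))}
assert payload["input"] == '{"age": "30", "name": "Alice"}'
```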
--------------------------------------------------------------------------------
/docs/docs/javascript/llms_example.js:
--------------------------------------------------------------------------------
1 | var exampleTemplate = `Framework Usage
2 | `;
6 |
7 | var exampleMarkdown = `\`\`\`python
8 | from llama_index.core import Settings
9 |
10 | # global default
11 | Settings.llm = llm
12 |
13 | # per-component
14 | # objects that use an LLM accept it as a kwarg
15 | index.as_query_engine(llm=llm)
16 |
17 | index.as_chat_engine(llm=llm)
18 | \`\`\``;
19 |
20 | function addToggleToExample() {
21 | const toggleExample = document.querySelector(".toggle-example");
22 | const usageExamples = document.querySelector(".usage-examples");
23 |
24 | toggleExample.addEventListener("click", function () {
25 | console.log("clicked!");
26 | console.log(usageExamples);
27 | usageExamples.classList.toggle("hidden");
28 | });
29 | }
30 |
31 | // Add marked package as